Skip to content

Commit b7bd454

Browse files
authored
Update vLLM-SR RouterArena submission (#131)
Signed-off-by: xunzhuo <xunzhuo@vllm-semantic-router.ai>
1 parent e82e74b commit b7bd454

3 files changed

Lines changed: 129954 additions & 64263 deletions

File tree

Lines changed: 15 additions & 27 deletions
Original file line numberDiff line numberDiff line change
@@ -1,30 +1,18 @@
1 1
{
2 2
"pipeline_params": {
3-
"router_name": "vllm-sr",
4-
"router_cls_name": "VLLMSR",
5-
"models": [
6-
"gpt-4o-mini",
7-
"claude-3-haiku-20240307",
8-
"gemini-2.0-flash-001"
9-
],
10-
"router_endpoint": "http://localhost:8080",
11-
"base_url": "http://localhost:8080",
12-
"default_model": "gpt-4o-mini",
13-
"category_model_mapping": {
14-
"biology_decision": "claude-3-haiku-20240307",
15-
"business_decision": "gemini-2.0-flash-001",
16-
"chemistry_decision": "gemini-2.0-flash-001",
17-
"economics_decision": "gpt-4o-mini",
18-
"engineering_decision": "gemini-2.0-flash-001",
19-
"general_decision": "claude-3-haiku-20240307",
20-
"health_decision": "claude-3-haiku-20240307",
21-
"history_decision": "gpt-4o-mini",
22-
"law_decision": "gemini-2.0-flash-001",
23-
"math_decision": "gemini-2.0-flash-001",
24-
"other": "gemini-2.0-flash-001",
25-
"philosophy_decision": "gpt-4o-mini",
26-
"physics_decision": "gemini-2.0-flash-001",
27-
"psychology_decision": "gemini-2.0-flash-001"
28-
}
3+
"router_name": "vllm-sr",
4+
"router_cls_name": "VLLMSR",
5+
"models": [
6+
"google/gemini-3.1-flash-lite",
7+
"gemini-2.5-flash",
8+
"deepseek/deepseek-v4-flash",
9+
"grok-4-1-fast-reasoning",
10+
"qwen/qwen3-235b-a22b-2507",
11+
"qwen/qwen3-next-80b-a3b-instruct",
12+
"Qwen/Qwen3-Coder-Next",
13+
"deepseek-reasoner"
14+
],
15+
"default_model": "google/gemini-3.1-flash-lite",
16+
"description": "vLLM Semantic Router submission using deterministic semantic, structural, domain-aware, and cost-aware routing over a compact model pool."
29 17
}
30-
}
18+
}

0 commit comments

Comments
 (0)