RouteWorks
diff --git a/model_cost/model_cost.json b/model_cost/model_cost.json
Lines changed: 40 additions & 0 deletions
diff --git a/router_inference/config/weave-router.json b/router_inference/config/weave-router.json
Lines changed: 24 additions & 0 deletions
@@ -183,6 +183,46 @@
     "input_token_price_per_million": 1.00,
     "output_token_price_per_million": 3.20
   },
+  "claude-opus-4-7": {
+    "input_token_price_per_million": 15.00,
+    "output_token_price_per_million": 75.00
+  },
+  "claude-haiku-4-5": {
+    "input_token_price_per_million": 1.00,
+    "output_token_price_per_million": 5.00
+  },
+  "gpt-5.5": {
+    "input_token_price_per_million": 5.00,
+    "output_token_price_per_million": 30.00
+  },
+  "gpt-5.4-mini": {
+    "input_token_price_per_million": 0.40,
+    "output_token_price_per_million": 1.60
+  },
+  "gpt-4.1": {
+    "input_token_price_per_million": 2.00,
+    "output_token_price_per_million": 8.00
+  },
+  "gemini-3.1-pro-preview": {
+    "input_token_price_per_million": 2.00,
+    "output_token_price_per_million": 12.00
+  },
+  "gemini-3.1-flash-lite-preview": {
+    "input_token_price_per_million": 0.10,
+    "output_token_price_per_million": 0.40
+  },
+  "deepseek/deepseek-v4-pro": {
+    "input_token_price_per_million": 0.435,
+    "output_token_price_per_million": 0.870
+  },
+  "qwen/qwen3.5-flash-02-23": {
+    "input_token_price_per_million": 0.065,
+    "output_token_price_per_million": 0.260
+  },
+  "deepseek/deepseek-v4-flash": {
+    "input_token_price_per_million": 0.140,
+    "output_token_price_per_million": 0.280
+  },
   "qwen/qwen3-235b-a22b-2507": {
     "input_token_price_per_million": 0.071,
     "output_token_price_per_million": 0.1
 
@@ -0,0 +1,24 @@
+{
+  "pipeline_params": {
+    "router_name": "weave-router",
+    "router_cls_name": "WeaveRouter",
+    "models": [
+      "claude-opus-4-7",
+      "claude-sonnet-4-5",
+      "claude-haiku-4-5",
+      "gpt-5.5",
+      "gpt-5.4-mini",
+      "gpt-4.1",
+      "gemini-3.1-pro-preview",
+      "gemini-3.1-flash-lite-preview",
+      "deepseek/deepseek-v4-pro",
+      "qwen/qwen3.5-flash-02-23",
+      "deepseek/deepseek-v4-flash",
+      "moonshotai/kimi-k2.5"
+    ],
+    "description": "Weave Router (v0.27): cluster-routing over a 12-model BYOK pool spanning Anthropic, OpenAI, Google, and OpenRouter providers. Embeds each prompt, scores against per-cluster model rankings trained on RouterArena's full split, and selects the cost-quality optimum via an alpha-blended score (alpha=0.40). The pool is intentionally multi-provider so a customer who only brings an OpenAI key still gets a 3-tier choice.",
+    "alpha": 0.40,
+    "router_version": "v0.27",
+    "router_homepage": "https://workweave.ai"
+  }
+}