diff --git a/providers/chutes/models/MiniMaxAI/MiniMax-M2.1-TEE.toml b/providers/chutes/models/MiniMaxAI/MiniMax-M2.1-TEE.toml index a3bd6934..d8c50be6 100644 --- a/providers/chutes/models/MiniMaxAI/MiniMax-M2.1-TEE.toml +++ b/providers/chutes/models/MiniMaxAI/MiniMax-M2.1-TEE.toml @@ -1,7 +1,7 @@ name = "MiniMax M2.1 TEE" family = "minimaxai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.3 -output = 1.2 -reasoning = 1.8 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.30 +output = 1.20 [limit] -context = 196608 -output = 65536 +context = 196_608 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/NousResearch/DeepHermes-3-Mistral-24B-Preview.toml b/providers/chutes/models/NousResearch/DeepHermes-3-Mistral-24B-Preview.toml index 3e8f9481..1ffec8c2 100644 --- a/providers/chutes/models/NousResearch/DeepHermes-3-Mistral-24B-Preview.toml +++ b/providers/chutes/models/NousResearch/DeepHermes-3-Mistral-24B-Preview.toml @@ -1,7 +1,7 @@ name = "DeepHermes 3 Mistral 24B Preview" family = "nousresearch" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -11,16 +11,12 @@ open_weights = true [cost] input = 0.02 -output = 0.1 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 0.10 [limit] -context = 32768 -output = 32768 +context = 32_768 +output = 32_768 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/NousResearch/Hermes-4-14B.toml b/providers/chutes/models/NousResearch/Hermes-4-14B.toml index 8ef976ab..13280c9a 100644 --- a/providers/chutes/models/NousResearch/Hermes-4-14B.toml +++ b/providers/chutes/models/NousResearch/Hermes-4-14B.toml @@ -1,7 +1,7 @@ name = "Hermes 4 14B" family = "nousresearch" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.01 output = 0.05 -reasoning = 0.075 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 40960 -output = 40960 +context = 40_960 +output = 40_960 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/NousResearch/Hermes-4-405B-FP8-TEE.toml b/providers/chutes/models/NousResearch/Hermes-4-405B-FP8-TEE.toml index b5ac43ba..32935a65 100644 --- a/providers/chutes/models/NousResearch/Hermes-4-405B-FP8-TEE.toml +++ b/providers/chutes/models/NousResearch/Hermes-4-405B-FP8-TEE.toml @@ -1,7 +1,7 @@ name = "Hermes 4 405B FP8 TEE" family = "nousresearch" release_date = "2025-12-29" -last_updated = "2025-01-06" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,17 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.3 -output = 1.2 -reasoning = 1.8 +input = 0.30 +output = 1.20 [limit] -context = 131072 -output = 65536 +context = 131_072 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/NousResearch/Hermes-4-70B.toml b/providers/chutes/models/NousResearch/Hermes-4-70B.toml index 73d66ad1..c855eb60 100644 --- a/providers/chutes/models/NousResearch/Hermes-4-70B.toml +++ b/providers/chutes/models/NousResearch/Hermes-4-70B.toml @@ -1,7 +1,7 @@ name = "Hermes 4 70B" family = "nousresearch" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.11 output = 0.38 -reasoning = 0.57 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/NousResearch/Hermes-4.3-36B.toml b/providers/chutes/models/NousResearch/Hermes-4.3-36B.toml index 580bc714..1855c4d6 100644 --- a/providers/chutes/models/NousResearch/Hermes-4.3-36B.toml +++ b/providers/chutes/models/NousResearch/Hermes-4.3-36B.toml @@ -1,7 +1,7 @@ name = "Hermes 4.3 36B" family = "nousresearch" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -10,17 +10,13 @@ structured_output = false open_weights = true [cost] -input = 0.1 +input = 0.10 output = 0.39 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 524288 -output = 524288 +context = 32_768 +output = 8_192 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/OpenGVLab/InternVL3-78B-TEE.toml b/providers/chutes/models/OpenGVLab/InternVL3-78B-TEE.toml index 78ef0952..75cfe6dd 100644 --- a/providers/chutes/models/OpenGVLab/InternVL3-78B-TEE.toml +++ b/providers/chutes/models/OpenGVLab/InternVL3-78B-TEE.toml @@ -1,7 +1,7 @@ name = "InternVL3 78B TEE" family = "opengvlab" release_date = "2025-01-06" -last_updated = "2025-01-06" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -10,14 +10,13 @@ structured_output = true open_weights = true [cost] -input = 0.1 +input = 0.10 output = 0.39 [limit] -context = 32768 -output = 32768 +context = 32_768 +output = 32_768 [modalities] -input = ['text', 'image'] -output = ['text'] - +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen2.5-72B-Instruct.toml b/providers/chutes/models/Qwen/Qwen2.5-72B-Instruct.toml index 1731aa53..57eebab9 100644 --- a/providers/chutes/models/Qwen/Qwen2.5-72B-Instruct.toml +++ b/providers/chutes/models/Qwen/Qwen2.5-72B-Instruct.toml @@ -1,7 +1,7 @@ name = "Qwen2.5 72B Instruct" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.13 output = 0.52 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 32768 -output = 32768 +context = 32_768 +output = 32_768 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen2.5-Coder-32B-Instruct.toml b/providers/chutes/models/Qwen/Qwen2.5-Coder-32B-Instruct.toml index 01f47210..6770cc04 100644 --- a/providers/chutes/models/Qwen/Qwen2.5-Coder-32B-Instruct.toml +++ b/providers/chutes/models/Qwen/Qwen2.5-Coder-32B-Instruct.toml @@ -1,7 +1,7 @@ name = "Qwen2.5 Coder 32B Instruct" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.03 output = 0.11 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 32768 -output = 32768 +context = 32_768 +output = 32_768 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen2.5-VL-32B-Instruct.toml b/providers/chutes/models/Qwen/Qwen2.5-VL-32B-Instruct.toml index a2a51066..d2cfb35c 100644 --- a/providers/chutes/models/Qwen/Qwen2.5-VL-32B-Instruct.toml +++ b/providers/chutes/models/Qwen/Qwen2.5-VL-32B-Instruct.toml @@ -1,7 +1,7 @@ name = "Qwen2.5 VL 32B Instruct" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.05 output = 0.22 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 16384 -output = 16384 +context = 16_384 +output = 16_384 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen2.5-VL-72B-Instruct-TEE.toml b/providers/chutes/models/Qwen/Qwen2.5-VL-72B-Instruct-TEE.toml index 054321af..5014326c 100644 --- a/providers/chutes/models/Qwen/Qwen2.5-VL-72B-Instruct-TEE.toml +++ b/providers/chutes/models/Qwen/Qwen2.5-VL-72B-Instruct-TEE.toml @@ -1,26 +1,22 @@ name = "Qwen2.5 VL 72B Instruct TEE" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true tool_call = false -structured_output = false +structured_output = true open_weights = true [cost] input = 0.15 -output = 0.6 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 0.60 [limit] -context = 40960 -output = 40960 +context = 32_768 +output = 32_768 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen3-14B.toml b/providers/chutes/models/Qwen/Qwen3-14B.toml index 0943e2e6..e73eb18e 100644 --- a/providers/chutes/models/Qwen/Qwen3-14B.toml +++ b/providers/chutes/models/Qwen/Qwen3-14B.toml @@ -1,7 +1,7 @@ name = "Qwen3 14B" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.05 output = 0.22 -reasoning = 0.33 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 40960 -output = 40960 +context = 40_960 +output = 40_960 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/Qwen/Qwen3-235B-A22B-Instruct-2507-TEE.toml b/providers/chutes/models/Qwen/Qwen3-235B-A22B-Instruct-2507-TEE.toml index bff94731..83db3970 100644 --- a/providers/chutes/models/Qwen/Qwen3-235B-A22B-Instruct-2507-TEE.toml +++ b/providers/chutes/models/Qwen/Qwen3-235B-A22B-Instruct-2507-TEE.toml @@ -1,7 +1,7 @@ name = "Qwen3 235B A22B Instruct 2507 TEE" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.08 output = 0.55 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 262144 -output = 65536 +context = 262_144 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen3-235B-A22B-Thinking-2507.toml b/providers/chutes/models/Qwen/Qwen3-235B-A22B-Thinking-2507.toml index 73b062b7..bdb613f1 100644 --- a/providers/chutes/models/Qwen/Qwen3-235B-A22B-Thinking-2507.toml +++ b/providers/chutes/models/Qwen/Qwen3-235B-A22B-Thinking-2507.toml @@ -1,7 +1,7 @@ name = "Qwen3 235B A22B Thinking 2507" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -11,20 +11,15 @@ open_weights = true [cost] input = 0.11 -output = 0.6 -reasoning = 0.9 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 0.60 [limit] -context = 262144 -output = 262144 +context = 262_144 +output = 262_144 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/Qwen/Qwen3-235B-A22B.toml b/providers/chutes/models/Qwen/Qwen3-235B-A22B.toml index 94e8ce9b..624a91ac 100644 --- a/providers/chutes/models/Qwen/Qwen3-235B-A22B.toml +++ b/providers/chutes/models/Qwen/Qwen3-235B-A22B.toml @@ -1,7 +1,7 @@ name = "Qwen3 235B A22B" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.3 -output = 1.2 -reasoning = 1.8 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.30 +output = 1.20 [limit] -context = 40960 -output = 40960 +context = 40_960 +output = 40_960 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/Qwen/Qwen3-30B-A3B-Instruct-2507.toml b/providers/chutes/models/Qwen/Qwen3-30B-A3B-Instruct-2507.toml index a5fcabf3..52df2568 100644 --- a/providers/chutes/models/Qwen/Qwen3-30B-A3B-Instruct-2507.toml +++ b/providers/chutes/models/Qwen/Qwen3-30B-A3B-Instruct-2507.toml @@ -1,7 +1,7 @@ name = "Qwen3 30B A3B Instruct 2507" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.08 output = 0.33 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 262144 -output = 262144 +context = 262_144 +output = 262_144 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen3-30B-A3B.toml b/providers/chutes/models/Qwen/Qwen3-30B-A3B.toml index c7ebaa99..809fcca2 100644 --- a/providers/chutes/models/Qwen/Qwen3-30B-A3B.toml +++ b/providers/chutes/models/Qwen/Qwen3-30B-A3B.toml @@ -1,7 +1,7 @@ name = "Qwen3 30B A3B" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.06 output = 0.22 -reasoning = 0.33 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 40960 -output = 40960 +context = 40_960 +output = 40_960 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/Qwen/Qwen3-32B.toml b/providers/chutes/models/Qwen/Qwen3-32B.toml index 4e7cd784..00f46f5e 100644 --- a/providers/chutes/models/Qwen/Qwen3-32B.toml +++ b/providers/chutes/models/Qwen/Qwen3-32B.toml @@ -1,7 +1,7 @@ name = "Qwen3 32B" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.08 output = 0.24 -reasoning = 0.36 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 40960 -output = 40960 +context = 40_960 +output = 40_960 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8-TEE.toml b/providers/chutes/models/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8-TEE.toml index e949b859..fa1481fd 100644 --- a/providers/chutes/models/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8-TEE.toml +++ b/providers/chutes/models/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8-TEE.toml @@ -1,7 +1,7 @@ name = "Qwen3 Coder 480B A35B Instruct FP8 TEE" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.22 output = 0.95 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 262144 -output = 262144 +context = 262_144 +output = 262_144 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen3-Next-80B-A3B-Instruct.toml b/providers/chutes/models/Qwen/Qwen3-Next-80B-A3B-Instruct.toml index c6632b17..e38870ca 100644 --- a/providers/chutes/models/Qwen/Qwen3-Next-80B-A3B-Instruct.toml +++ b/providers/chutes/models/Qwen/Qwen3-Next-80B-A3B-Instruct.toml @@ -1,7 +1,7 @@ name = "Qwen3 Next 80B A3B Instruct" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -10,17 +10,13 @@ structured_output = true open_weights = true [cost] -input = 0.1 -output = 0.8 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.10 +output = 0.80 [limit] -context = 262144 -output = 262144 +context = 262_144 +output = 262_144 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen3-VL-235B-A22B-Instruct.toml b/providers/chutes/models/Qwen/Qwen3-VL-235B-A22B-Instruct.toml index b7a589ad..fb89f8d1 100644 --- a/providers/chutes/models/Qwen/Qwen3-VL-235B-A22B-Instruct.toml +++ b/providers/chutes/models/Qwen/Qwen3-VL-235B-A22B-Instruct.toml @@ -1,26 +1,22 @@ name = "Qwen3 VL 235B A22B Instruct" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true tool_call = true -structured_output = false +structured_output = true open_weights = true [cost] -input = 0.3 -output = 1.2 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.30 +output = 1.20 [limit] -context = 262144 -output = 262144 +context = 262_144 +output = 262_144 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/Qwen/Qwen3Guard-Gen-0.6B.toml b/providers/chutes/models/Qwen/Qwen3Guard-Gen-0.6B.toml index dc304893..6e2a0920 100644 --- a/providers/chutes/models/Qwen/Qwen3Guard-Gen-0.6B.toml +++ b/providers/chutes/models/Qwen/Qwen3Guard-Gen-0.6B.toml @@ -1,7 +1,7 @@ name = "Qwen3Guard Gen 0.6B" family = "qwen" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.01 output = 0.01 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 32768 -output = 32768 +context = 32_768 +output = 8_192 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/XiaomiMiMo/MiMo-V2-Flash.toml b/providers/chutes/models/XiaomiMiMo/MiMo-V2-Flash.toml index 00ebb09e..87eaae3d 100644 --- a/providers/chutes/models/XiaomiMiMo/MiMo-V2-Flash.toml +++ b/providers/chutes/models/XiaomiMiMo/MiMo-V2-Flash.toml @@ -1,7 +1,7 @@ name = "MiMo V2 Flash" family = "xiaomimimo" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.17 output = 0.65 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 262144 -output = 262144 +context = 32_768 +output = 8_192 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/chutesai/Mistral-Small-3.1-24B-Instruct-2503.toml b/providers/chutes/models/chutesai/Mistral-Small-3.1-24B-Instruct-2503.toml index 921311bb..3ba90df0 100644 --- a/providers/chutes/models/chutesai/Mistral-Small-3.1-24B-Instruct-2503.toml +++ b/providers/chutes/models/chutesai/Mistral-Small-3.1-24B-Instruct-2503.toml @@ -1,7 +1,7 @@ name = "Mistral Small 3.1 24B Instruct 2503" family = "chutesai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.03 output = 0.11 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/chutesai/Mistral-Small-3.2-24B-Instruct-2506.toml b/providers/chutes/models/chutesai/Mistral-Small-3.2-24B-Instruct-2506.toml index 1b583d91..2d2b6034 100644 --- a/providers/chutes/models/chutesai/Mistral-Small-3.2-24B-Instruct-2506.toml +++ b/providers/chutes/models/chutesai/Mistral-Small-3.2-24B-Instruct-2506.toml @@ -1,7 +1,7 @@ name = "Mistral Small 3.2 24B Instruct 2506" family = "chutesai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.06 output = 0.18 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-R1-0528-TEE.toml b/providers/chutes/models/deepseek-ai/DeepSeek-R1-0528-TEE.toml index 40755b82..cd3e1935 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-R1-0528-TEE.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-R1-0528-TEE.toml @@ -1,7 +1,7 @@ name = "DeepSeek R1 0528 TEE" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.4 +input = 0.40 output = 1.75 -reasoning = 2.625 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 163840 -output = 65536 +context = 163_840 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-R1-Distill-Llama-70B.toml b/providers/chutes/models/deepseek-ai/DeepSeek-R1-Distill-Llama-70B.toml index 70f15d6b..57ef48fd 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-R1-Distill-Llama-70B.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-R1-Distill-Llama-70B.toml @@ -1,7 +1,7 @@ name = "DeepSeek R1 Distill Llama 70B" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.03 output = 0.11 -reasoning = 0.165 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-R1-TEE.toml b/providers/chutes/models/deepseek-ai/DeepSeek-R1-TEE.toml index af3963c2..38e3aa0f 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-R1-TEE.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-R1-TEE.toml @@ -1,7 +1,7 @@ name = "DeepSeek R1 TEE" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.3 -output = 1.2 -reasoning = 1.8 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.30 +output = 1.20 [limit] -context = 163840 -output = 163840 +context = 163_840 +output = 163_840 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-V3-0324-TEE.toml b/providers/chutes/models/deepseek-ai/DeepSeek-V3-0324-TEE.toml index 537c1723..43f3b898 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-V3-0324-TEE.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-V3-0324-TEE.toml @@ -1,7 +1,7 @@ name = "DeepSeek V3 0324 TEE" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.19 output = 0.87 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 163840 -output = 65536 +context = 163_840 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-TEE.toml b/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-TEE.toml index 1b026fe2..b07ed111 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-TEE.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-TEE.toml @@ -1,7 +1,7 @@ name = "DeepSeek V3.1 TEE" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.2 -output = 0.8 -reasoning = 1.2 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.20 +output = 0.80 [limit] -context = 163840 -output = 65536 +context = 163_840 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-Terminus-TEE.toml b/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-Terminus-TEE.toml index c72ffd36..6b8f750b 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-Terminus-TEE.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-V3.1-Terminus-TEE.toml @@ -1,7 +1,7 @@ name = "DeepSeek V3.1 Terminus TEE" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -11,20 +11,15 @@ open_weights = true [cost] input = 0.23 -output = 0.9 -reasoning = 1.35 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 0.90 [limit] -context = 163840 -output = 65536 +context = 163_840 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-Speciale-TEE.toml b/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-Speciale-TEE.toml index ad895cc1..af176265 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-Speciale-TEE.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-Speciale-TEE.toml @@ -1,7 +1,7 @@ name = "DeepSeek V3.2 Speciale TEE" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.27 output = 0.41 -reasoning = 0.615 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 163840 -output = 65536 +context = 163_840 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-TEE.toml b/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-TEE.toml index 159b5d35..d8169876 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-TEE.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-V3.2-TEE.toml @@ -1,7 +1,7 @@ name = "DeepSeek V3.2 TEE" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.25 output = 0.38 -reasoning = 0.57 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 163840 -output = 65536 +context = 163_840 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/deepseek-ai/DeepSeek-V3.toml b/providers/chutes/models/deepseek-ai/DeepSeek-V3.toml index fdc0c5bc..cc8fb5f2 100644 --- a/providers/chutes/models/deepseek-ai/DeepSeek-V3.toml +++ b/providers/chutes/models/deepseek-ai/DeepSeek-V3.toml @@ -1,7 +1,7 @@ name = "DeepSeek V3" family = "deepseek-ai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -10,17 +10,13 @@ structured_output = true open_weights = true [cost] -input = 0.3 -output = 1.2 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.30 +output = 1.20 [limit] -context = 163840 -output = 163840 +context = 163_840 +output = 163_840 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/miromind-ai/MiroThinker-v1.5-235B.toml b/providers/chutes/models/miromind-ai/MiroThinker-v1.5-235B.toml new file mode 100644 index 00000000..f38c1551 --- /dev/null +++ b/providers/chutes/models/miromind-ai/MiroThinker-v1.5-235B.toml @@ -0,0 +1,21 @@ +name = "MiroThinker V1.5 235B" +release_date = "2026-01-10" +last_updated = "2026-01-10" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.30 +output = 1.20 + +[limit] +context = 32_768 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/mistralai/Devstral-2-123B-Instruct-2512-TEE.toml b/providers/chutes/models/mistralai/Devstral-2-123B-Instruct-2512-TEE.toml new file mode 100644 index 00000000..2aeea73f --- /dev/null +++ b/providers/chutes/models/mistralai/Devstral-2-123B-Instruct-2512-TEE.toml @@ -0,0 +1,21 @@ +name = "Devstral 2 123B Instruct 2512 TEE" +release_date = "2026-01-10" +last_updated = "2026-01-10" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.05 +output = 0.22 + +[limit] +context = 262_144 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/mistralai/Devstral-2-123B-Instruct-2512.toml b/providers/chutes/models/mistralai/Devstral-2-123B-Instruct-2512.toml index 666bbae6..b7477e0e 100644 --- a/providers/chutes/models/mistralai/Devstral-2-123B-Instruct-2512.toml +++ b/providers/chutes/models/mistralai/Devstral-2-123B-Instruct-2512.toml @@ -1,7 +1,7 @@ name = "Devstral 2 123B Instruct 2512" family = "mistralai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.05 output = 0.22 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 262144 -output = 65536 +context = 262_144 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/moonshotai/Kimi-K2-Instruct-0905.toml b/providers/chutes/models/moonshotai/Kimi-K2-Instruct-0905.toml index 94d1f64f..da0203e5 100644 --- a/providers/chutes/models/moonshotai/Kimi-K2-Instruct-0905.toml +++ b/providers/chutes/models/moonshotai/Kimi-K2-Instruct-0905.toml @@ -1,7 +1,7 @@ name = "Kimi K2 Instruct 0905" family = "moonshotai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -11,16 +11,12 @@ open_weights = true [cost] input = 0.39 -output = 1.9 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 1.90 [limit] -context = 262144 -output = 262144 +context = 262_144 +output = 262_144 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/moonshotai/Kimi-K2-Thinking-TEE.toml b/providers/chutes/models/moonshotai/Kimi-K2-Thinking-TEE.toml index 8398aa68..8ddfcd8d 100644 --- a/providers/chutes/models/moonshotai/Kimi-K2-Thinking-TEE.toml +++ b/providers/chutes/models/moonshotai/Kimi-K2-Thinking-TEE.toml @@ -1,7 +1,7 @@ name = "Kimi K2 Thinking TEE" family = "moonshotai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.4 +input = 0.40 output = 1.75 -reasoning = 2.625 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 262144 -output = 65535 +context = 262_144 +output = 65_535 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.toml b/providers/chutes/models/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.toml index ecc5479c..84a7e8ed 100644 --- a/providers/chutes/models/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.toml +++ b/providers/chutes/models/nvidia/NVIDIA-Nemotron-3-Nano-30B-A3B-BF16.toml @@ -1,7 +1,7 @@ name = "NVIDIA Nemotron 3 Nano 30B A3B BF16" family = "nvidia" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.06 output = 0.24 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 262144 -output = 262144 +context = 262_144 +output = 262_144 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/openai/gpt-oss-120b-TEE.toml b/providers/chutes/models/openai/gpt-oss-120b-TEE.toml index c3931143..08c044a1 100644 --- a/providers/chutes/models/openai/gpt-oss-120b-TEE.toml +++ b/providers/chutes/models/openai/gpt-oss-120b-TEE.toml @@ -1,7 +1,7 @@ name = "gpt oss 120b TEE" family = "openai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.04 output = 0.18 -reasoning = 0.27 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 65536 +context = 131_072 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/openai/gpt-oss-20b.toml b/providers/chutes/models/openai/gpt-oss-20b.toml index 401649bd..7d382d98 100644 --- a/providers/chutes/models/openai/gpt-oss-20b.toml +++ b/providers/chutes/models/openai/gpt-oss-20b.toml @@ -1,7 +1,7 @@ name = "gpt oss 20b" family = "openai" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -11,20 +11,15 @@ open_weights = true [cost] input = 0.02 -output = 0.1 -reasoning = 0.15 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 0.10 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/rednote-hilab/dots.ocr.toml b/providers/chutes/models/rednote-hilab/dots.ocr.toml index c66408e0..9e2891de 100644 --- a/providers/chutes/models/rednote-hilab/dots.ocr.toml +++ b/providers/chutes/models/rednote-hilab/dots.ocr.toml @@ -1,7 +1,7 @@ name = "dots.ocr" family = "rednote-hilab" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.01 output = 0.01 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/tngtech/DeepSeek-R1T-Chimera.toml b/providers/chutes/models/tngtech/DeepSeek-R1T-Chimera.toml index bf6d0103..5c781447 100644 --- a/providers/chutes/models/tngtech/DeepSeek-R1T-Chimera.toml +++ b/providers/chutes/models/tngtech/DeepSeek-R1T-Chimera.toml @@ -1,7 +1,7 @@ name = "DeepSeek R1T Chimera" family = "tngtech" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.3 -output = 1.2 -reasoning = 1.8 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.30 +output = 1.20 [limit] -context = 163840 -output = 163840 +context = 163_840 +output = 163_840 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/tngtech/DeepSeek-TNG-R1T2-Chimera-TEE.toml b/providers/chutes/models/tngtech/DeepSeek-TNG-R1T2-Chimera-TEE.toml deleted file mode 100644 index 9368d301..00000000 --- a/providers/chutes/models/tngtech/DeepSeek-TNG-R1T2-Chimera-TEE.toml +++ /dev/null @@ -1,27 +0,0 @@ -name = "DeepSeek TNG R1T2 Chimera TEE" -family = "tngtech" -release_date = "2025-01-06" -last_updated = "2025-01-06" -attachment = false -reasoning = true -temperature = true -tool_call = true -structured_output = true -open_weights = true - -[cost] -input = 0.25 -output = 0.85 -reasoning = 1.275 - -[limit] -context = 163840 -output = 65536 - -[modalities] -input = ['text'] -output = ['text'] - -[interleaved] -field = "reasoning_content" - diff --git a/providers/chutes/models/tngtech/DeepSeek-TNG-R1T2-Chimera.toml b/providers/chutes/models/tngtech/DeepSeek-TNG-R1T2-Chimera.toml index bcedee94..81ebd152 100644 --- a/providers/chutes/models/tngtech/DeepSeek-TNG-R1T2-Chimera.toml +++ b/providers/chutes/models/tngtech/DeepSeek-TNG-R1T2-Chimera.toml @@ -1,7 +1,7 @@ name = "DeepSeek TNG R1T2 Chimera" family = "tngtech" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.25 output = 0.85 -reasoning = 1.275 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 163840 -output = 163840 +context = 163_840 +output = 163_840 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/tngtech/TNG-R1T-Chimera-TEE.toml b/providers/chutes/models/tngtech/TNG-R1T-Chimera-TEE.toml index 62d2fbee..d45f9094 100644 --- a/providers/chutes/models/tngtech/TNG-R1T-Chimera-TEE.toml +++ b/providers/chutes/models/tngtech/TNG-R1T-Chimera-TEE.toml @@ -1,7 +1,7 @@ name = "TNG R1T Chimera TEE" family = "tngtech" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.25 output = 0.85 -reasoning = 1.275 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 163840 -output = 65536 +context = 163_840 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/unsloth/Mistral-Nemo-Instruct-2407.toml b/providers/chutes/models/unsloth/Mistral-Nemo-Instruct-2407.toml index 8a8d9a6c..dc28046a 100644 --- a/providers/chutes/models/unsloth/Mistral-Nemo-Instruct-2407.toml +++ b/providers/chutes/models/unsloth/Mistral-Nemo-Instruct-2407.toml @@ -1,7 +1,7 @@ name = "Mistral Nemo Instruct 2407" family = "unsloth" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.02 output = 0.04 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] diff --git a/providers/chutes/models/unsloth/Mistral-Small-24B-Instruct-2501.toml b/providers/chutes/models/unsloth/Mistral-Small-24B-Instruct-2501.toml index 9f842c00..ad834e3d 100644 --- a/providers/chutes/models/unsloth/Mistral-Small-24B-Instruct-2501.toml +++ b/providers/chutes/models/unsloth/Mistral-Small-24B-Instruct-2501.toml @@ -1,7 +1,7 @@ name = "Mistral Small 24B Instruct 2501" family = "unsloth" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.03 output = 0.11 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 32768 -output = 32768 +context = 32_768 +output = 32_768 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/unsloth/gemma-3-12b-it.toml b/providers/chutes/models/unsloth/gemma-3-12b-it.toml index 1d2d0933..09fcbcd4 100644 --- a/providers/chutes/models/unsloth/gemma-3-12b-it.toml +++ b/providers/chutes/models/unsloth/gemma-3-12b-it.toml @@ -1,26 +1,22 @@ name = "gemma 3 12b it" family = "unsloth" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true tool_call = false -structured_output = false +structured_output = true open_weights = true [cost] input = 0.03 -output = 0.1 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 0.10 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/unsloth/gemma-3-27b-it.toml b/providers/chutes/models/unsloth/gemma-3-27b-it.toml index f425e446..aa11eba5 100644 --- a/providers/chutes/models/unsloth/gemma-3-27b-it.toml +++ b/providers/chutes/models/unsloth/gemma-3-27b-it.toml @@ -1,7 +1,7 @@ name = "gemma 3 27b it" family = "unsloth" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.04 output = 0.15 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 96000 -output = 96000 +context = 96_000 +output = 96_000 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/unsloth/gemma-3-4b-it.toml b/providers/chutes/models/unsloth/gemma-3-4b-it.toml index 4a37b5ab..dffddfd5 100644 --- a/providers/chutes/models/unsloth/gemma-3-4b-it.toml +++ b/providers/chutes/models/unsloth/gemma-3-4b-it.toml @@ -1,7 +1,7 @@ name = "gemma 3 4b it" family = "unsloth" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = false temperature = true @@ -12,15 +12,11 @@ open_weights = true [cost] input = 0.01 output = 0.03 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 96000 -output = 96000 +context = 96_000 +output = 96_000 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] diff --git a/providers/chutes/models/zai-org/GLM-4.5-Air.toml b/providers/chutes/models/zai-org/GLM-4.5-Air.toml index 58dc23e8..b27a3951 100644 --- a/providers/chutes/models/zai-org/GLM-4.5-Air.toml +++ b/providers/chutes/models/zai-org/GLM-4.5-Air.toml @@ -1,7 +1,7 @@ name = "GLM 4.5 Air" family = "zai-org" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.05 output = 0.22 -reasoning = 0.33 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 131072 +context = 131_072 +output = 131_072 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/zai-org/GLM-4.5-TEE.toml b/providers/chutes/models/zai-org/GLM-4.5-TEE.toml index c1603596..dcf4e484 100644 --- a/providers/chutes/models/zai-org/GLM-4.5-TEE.toml +++ b/providers/chutes/models/zai-org/GLM-4.5-TEE.toml @@ -1,7 +1,7 @@ name = "GLM 4.5 TEE" family = "zai-org" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -12,19 +12,14 @@ open_weights = true [cost] input = 0.35 output = 1.55 -reasoning = 2.325 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 [limit] -context = 131072 -output = 65536 +context = 131_072 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/zai-org/GLM-4.6-TEE.toml b/providers/chutes/models/zai-org/GLM-4.6-TEE.toml index 73a30219..5a7f6507 100644 --- a/providers/chutes/models/zai-org/GLM-4.6-TEE.toml +++ b/providers/chutes/models/zai-org/GLM-4.6-TEE.toml @@ -1,7 +1,7 @@ name = "GLM 4.6 TEE" family = "zai-org" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -11,20 +11,15 @@ open_weights = true [cost] input = 0.35 -output = 1.5 -reasoning = 2.25 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +output = 1.50 [limit] -context = 202752 -output = 65536 +context = 202_752 +output = 65_536 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/zai-org/GLM-4.6V.toml b/providers/chutes/models/zai-org/GLM-4.6V.toml index 7250ac42..f72cb9f9 100644 --- a/providers/chutes/models/zai-org/GLM-4.6V.toml +++ b/providers/chutes/models/zai-org/GLM-4.6V.toml @@ -1,7 +1,7 @@ name = "GLM 4.6V" family = "zai-org" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.3 -output = 0.9 -reasoning = 1.35 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.30 +output = 0.90 [limit] -context = 131072 -output = 65536 +context = 131_072 +output = 65_536 [modalities] -input = ['text', 'image'] -output = ['text'] +input = ["text", "image"] +output = ["text"] [interleaved] field = "reasoning_content" diff --git a/providers/chutes/models/zai-org/GLM-4.7-TEE.toml b/providers/chutes/models/zai-org/GLM-4.7-TEE.toml index 82a62cab..7776ac80 100644 --- a/providers/chutes/models/zai-org/GLM-4.7-TEE.toml +++ b/providers/chutes/models/zai-org/GLM-4.7-TEE.toml @@ -1,7 +1,7 @@ name = "GLM 4.7 TEE" family = "zai-org" release_date = "2025-12-29" -last_updated = "2025-12-29" +last_updated = "2026-01-10" attachment = false reasoning = true temperature = true @@ -10,21 +10,16 @@ structured_output = true open_weights = true [cost] -input = 0.4 -output = 1.5 -reasoning = 2.25 -cache_read = 0.0 -cache_write = 0.0 -input_audio = 0.0 -output_audio = 0.0 +input = 0.40 +output = 1.50 [limit] -context = 202752 -output = 65535 +context = 202_752 +output = 65_535 [modalities] -input = ['text'] -output = ['text'] +input = ["text"] +output = ["text"] [interleaved] field = "reasoning_content"