diff --git a/packages/core/src/family.ts b/packages/core/src/family.ts index aeb6062a..fdf53326 100644 --- a/packages/core/src/family.ts +++ b/packages/core/src/family.ts @@ -218,6 +218,12 @@ export const ModelFamilyValues = [ // Falcon "falcon", + // Baichuan + "baichuan", + + // Skywork + "skywork", + // BART "bart", diff --git a/providers/novita-ai/logo.svg b/providers/novita-ai/logo.svg new file mode 100644 index 00000000..ac537b8d --- /dev/null +++ b/providers/novita-ai/logo.svg @@ -0,0 +1,10 @@ + + + + + + + + + + diff --git a/providers/novita-ai/models/baichuan/baichuan-m2-32b.toml b/providers/novita-ai/models/baichuan/baichuan-m2-32b.toml new file mode 100644 index 00000000..cc3f55f5 --- /dev/null +++ b/providers/novita-ai/models/baichuan/baichuan-m2-32b.toml @@ -0,0 +1,23 @@ +name = "baichuan-m2-32b" +family = "baichuan" +release_date = "2025-08-13" +last_updated = "2025-08-13" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-12" +tool_call = false +structured_output = false +open_weights = true + +[cost] +input = 0.07 +output = 0.07 + +[limit] +context = 131072 +output = 131072 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/baidu/ernie-4.5-21B-a3b-thinking.toml b/providers/novita-ai/models/baidu/ernie-4.5-21B-a3b-thinking.toml new file mode 100644 index 00000000..c757f684 --- /dev/null +++ b/providers/novita-ai/models/baidu/ernie-4.5-21B-a3b-thinking.toml @@ -0,0 +1,22 @@ +name = "ERNIE-4.5-21B-A3B-Thinking" +family = "ernie" +release_date = "2025-09-19" +last_updated = "2025-09-19" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-03" +tool_call = false +open_weights = true + +[cost] +input = 0.07 +output = 0.28 + +[limit] +context = 131_072 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/baidu/ernie-4.5-21B-a3b.toml b/providers/novita-ai/models/baidu/ernie-4.5-21B-a3b.toml new file mode 
100644 index 00000000..80b031e6 --- /dev/null +++ b/providers/novita-ai/models/baidu/ernie-4.5-21B-a3b.toml @@ -0,0 +1,22 @@ +name = "ERNIE 4.5 21B A3B" +family = "ernie" +release_date = "2025-06-30" +last_updated = "2025-06-30" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-03" +tool_call = true +open_weights = true + +[cost] +input = 0.07 +output = 0.28 + +[limit] +context = 120_000 +output = 8_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/baidu/ernie-4.5-300b-a47b-paddle.toml b/providers/novita-ai/models/baidu/ernie-4.5-300b-a47b-paddle.toml new file mode 100644 index 00000000..577b09f5 --- /dev/null +++ b/providers/novita-ai/models/baidu/ernie-4.5-300b-a47b-paddle.toml @@ -0,0 +1,21 @@ +name = "ERNIE 4.5 300B A47B" +release_date = "2025-06-30" +last_updated = "2025-06-30" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.28 +output = 1.1 + +[limit] +context = 123_000 +output = 12_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/baidu/ernie-4.5-vl-28b-a3b-thinking.toml b/providers/novita-ai/models/baidu/ernie-4.5-vl-28b-a3b-thinking.toml new file mode 100644 index 00000000..997f72b4 --- /dev/null +++ b/providers/novita-ai/models/baidu/ernie-4.5-vl-28b-a3b-thinking.toml @@ -0,0 +1,21 @@ +name = "ERNIE-4.5-VL-28B-A3B-Thinking" +release_date = "2025-11-26" +last_updated = "2025-11-26" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.39 +output = 0.39 + +[limit] +context = 131_072 +output = 65_536 + +[modalities] +input = ["text", "image", "video"] +output = ["text"] diff --git a/providers/novita-ai/models/baidu/ernie-4.5-vl-28b-a3b.toml b/providers/novita-ai/models/baidu/ernie-4.5-vl-28b-a3b.toml new file mode 100644 index 00000000..04b5103d --- 
/dev/null +++ b/providers/novita-ai/models/baidu/ernie-4.5-vl-28b-a3b.toml @@ -0,0 +1,20 @@ +name = "ERNIE 4.5 VL 28B A3B" +release_date = "2025-06-30" +last_updated = "2025-06-30" +attachment = true +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 1.4 +output = 5.6 + +[limit] +context = 30_000 +output = 8_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/baidu/ernie-4.5-vl-424b-a47b.toml b/providers/novita-ai/models/baidu/ernie-4.5-vl-424b-a47b.toml new file mode 100644 index 00000000..35c0dbb1 --- /dev/null +++ b/providers/novita-ai/models/baidu/ernie-4.5-vl-424b-a47b.toml @@ -0,0 +1,20 @@ +name = "ERNIE 4.5 VL 424B A47B" +release_date = "2025-06-30" +last_updated = "2025-06-30" +attachment = true +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.42 +output = 1.25 + +[limit] +context = 123_000 +output = 16_000 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-ocr.toml b/providers/novita-ai/models/deepseek/deepseek-ocr.toml new file mode 100644 index 00000000..c7cfea6d --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-ocr.toml @@ -0,0 +1,21 @@ +name = "DeepSeek-OCR" +release_date = "2025-10-24" +last_updated = "2025-10-24" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.03 +output = 0.03 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-prover-v2-671b.toml b/providers/novita-ai/models/deepseek/deepseek-prover-v2-671b.toml new file mode 100644 index 00000000..1ff1850a --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-prover-v2-671b.toml @@ -0,0 +1,20 @@ +name = "Deepseek Prover V2 671B" +release_date = 
"2025-04-30" +last_updated = "2025-04-30" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.7 +output = 2.5 + +[limit] +context = 160_000 +output = 160_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-r1-0528-qwen3-8b.toml b/providers/novita-ai/models/deepseek/deepseek-r1-0528-qwen3-8b.toml new file mode 100644 index 00000000..ffc5f222 --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-r1-0528-qwen3-8b.toml @@ -0,0 +1,20 @@ +name = "DeepSeek R1 0528 Qwen3 8B" +release_date = "2025-05-29" +last_updated = "2025-05-29" +attachment = false +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.06 +output = 0.09 + +[limit] +context = 128_000 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-r1-0528.toml b/providers/novita-ai/models/deepseek/deepseek-r1-0528.toml new file mode 100644 index 00000000..81543d10 --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-r1-0528.toml @@ -0,0 +1,23 @@ +name = "DeepSeek R1 0528" +family = "deepseek-thinking" +release_date = "2025-05-28" +last_updated = "2025-05-28" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-07" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.7 +output = 2.5 +cache_read = 0.35 +[limit] +context = 163_840 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-r1-distill-llama-70b.toml b/providers/novita-ai/models/deepseek/deepseek-r1-distill-llama-70b.toml new file mode 100644 index 00000000..66628e35 --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-r1-distill-llama-70b.toml @@ -0,0 +1,22 @@ +name = "DeepSeek R1 Distill LLama 70B" +family = "deepseek-thinking" +release_date = 
"2025-01-27" +last_updated = "2025-01-27" +attachment = false +reasoning = true +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.8 +output = 0.8 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-r1-turbo.toml b/providers/novita-ai/models/deepseek/deepseek-r1-turbo.toml new file mode 100644 index 00000000..e949947d --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-r1-turbo.toml @@ -0,0 +1,20 @@ +name = "DeepSeek R1 (Turbo) " +release_date = "2025-03-05" +last_updated = "2025-03-05" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.7 +output = 2.5 + +[limit] +context = 64_000 +output = 16_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-v3-0324.toml b/providers/novita-ai/models/deepseek/deepseek-v3-0324.toml new file mode 100644 index 00000000..acf6baf9 --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-v3-0324.toml @@ -0,0 +1,24 @@ +name = "DeepSeek V3 0324" +family = "deepseek" +release_date = "2025-03-25" +last_updated = "2025-03-25" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-07" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.27 +output = 1.12 +cache_read = 0.135 + +[limit] +context = 163_840 +output = 163_840 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-v3-turbo.toml b/providers/novita-ai/models/deepseek/deepseek-v3-turbo.toml new file mode 100644 index 00000000..c0349d39 --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-v3-turbo.toml @@ -0,0 +1,20 @@ +name = "DeepSeek V3 (Turbo) " +release_date = "2025-03-05" +last_updated = "2025-03-05" +attachment = false +reasoning = false +temperature = 
true +tool_call = true +open_weights = true + +[cost] +input = 0.4 +output = 1.3 + +[limit] +context = 64_000 +output = 16_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-v3.1-terminus.toml b/providers/novita-ai/models/deepseek/deepseek-v3.1-terminus.toml new file mode 100644 index 00000000..00fa10ae --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-v3.1-terminus.toml @@ -0,0 +1,23 @@ +name = "Deepseek V3.1 Terminus" +family = "deepseek" +release_date = "2025-09-22" +last_updated = "2025-09-22" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.27 +output = 1.0 +cache_read = 0.135 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-v3.1.toml b/providers/novita-ai/models/deepseek/deepseek-v3.1.toml new file mode 100644 index 00000000..d6d527ee --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-v3.1.toml @@ -0,0 +1,23 @@ +name = "DeepSeek V3.1" +family = "deepseek" +release_date = "2025-08-21" +last_updated = "2025-08-21" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.27 +output = 1.0 +cache_read = 0.135 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-v3.2-exp.toml b/providers/novita-ai/models/deepseek/deepseek-v3.2-exp.toml new file mode 100644 index 00000000..7d2a4fa2 --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-v3.2-exp.toml @@ -0,0 +1,21 @@ +name = "Deepseek V3.2 Exp" +release_date = "2025-09-29" +last_updated = "2025-09-29" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + 
+[cost] +input = 0.27 +output = 0.41 + +[limit] +context = 163_840 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/deepseek/deepseek-v3.2.toml b/providers/novita-ai/models/deepseek/deepseek-v3.2.toml new file mode 100644 index 00000000..08a55422 --- /dev/null +++ b/providers/novita-ai/models/deepseek/deepseek-v3.2.toml @@ -0,0 +1,26 @@ +name = "Deepseek V3.2" +family = "deepseek" +release_date = "2025-12-01" +last_updated = "2025-12-01" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.269 +output = 0.4 +cache_read = 0.1345 + +[limit] +context = 163_840 +output = 65_536 + +[interleaved] +field = "reasoning_content" + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/google/gemma-3-27b-it.toml b/providers/novita-ai/models/google/gemma-3-27b-it.toml new file mode 100644 index 00000000..50dcba72 --- /dev/null +++ b/providers/novita-ai/models/google/gemma-3-27b-it.toml @@ -0,0 +1,21 @@ +name = "Gemma 3 27B" +family = "gemma" +release_date = "2025-03-25" +last_updated = "2025-03-25" +attachment = true +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.119 +output = 0.2 + +[limit] +context = 98_304 +output = 16_384 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/gryphe/mythomax-l2-13b.toml b/providers/novita-ai/models/gryphe/mythomax-l2-13b.toml new file mode 100644 index 00000000..353f50d8 --- /dev/null +++ b/providers/novita-ai/models/gryphe/mythomax-l2-13b.toml @@ -0,0 +1,20 @@ +name = "Mythomax L2 13B" +release_date = "2024-04-25" +last_updated = "2024-04-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.09 +output = 0.09 + +[limit] +context = 4_096 +output = 3_200 + +[modalities] +input = ["text"] 
+output = ["text"] diff --git a/providers/novita-ai/models/kwaipilot/kat-coder-pro.toml b/providers/novita-ai/models/kwaipilot/kat-coder-pro.toml new file mode 100644 index 00000000..3ad30106 --- /dev/null +++ b/providers/novita-ai/models/kwaipilot/kat-coder-pro.toml @@ -0,0 +1,22 @@ +name = "Kat Coder Pro" +release_date = "2026-01-05" +last_updated = "2026-01-05" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.3 +output = 1.2 +cache_read = 0.06 + +[limit] +context = 256_000 +output = 128_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/kwaipilot/kat-coder.toml b/providers/novita-ai/models/kwaipilot/kat-coder.toml new file mode 100644 index 00000000..c46d0632 --- /dev/null +++ b/providers/novita-ai/models/kwaipilot/kat-coder.toml @@ -0,0 +1,21 @@ +name = "KAT-Coder-Pro V1(Free)" +release_date = "2025-09-30" +last_updated = "2025-09-30" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0 +output = 0 + +[limit] +context = 256_000 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/meta-llama/llama-3-70b-instruct.toml b/providers/novita-ai/models/meta-llama/llama-3-70b-instruct.toml new file mode 100644 index 00000000..17e7f7c6 --- /dev/null +++ b/providers/novita-ai/models/meta-llama/llama-3-70b-instruct.toml @@ -0,0 +1,22 @@ +name = "Llama3 70B Instruct" +family = "llama" +release_date = "2024-04-25" +last_updated = "2024-04-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.51 +output = 0.74 + +[limit] +context = 8_192 +output = 8_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/meta-llama/llama-3-8b-instruct.toml 
b/providers/novita-ai/models/meta-llama/llama-3-8b-instruct.toml new file mode 100644 index 00000000..9cac0390 --- /dev/null +++ b/providers/novita-ai/models/meta-llama/llama-3-8b-instruct.toml @@ -0,0 +1,21 @@ +name = "Llama 3 8B Instruct" +family = "llama" +release_date = "2024-04-25" +last_updated = "2024-04-25" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.04 +output = 0.04 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/meta-llama/llama-3.1-8b-instruct.toml b/providers/novita-ai/models/meta-llama/llama-3.1-8b-instruct.toml new file mode 100644 index 00000000..305b8500 --- /dev/null +++ b/providers/novita-ai/models/meta-llama/llama-3.1-8b-instruct.toml @@ -0,0 +1,21 @@ +name = "Llama 3.1 8B Instruct" +family = "llama" +release_date = "2024-07-24" +last_updated = "2024-07-24" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.02 +output = 0.05 + +[limit] +context = 16_384 +output = 16_384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/meta-llama/llama-3.3-70b-instruct.toml b/providers/novita-ai/models/meta-llama/llama-3.3-70b-instruct.toml new file mode 100644 index 00000000..87d6ed94 --- /dev/null +++ b/providers/novita-ai/models/meta-llama/llama-3.3-70b-instruct.toml @@ -0,0 +1,22 @@ +name = "Llama 3.3 70B Instruct" +family = "llama" +release_date = "2024-12-07" +last_updated = "2024-12-07" +attachment = false +reasoning = false +temperature = true +knowledge = "2023-12" +tool_call = true +open_weights = true + +[cost] +input = 0.135 +output = 0.4 + +[limit] +context = 131_072 +output = 120_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/meta-llama/llama-4-maverick-17b-128e-instruct-fp8.toml 
b/providers/novita-ai/models/meta-llama/llama-4-maverick-17b-128e-instruct-fp8.toml new file mode 100644 index 00000000..2a4c2ea9 --- /dev/null +++ b/providers/novita-ai/models/meta-llama/llama-4-maverick-17b-128e-instruct-fp8.toml @@ -0,0 +1,20 @@ +name = "Llama 4 Maverick Instruct" +release_date = "2025-04-06" +last_updated = "2025-04-06" +attachment = true +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.27 +output = 0.85 + +[limit] +context = 1_048_576 +output = 8_192 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/meta-llama/llama-4-scout-17b-16e-instruct.toml b/providers/novita-ai/models/meta-llama/llama-4-scout-17b-16e-instruct.toml new file mode 100644 index 00000000..0c287206 --- /dev/null +++ b/providers/novita-ai/models/meta-llama/llama-4-scout-17b-16e-instruct.toml @@ -0,0 +1,20 @@ +name = "Llama 4 Scout Instruct" +release_date = "2025-04-06" +last_updated = "2025-04-06" +attachment = true +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.18 +output = 0.59 + +[limit] +context = 131_072 +output = 131_072 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/microsoft/wizardlm-2-8x22b.toml b/providers/novita-ai/models/microsoft/wizardlm-2-8x22b.toml new file mode 100644 index 00000000..1be1b783 --- /dev/null +++ b/providers/novita-ai/models/microsoft/wizardlm-2-8x22b.toml @@ -0,0 +1,20 @@ +name = "Wizardlm 2 8x22B" +release_date = "2024-04-24" +last_updated = "2024-04-24" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.62 +output = 0.62 + +[limit] +context = 65_535 +output = 8_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/minimax/minimax-m2.1.toml b/providers/novita-ai/models/minimax/minimax-m2.1.toml new file mode 100644 index 
00000000..2c99708b --- /dev/null +++ b/providers/novita-ai/models/minimax/minimax-m2.1.toml @@ -0,0 +1,26 @@ +name = "Minimax M2.1" +family = "minimax" +release_date = "2025-12-23" +last_updated = "2025-12-23" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.3 +output = 1.2 +cache_read = 0.03 + +[limit] +context = 204_800 +output = 131_072 + +[interleaved] +field = "reasoning_content" + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/minimax/minimax-m2.toml b/providers/novita-ai/models/minimax/minimax-m2.toml new file mode 100644 index 00000000..806f4c39 --- /dev/null +++ b/providers/novita-ai/models/minimax/minimax-m2.toml @@ -0,0 +1,25 @@ +name = "MiniMax-M2" +family = "minimax" +release_date = "2025-10-27" +last_updated = "2025-10-27" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.3 +output = 1.2 +cache_read = 0.03 + +[limit] +context = 204_800 +output = 131_072 + +[interleaved] +field = "reasoning_content" + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/minimaxai/minimax-m1-80k.toml b/providers/novita-ai/models/minimaxai/minimax-m1-80k.toml new file mode 100644 index 00000000..26c25299 --- /dev/null +++ b/providers/novita-ai/models/minimaxai/minimax-m1-80k.toml @@ -0,0 +1,21 @@ +name = "MiniMax M1" +family = "minimax" +release_date = "2025-06-17" +last_updated = "2025-06-17" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.55 +output = 2.2 + +[limit] +context = 1_000_000 +output = 40_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/mistralai/mistral-nemo.toml b/providers/novita-ai/models/mistralai/mistral-nemo.toml new file mode 100644 index 00000000..c181663f --- /dev/null +++ 
b/providers/novita-ai/models/mistralai/mistral-nemo.toml @@ -0,0 +1,22 @@ +name = "Mistral Nemo" +family = "mistral-nemo" +release_date = "2024-07-30" +last_updated = "2024-07-30" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.04 +output = 0.17 + +[limit] +context = 60_288 +output = 16_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/moonshotai/kimi-k2-0905.toml b/providers/novita-ai/models/moonshotai/kimi-k2-0905.toml new file mode 100644 index 00000000..8d4a7876 --- /dev/null +++ b/providers/novita-ai/models/moonshotai/kimi-k2-0905.toml @@ -0,0 +1,23 @@ +name = "Kimi K2 0905" +family = "kimi" +release_date = "2025-09-05" +last_updated = "2025-09-05" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-10" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.6 +output = 2.5 + +[limit] +context = 262_144 +output = 262_144 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/moonshotai/kimi-k2-instruct.toml b/providers/novita-ai/models/moonshotai/kimi-k2-instruct.toml new file mode 100644 index 00000000..20485e1d --- /dev/null +++ b/providers/novita-ai/models/moonshotai/kimi-k2-instruct.toml @@ -0,0 +1,21 @@ +name = "Kimi K2 Instruct" +release_date = "2025-07-11" +last_updated = "2025-07-11" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.57 +output = 2.3 + +[limit] +context = 131_072 +output = 131_072 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/moonshotai/kimi-k2-thinking.toml b/providers/novita-ai/models/moonshotai/kimi-k2-thinking.toml new file mode 100644 index 00000000..e07cece4 --- /dev/null +++ b/providers/novita-ai/models/moonshotai/kimi-k2-thinking.toml @@ -0,0 +1,25 @@ 
+name = "Kimi K2 Thinking" +family = "kimi" +release_date = "2025-11-07" +last_updated = "2025-11-07" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.6 +output = 2.5 + +[limit] +context = 262_144 +output = 262_144 + +[interleaved] +field = "reasoning_content" + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/nousresearch/hermes-2-pro-llama-3-8b.toml b/providers/novita-ai/models/nousresearch/hermes-2-pro-llama-3-8b.toml new file mode 100644 index 00000000..e3eb3ac8 --- /dev/null +++ b/providers/novita-ai/models/nousresearch/hermes-2-pro-llama-3-8b.toml @@ -0,0 +1,21 @@ +name = "Hermes 2 Pro Llama 3 8B" +release_date = "2024-06-27" +last_updated = "2024-06-27" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.14 +output = 0.14 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/openai/gpt-oss-120b.toml b/providers/novita-ai/models/openai/gpt-oss-120b.toml new file mode 100644 index 00000000..ee1b1e5c --- /dev/null +++ b/providers/novita-ai/models/openai/gpt-oss-120b.toml @@ -0,0 +1,21 @@ +name = "OpenAI GPT OSS 120B" +release_date = "2025-08-06" +last_updated = "2025-08-06" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.05 +output = 0.25 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/openai/gpt-oss-20b.toml b/providers/novita-ai/models/openai/gpt-oss-20b.toml new file mode 100644 index 00000000..c6da8050 --- /dev/null +++ b/providers/novita-ai/models/openai/gpt-oss-20b.toml @@ -0,0 +1,21 @@ +name = "OpenAI: GPT OSS 20B" +release_date = "2025-08-06" 
+last_updated = "2025-08-06" +attachment = true +reasoning = true +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.04 +output = 0.15 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/paddlepaddle/paddleocr-vl.toml b/providers/novita-ai/models/paddlepaddle/paddleocr-vl.toml new file mode 100644 index 00000000..7297dd2f --- /dev/null +++ b/providers/novita-ai/models/paddlepaddle/paddleocr-vl.toml @@ -0,0 +1,20 @@ +name = "PaddleOCR-VL" +release_date = "2025-10-22" +last_updated = "2025-10-22" +attachment = true +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.02 +output = 0.02 + +[limit] +context = 16_384 +output = 16_384 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen-2.5-72b-instruct.toml b/providers/novita-ai/models/qwen/qwen-2.5-72b-instruct.toml new file mode 100644 index 00000000..cdc43572 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen-2.5-72b-instruct.toml @@ -0,0 +1,23 @@ +name = "Qwen 2.5 72B Instruct" +family = "qwen" +release_date = "2024-10-15" +last_updated = "2024-10-15" +attachment = false +reasoning = false +temperature = true +knowledge = "2024-04" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.38 +output = 0.4 + +[limit] +context = 32_000 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen-mt-plus.toml b/providers/novita-ai/models/qwen/qwen-mt-plus.toml new file mode 100644 index 00000000..fd3d1c7e --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen-mt-plus.toml @@ -0,0 +1,20 @@ +name = "Qwen MT Plus" +release_date = "2025-09-03" +last_updated = "2025-09-03" +attachment = false +reasoning = false +temperature = true +tool_call = false +open_weights = true + 
+[cost] +input = 0.25 +output = 0.75 + +[limit] +context = 16_384 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen2.5-7b-instruct.toml b/providers/novita-ai/models/qwen/qwen2.5-7b-instruct.toml new file mode 100644 index 00000000..ee536988 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen2.5-7b-instruct.toml @@ -0,0 +1,21 @@ +name = "Qwen2.5 7B Instruct" +release_date = "2025-04-16" +last_updated = "2025-04-16" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.07 +output = 0.07 + +[limit] +context = 32_000 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen2.5-vl-72b-instruct.toml b/providers/novita-ai/models/qwen/qwen2.5-vl-72b-instruct.toml new file mode 100644 index 00000000..9fb43a69 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen2.5-vl-72b-instruct.toml @@ -0,0 +1,21 @@ +name = "Qwen2.5 VL 72B Instruct" +family = "qwen" +release_date = "2025-03-25" +last_updated = "2025-03-25" +attachment = true +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.8 +output = 0.8 + +[limit] +context = 32_768 +output = 32_768 + +[modalities] +input = ["text", "image", "video"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-235b-a22b-fp8.toml b/providers/novita-ai/models/qwen/qwen3-235b-a22b-fp8.toml new file mode 100644 index 00000000..df3731e6 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-235b-a22b-fp8.toml @@ -0,0 +1,20 @@ +name = "Qwen3 235B A22B" +release_date = "2025-04-29" +last_updated = "2025-04-29" +attachment = false +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.2 +output = 0.8 + +[limit] +context = 40_960 +output = 20_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git 
a/providers/novita-ai/models/qwen/qwen3-235b-a22b-instruct-2507.toml b/providers/novita-ai/models/qwen/qwen3-235b-a22b-instruct-2507.toml new file mode 100644 index 00000000..b7840541 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-235b-a22b-instruct-2507.toml @@ -0,0 +1,23 @@ +name = "Qwen3 235B A22B Instruct 2507" +family = "qwen" +release_date = "2025-07-22" +last_updated = "2025-07-22" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-04" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.09 +output = 0.58 + +[limit] +context = 131_072 +output = 16_384 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-235b-a22b-thinking-2507.toml b/providers/novita-ai/models/qwen/qwen3-235b-a22b-thinking-2507.toml new file mode 100644 index 00000000..48bcca79 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-235b-a22b-thinking-2507.toml @@ -0,0 +1,22 @@ +name = "Qwen3 235B A22b Thinking 2507" +family = "qwen" +release_date = "2025-07-25" +last_updated = "2025-07-25" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-04" +tool_call = true +open_weights = true + +[cost] +input = 0.3 +output = 3.0 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-30b-a3b-fp8.toml b/providers/novita-ai/models/qwen/qwen3-30b-a3b-fp8.toml new file mode 100644 index 00000000..72442a08 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-30b-a3b-fp8.toml @@ -0,0 +1,20 @@ +name = "Qwen3 30B A3B" +release_date = "2025-04-29" +last_updated = "2025-04-29" +attachment = false +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.09 +output = 0.45 + +[limit] +context = 40_960 +output = 20_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git 
a/providers/novita-ai/models/qwen/qwen3-32b-fp8.toml b/providers/novita-ai/models/qwen/qwen3-32b-fp8.toml new file mode 100644 index 00000000..7d02d2a5 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-32b-fp8.toml @@ -0,0 +1,20 @@ +name = "Qwen3 32B" +release_date = "2025-04-29" +last_updated = "2025-04-29" +attachment = false +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.1 +output = 0.45 + +[limit] +context = 40_960 +output = 20_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-4b-fp8.toml b/providers/novita-ai/models/qwen/qwen3-4b-fp8.toml new file mode 100644 index 00000000..37daea56 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-4b-fp8.toml @@ -0,0 +1,20 @@ +name = "Qwen3 4B" +release_date = "2025-04-29" +last_updated = "2025-04-29" +attachment = false +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.03 +output = 0.03 + +[limit] +context = 128_000 +output = 20_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-8b-fp8.toml b/providers/novita-ai/models/qwen/qwen3-8b-fp8.toml new file mode 100644 index 00000000..3b083473 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-8b-fp8.toml @@ -0,0 +1,20 @@ +name = "Qwen3 8B" +release_date = "2025-04-29" +last_updated = "2025-04-29" +attachment = false +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.035 +output = 0.138 + +[limit] +context = 128_000 +output = 20_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-coder-30b-a3b-instruct.toml b/providers/novita-ai/models/qwen/qwen3-coder-30b-a3b-instruct.toml new file mode 100644 index 00000000..335f6aec --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-coder-30b-a3b-instruct.toml @@ -0,0 +1,21 @@ +name = "Qwen3 Coder 30b 
A3B Instruct" +release_date = "2025-10-09" +last_updated = "2025-10-09" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.07 +output = 0.27 + +[limit] +context = 160_000 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-coder-480b-a35b-instruct.toml b/providers/novita-ai/models/qwen/qwen3-coder-480b-a35b-instruct.toml new file mode 100644 index 00000000..3d6678ba --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-coder-480b-a35b-instruct.toml @@ -0,0 +1,23 @@ +name = "Qwen3 Coder 480B A35B Instruct" +family = "qwen" +release_date = "2025-07-23" +last_updated = "2025-07-23" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-04" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.3 +output = 1.3 + +[limit] +context = 262_144 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-max.toml b/providers/novita-ai/models/qwen/qwen3-max.toml new file mode 100644 index 00000000..89324d45 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-max.toml @@ -0,0 +1,23 @@ +name = "Qwen3 Max" +family = "qwen" +release_date = "2025-09-24" +last_updated = "2025-09-24" +attachment = false +reasoning = false +temperature = true +knowledge = "2025-04" +tool_call = true +structured_output = true +open_weights = false + +[cost] +input = 2.11 +output = 8.45 + +[limit] +context = 262_144 +output = 65_536 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-next-80b-a3b-instruct.toml b/providers/novita-ai/models/qwen/qwen3-next-80b-a3b-instruct.toml new file mode 100644 index 00000000..32486927 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-next-80b-a3b-instruct.toml @@ -0,0 +1,21 @@ +name = "Qwen3 Next 80B A3B Instruct" 
+release_date = "2025-09-10" +last_updated = "2025-09-10" +attachment = false +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.15 +output = 1.5 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-next-80b-a3b-thinking.toml b/providers/novita-ai/models/qwen/qwen3-next-80b-a3b-thinking.toml new file mode 100644 index 00000000..d1d3ce92 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-next-80b-a3b-thinking.toml @@ -0,0 +1,21 @@ +name = "Qwen3 Next 80B A3B Thinking" +release_date = "2025-09-10" +last_updated = "2025-09-10" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.15 +output = 1.5 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-omni-30b-a3b-instruct.toml b/providers/novita-ai/models/qwen/qwen3-omni-30b-a3b-instruct.toml new file mode 100644 index 00000000..aa98b3ac --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-omni-30b-a3b-instruct.toml @@ -0,0 +1,24 @@ +name = "Qwen3 Omni 30B A3B Instruct" +family = "qwen" +release_date = "2025-09-24" +last_updated = "2025-09-24" +attachment = true +reasoning = false +temperature = true +knowledge = "2024-04" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.25 +output = 0.97 +input_audio = 2.2 # Cost per million audio input tokens (USD) +output_audio = 1.788 +[limit] +context = 65_536 +output = 16_384 + +[modalities] +input = ["text", "video", "audio", "image"] +output = ["text", "audio"] diff --git a/providers/novita-ai/models/qwen/qwen3-omni-30b-a3b-thinking.toml b/providers/novita-ai/models/qwen/qwen3-omni-30b-a3b-thinking.toml new file mode 100644 index 00000000..ffdaa1b4 --- /dev/null +++ 
b/providers/novita-ai/models/qwen/qwen3-omni-30b-a3b-thinking.toml @@ -0,0 +1,23 @@ +name = "Qwen3 Omni 30B A3B Thinking" +release_date = "2025-09-24" +last_updated = "2025-09-24" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.25 +output = 0.97 +input_audio = 2.2 # Cost per million audio input tokens (USD) +output_audio = 1.788 + +[limit] +context = 65_536 +output = 16_384 + +[modalities] +input = ["text", "audio", "video", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-vl-235b-a22b-instruct.toml b/providers/novita-ai/models/qwen/qwen3-vl-235b-a22b-instruct.toml new file mode 100644 index 00000000..7aa9b6ff --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-vl-235b-a22b-instruct.toml @@ -0,0 +1,21 @@ +name = "Qwen3 VL 235B A22B Instruct" +release_date = "2025-09-24" +last_updated = "2025-09-24" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.3 +output = 1.5 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "image", "video"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-vl-235b-a22b-thinking.toml b/providers/novita-ai/models/qwen/qwen3-vl-235b-a22b-thinking.toml new file mode 100644 index 00000000..b6a625c7 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-vl-235b-a22b-thinking.toml @@ -0,0 +1,20 @@ +name = "Qwen3 VL 235B A22B Thinking" +release_date = "2025-09-24" +last_updated = "2025-09-24" +attachment = true +reasoning = true +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.98 +output = 3.95 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "image", "video"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-vl-30b-a3b-instruct.toml 
b/providers/novita-ai/models/qwen/qwen3-vl-30b-a3b-instruct.toml new file mode 100644 index 00000000..e8bb6855 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-vl-30b-a3b-instruct.toml @@ -0,0 +1,21 @@ +name = "qwen/qwen3-vl-30b-a3b-instruct" +release_date = "2025-10-11" +last_updated = "2025-10-11" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.2 +output = 0.7 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "video", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-vl-30b-a3b-thinking.toml b/providers/novita-ai/models/qwen/qwen3-vl-30b-a3b-thinking.toml new file mode 100644 index 00000000..e45423c5 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-vl-30b-a3b-thinking.toml @@ -0,0 +1,21 @@ +name = "qwen/qwen3-vl-30b-a3b-thinking" +release_date = "2025-10-11" +last_updated = "2025-10-11" +attachment = true +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.2 +output = 1.0 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "image", "video"] +output = ["text"] diff --git a/providers/novita-ai/models/qwen/qwen3-vl-8b-instruct.toml b/providers/novita-ai/models/qwen/qwen3-vl-8b-instruct.toml new file mode 100644 index 00000000..f9a51092 --- /dev/null +++ b/providers/novita-ai/models/qwen/qwen3-vl-8b-instruct.toml @@ -0,0 +1,21 @@ +name = "qwen/qwen3-vl-8b-instruct" +release_date = "2025-10-17" +last_updated = "2025-10-17" +attachment = true +reasoning = false +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.08 +output = 0.5 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "image", "video"] +output = ["text"] diff --git a/providers/novita-ai/models/sao10k/L3-8B-Stheno-v3.2.toml
b/providers/novita-ai/models/sao10k/L3-8B-Stheno-v3.2.toml new file mode 100644 index 00000000..dc17bf62 --- /dev/null +++ b/providers/novita-ai/models/sao10k/L3-8B-Stheno-v3.2.toml @@ -0,0 +1,20 @@ +name = "L3 8B Stheno V3.2" +release_date = "2024-11-29" +last_updated = "2024-11-29" +attachment = false +reasoning = false +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.05 +output = 0.05 + +[limit] +context = 8_192 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/sao10k/l3-70b-euryale-v2.1.toml b/providers/novita-ai/models/sao10k/l3-70b-euryale-v2.1.toml new file mode 100644 index 00000000..d6a7a78f --- /dev/null +++ b/providers/novita-ai/models/sao10k/l3-70b-euryale-v2.1.toml @@ -0,0 +1,20 @@ +name = "L3 70B Euryale V2.1" +release_date = "2024-06-18" +last_updated = "2024-06-18" +attachment = false +reasoning = false +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 1.48 +output = 1.48 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/sao10k/l3-8b-lunaris.toml b/providers/novita-ai/models/sao10k/l3-8b-lunaris.toml new file mode 100644 index 00000000..e2bc4a9d --- /dev/null +++ b/providers/novita-ai/models/sao10k/l3-8b-lunaris.toml @@ -0,0 +1,21 @@ +name = "Sao10k L3 8B Lunaris" +release_date = "2024-11-28" +last_updated = "2024-11-28" +attachment = false +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.05 +output = 0.05 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/sao10k/l31-70b-euryale-v2.2.toml b/providers/novita-ai/models/sao10k/l31-70b-euryale-v2.2.toml new file mode 100644 index 00000000..926e20a1 --- /dev/null +++ b/providers/novita-ai/models/sao10k/l31-70b-euryale-v2.2.toml @@ -0,0
+1,20 @@ +name = "L31 70B Euryale V2.2" +release_date = "2024-09-19" +last_updated = "2024-09-19" +attachment = false +reasoning = false +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 1.48 +output = 1.48 + +[limit] +context = 8_192 +output = 8_192 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/skywork/r1v4-lite.toml b/providers/novita-ai/models/skywork/r1v4-lite.toml new file mode 100644 index 00000000..b4bd3f45 --- /dev/null +++ b/providers/novita-ai/models/skywork/r1v4-lite.toml @@ -0,0 +1,22 @@ +name = "Skywork R1V4-Lite" +family = "skywork" +release_date = "2025-11-18" +last_updated = "2025-11-18" +attachment = true +reasoning = false +temperature = true +tool_call = false +structured_output = true +open_weights = true + +[cost] +input = 0.2 +output = 0.6 + +[limit] +context = 262_144 +output = 65_536 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/xiaomimimo/mimo-v2-flash.toml b/providers/novita-ai/models/xiaomimimo/mimo-v2-flash.toml new file mode 100644 index 00000000..94bbda8e --- /dev/null +++ b/providers/novita-ai/models/xiaomimimo/mimo-v2-flash.toml @@ -0,0 +1,24 @@ +name = "XiaomiMiMo/MiMo-V2-Flash" +family = "mimo" +release_date = "2025-12-19" +last_updated = "2025-12-19" +attachment = false +reasoning = true +temperature = true +knowledge = "2024-12" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.1 +output = 0.3 +cache_read = 0.30 + +[limit] +context = 262_144 +output = 32_000 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/zai-org/autoglm-phone-9b-multilingual.toml b/providers/novita-ai/models/zai-org/autoglm-phone-9b-multilingual.toml new file mode 100644 index 00000000..2b38dd27 --- /dev/null +++ b/providers/novita-ai/models/zai-org/autoglm-phone-9b-multilingual.toml @@ -0,0 +1,20 @@ +name = "AutoGLM-Phone-9B-Multilingual" +release_date 
= "2025-12-10" +last_updated = "2025-12-10" +attachment = true +reasoning = false +temperature = true +tool_call = false +open_weights = true + +[cost] +input = 0.035 +output = 0.138 + +[limit] +context = 65_536 +output = 65_536 + +[modalities] +input = ["text", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/zai-org/glm-4.5-air.toml b/providers/novita-ai/models/zai-org/glm-4.5-air.toml new file mode 100644 index 00000000..498308c6 --- /dev/null +++ b/providers/novita-ai/models/zai-org/glm-4.5-air.toml @@ -0,0 +1,22 @@ +name = "GLM 4.5 Air" +family = "glm-air" +release_date = "2025-10-13" +last_updated = "2025-10-13" +attachment = false +reasoning = true +temperature = true +knowledge = "2025-04" +tool_call = true +open_weights = true + +[cost] +input = 0.13 +output = 0.85 + +[limit] +context = 131_072 +output = 98_304 + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/zai-org/glm-4.5.toml b/providers/novita-ai/models/zai-org/glm-4.5.toml new file mode 100644 index 00000000..687f722b --- /dev/null +++ b/providers/novita-ai/models/zai-org/glm-4.5.toml @@ -0,0 +1,25 @@ +name = "GLM-4.5" +family = "glm" +release_date = "2025-07-28" +last_updated = "2025-07-28" +attachment = false +reasoning = true +temperature = true +tool_call = true +open_weights = true + +[cost] +input = 0.6 +output = 2.2 +cache_read = 0.11 + +[limit] +context = 131_072 +output = 98_304 + +[interleaved] +field = "reasoning_content" + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/zai-org/glm-4.5v.toml b/providers/novita-ai/models/zai-org/glm-4.5v.toml new file mode 100644 index 00000000..e5d7e4fb --- /dev/null +++ b/providers/novita-ai/models/zai-org/glm-4.5v.toml @@ -0,0 +1,23 @@ +name = "GLM 4.5V" +family = "glmv" +release_date = "2025-08-11" +last_updated = "2025-08-11" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-04" +tool_call = true +structured_output = true 
+open_weights = true + +[cost] +input = 0.6 +output = 1.8 +cache_read = 0.11 +[limit] +context = 65_536 +output = 16_384 + +[modalities] +input = ["text", "video", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/zai-org/glm-4.6.toml b/providers/novita-ai/models/zai-org/glm-4.6.toml new file mode 100644 index 00000000..d5d6b952 --- /dev/null +++ b/providers/novita-ai/models/zai-org/glm-4.6.toml @@ -0,0 +1,26 @@ +name = "GLM 4.6" +family = "glm" +release_date = "2025-09-30" +last_updated = "2025-09-30" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.55 +output = 2.2 +cache_read = 0.11 + +[limit] +context = 204_800 +output = 131_072 + +[interleaved] +field = "reasoning_content" + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/models/zai-org/glm-4.6v.toml b/providers/novita-ai/models/zai-org/glm-4.6v.toml new file mode 100644 index 00000000..a07c1998 --- /dev/null +++ b/providers/novita-ai/models/zai-org/glm-4.6v.toml @@ -0,0 +1,24 @@ +name = "GLM 4.6V" +family = "glmv" +release_date = "2025-12-08" +last_updated = "2025-12-08" +attachment = true +reasoning = true +temperature = true +knowledge = "2025-04" +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.3 +output = 0.9 +cache_read = 0.055 + +[limit] +context = 131_072 +output = 32_768 + +[modalities] +input = ["text", "video", "image"] +output = ["text"] diff --git a/providers/novita-ai/models/zai-org/glm-4.7.toml b/providers/novita-ai/models/zai-org/glm-4.7.toml new file mode 100644 index 00000000..4a0743c0 --- /dev/null +++ b/providers/novita-ai/models/zai-org/glm-4.7.toml @@ -0,0 +1,26 @@ +name = "GLM-4.7" +family = "glm" +release_date = "2025-12-22" +last_updated = "2025-12-22" +attachment = false +reasoning = true +temperature = true +tool_call = true +structured_output = true +open_weights = true + +[cost] +input = 0.6 +output 
= 2.2 +cache_read = 0.11 + +[limit] +context = 204_800 +output = 131_072 + +[interleaved] +field = "reasoning_content" + +[modalities] +input = ["text"] +output = ["text"] diff --git a/providers/novita-ai/provider.toml b/providers/novita-ai/provider.toml new file mode 100644 index 00000000..05acfd40 --- /dev/null +++ b/providers/novita-ai/provider.toml @@ -0,0 +1,5 @@ +name = "NovitaAI" +env = ["NOVITA_API_KEY"] +npm = "@ai-sdk/openai-compatible" +doc = "https://novita.ai/docs/guides/introduction" +api = "https://api.novita.ai/openai"