Skip to content

Commit 490763b

Browse files
Update model_prices_and_context_window.json to version generated on 2025-02-16 (#1069)
Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
1 parent 83c538b commit 490763b

File tree

1 file changed

+131
-42
lines changed

1 file changed

+131
-42
lines changed

model_cost_data/model_prices_and_context_window.json

+131-42
Original file line numberDiff line numberDiff line change
@@ -1412,6 +1412,19 @@
14121412
"deprecation_date": "2025-03-31",
14131413
"supports_tool_choice": true
14141414
},
1415+
"azure/gpt-3.5-turbo-0125": {
1416+
"max_tokens": 4096,
1417+
"max_input_tokens": 16384,
1418+
"max_output_tokens": 4096,
1419+
"input_cost_per_token": 0.0000005,
1420+
"output_cost_per_token": 0.0000015,
1421+
"litellm_provider": "azure",
1422+
"mode": "chat",
1423+
"supports_function_calling": true,
1424+
"supports_parallel_function_calling": true,
1425+
"deprecation_date": "2025-03-31",
1426+
"supports_tool_choice": true
1427+
},
14151428
"azure/gpt-35-turbo-16k": {
14161429
"max_tokens": 4096,
14171430
"max_input_tokens": 16385,
@@ -1433,6 +1446,17 @@
14331446
"supports_function_calling": true,
14341447
"supports_tool_choice": true
14351448
},
1449+
"azure/gpt-3.5-turbo": {
1450+
"max_tokens": 4096,
1451+
"max_input_tokens": 4097,
1452+
"max_output_tokens": 4096,
1453+
"input_cost_per_token": 0.0000005,
1454+
"output_cost_per_token": 0.0000015,
1455+
"litellm_provider": "azure",
1456+
"mode": "chat",
1457+
"supports_function_calling": true,
1458+
"supports_tool_choice": true
1459+
},
14361460
"azure/gpt-3.5-turbo-instruct-0914": {
14371461
"max_tokens": 4097,
14381462
"max_input_tokens": 4097,
@@ -3634,6 +3658,42 @@
36343658
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models",
36353659
"supports_tool_choice": true
36363660
},
3661+
"gemini-2.0-pro-exp-02-05": {
3662+
"max_tokens": 8192,
3663+
"max_input_tokens": 2097152,
3664+
"max_output_tokens": 8192,
3665+
"max_images_per_prompt": 3000,
3666+
"max_videos_per_prompt": 10,
3667+
"max_video_length": 1,
3668+
"max_audio_length_hours": 8.4,
3669+
"max_audio_per_prompt": 1,
3670+
"max_pdf_size_mb": 30,
3671+
"input_cost_per_image": 0,
3672+
"input_cost_per_video_per_second": 0,
3673+
"input_cost_per_audio_per_second": 0,
3674+
"input_cost_per_token": 0,
3675+
"input_cost_per_character": 0,
3676+
"input_cost_per_token_above_128k_tokens": 0,
3677+
"input_cost_per_character_above_128k_tokens": 0,
3678+
"input_cost_per_image_above_128k_tokens": 0,
3679+
"input_cost_per_video_per_second_above_128k_tokens": 0,
3680+
"input_cost_per_audio_per_second_above_128k_tokens": 0,
3681+
"output_cost_per_token": 0,
3682+
"output_cost_per_character": 0,
3683+
"output_cost_per_token_above_128k_tokens": 0,
3684+
"output_cost_per_character_above_128k_tokens": 0,
3685+
"litellm_provider": "vertex_ai-language-models",
3686+
"mode": "chat",
3687+
"supports_system_messages": true,
3688+
"supports_function_calling": true,
3689+
"supports_vision": true,
3690+
"supports_audio_input": true,
3691+
"supports_video_input": true,
3692+
"supports_pdf_input": true,
3693+
"supports_response_schema": true,
3694+
"supports_tool_choice": true,
3695+
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing"
3696+
},
36373697
"gemini-2.0-flash-exp": {
36383698
"max_tokens": 8192,
36393699
"max_input_tokens": 1048576,
@@ -7035,7 +7095,9 @@
70357095
"input_cost_per_token": 0.00000072,
70367096
"output_cost_per_token": 0.00000072,
70377097
"litellm_provider": "bedrock_converse",
7038-
"mode": "chat"
7098+
"mode": "chat",
7099+
"supports_function_calling": true,
7100+
"supports_tool_choice": false
70397101
},
70407102
"meta.llama2-13b-chat-v1": {
70417103
"max_tokens": 4096,
@@ -7375,6 +7437,17 @@
73757437
"supports_function_calling": true,
73767438
"supports_tool_choice": false
73777439
},
7440+
"us.meta.llama3-3-70b-instruct-v1:0": {
7441+
"max_tokens": 4096,
7442+
"max_input_tokens": 128000,
7443+
"max_output_tokens": 4096,
7444+
"input_cost_per_token": 0.00000072,
7445+
"output_cost_per_token": 0.00000072,
7446+
"litellm_provider": "bedrock_converse",
7447+
"mode": "chat",
7448+
"supports_function_calling": true,
7449+
"supports_tool_choice": false
7450+
},
73787451
"512-x-512/50-steps/stability.stable-diffusion-xl-v0": {
73797452
"max_tokens": 77,
73807453
"max_input_tokens": 77,
@@ -8084,8 +8157,7 @@
80848157
"input_cost_per_token": 0.00000035,
80858158
"output_cost_per_token": 0.00000140,
80868159
"litellm_provider": "perplexity",
8087-
"mode": "chat" ,
8088-
"supports_tool_choice": true
8160+
"mode": "chat"
80898161
},
80908162
"perplexity/codellama-70b-instruct": {
80918163
"max_tokens": 16384,
@@ -8094,8 +8166,7 @@
80948166
"input_cost_per_token": 0.00000070,
80958167
"output_cost_per_token": 0.00000280,
80968168
"litellm_provider": "perplexity",
8097-
"mode": "chat" ,
8098-
"supports_tool_choice": true
8169+
"mode": "chat"
80998170
},
81008171
"perplexity/llama-3.1-70b-instruct": {
81018172
"max_tokens": 131072,
@@ -8104,8 +8175,7 @@
81048175
"input_cost_per_token": 0.000001,
81058176
"output_cost_per_token": 0.000001,
81068177
"litellm_provider": "perplexity",
8107-
"mode": "chat" ,
8108-
"supports_tool_choice": true
8178+
"mode": "chat"
81098179
},
81108180
"perplexity/llama-3.1-8b-instruct": {
81118181
"max_tokens": 131072,
@@ -8114,8 +8184,7 @@
81148184
"input_cost_per_token": 0.0000002,
81158185
"output_cost_per_token": 0.0000002,
81168186
"litellm_provider": "perplexity",
8117-
"mode": "chat" ,
8118-
"supports_tool_choice": true
8187+
"mode": "chat"
81198188
},
81208189
"perplexity/llama-3.1-sonar-huge-128k-online": {
81218190
"max_tokens": 127072,
@@ -8125,8 +8194,7 @@
81258194
"output_cost_per_token": 0.000005,
81268195
"litellm_provider": "perplexity",
81278196
"mode": "chat",
8128-
"deprecation_date": "2025-02-22",
8129-
"supports_tool_choice": true
8197+
"deprecation_date": "2025-02-22"
81308198
},
81318199
"perplexity/llama-3.1-sonar-large-128k-online": {
81328200
"max_tokens": 127072,
@@ -8136,8 +8204,7 @@
81368204
"output_cost_per_token": 0.000001,
81378205
"litellm_provider": "perplexity",
81388206
"mode": "chat",
8139-
"deprecation_date": "2025-02-22",
8140-
"supports_tool_choice": true
8207+
"deprecation_date": "2025-02-22"
81418208
},
81428209
"perplexity/llama-3.1-sonar-large-128k-chat": {
81438210
"max_tokens": 131072,
@@ -8147,8 +8214,7 @@
81478214
"output_cost_per_token": 0.000001,
81488215
"litellm_provider": "perplexity",
81498216
"mode": "chat",
8150-
"deprecation_date": "2025-02-22",
8151-
"supports_tool_choice": true
8217+
"deprecation_date": "2025-02-22"
81528218
},
81538219
"perplexity/llama-3.1-sonar-small-128k-chat": {
81548220
"max_tokens": 131072,
@@ -8158,8 +8224,7 @@
81588224
"output_cost_per_token": 0.0000002,
81598225
"litellm_provider": "perplexity",
81608226
"mode": "chat",
8161-
"deprecation_date": "2025-02-22",
8162-
"supports_tool_choice": true
8227+
"deprecation_date": "2025-02-22"
81638228
},
81648229
"perplexity/llama-3.1-sonar-small-128k-online": {
81658230
"max_tokens": 127072,
@@ -8169,8 +8234,43 @@
81698234
"output_cost_per_token": 0.0000002,
81708235
"litellm_provider": "perplexity",
81718236
"mode": "chat" ,
8172-
"deprecation_date": "2025-02-22",
8173-
"supports_tool_choice": true
8237+
"deprecation_date": "2025-02-22"
8238+
},
8239+
"perplexity/sonar": {
8240+
"max_tokens": 127072,
8241+
"max_input_tokens": 127072,
8242+
"max_output_tokens": 127072,
8243+
"input_cost_per_token": 0.000001,
8244+
"output_cost_per_token": 0.000001,
8245+
"litellm_provider": "perplexity",
8246+
"mode": "chat"
8247+
},
8248+
"perplexity/sonar-pro": {
8249+
"max_tokens": 200000,
8250+
"max_input_tokens": 200000,
8251+
"max_output_tokens": 8096,
8252+
"input_cost_per_token": 0.000003,
8253+
"output_cost_per_token": 0.000015,
8254+
"litellm_provider": "perplexity",
8255+
"mode": "chat"
8256+
},
8257+
"perplexity/sonar": {
8258+
"max_tokens": 127072,
8259+
"max_input_tokens": 127072,
8260+
"max_output_tokens": 127072,
8261+
"input_cost_per_token": 0.000001,
8262+
"output_cost_per_token": 0.000001,
8263+
"litellm_provider": "perplexity",
8264+
"mode": "chat"
8265+
},
8266+
"perplexity/sonar-pro": {
8267+
"max_tokens": 200000,
8268+
"max_input_tokens": 200000,
8269+
"max_output_tokens": 8096,
8270+
"input_cost_per_token": 0.000003,
8271+
"output_cost_per_token": 0.000015,
8272+
"litellm_provider": "perplexity",
8273+
"mode": "chat"
81748274
},
81758275
"perplexity/pplx-7b-chat": {
81768276
"max_tokens": 8192,
@@ -8179,8 +8279,7 @@
81798279
"input_cost_per_token": 0.00000007,
81808280
"output_cost_per_token": 0.00000028,
81818281
"litellm_provider": "perplexity",
8182-
"mode": "chat" ,
8183-
"supports_tool_choice": true
8282+
"mode": "chat"
81848283
},
81858284
"perplexity/pplx-70b-chat": {
81868285
"max_tokens": 4096,
@@ -8189,8 +8288,7 @@
81898288
"input_cost_per_token": 0.00000070,
81908289
"output_cost_per_token": 0.00000280,
81918290
"litellm_provider": "perplexity",
8192-
"mode": "chat" ,
8193-
"supports_tool_choice": true
8291+
"mode": "chat"
81948292
},
81958293
"perplexity/pplx-7b-online": {
81968294
"max_tokens": 4096,
@@ -8200,8 +8298,7 @@
82008298
"output_cost_per_token": 0.00000028,
82018299
"input_cost_per_request": 0.005,
82028300
"litellm_provider": "perplexity",
8203-
"mode": "chat" ,
8204-
"supports_tool_choice": true
8301+
"mode": "chat"
82058302
},
82068303
"perplexity/pplx-70b-online": {
82078304
"max_tokens": 4096,
@@ -8211,8 +8308,7 @@
82118308
"output_cost_per_token": 0.00000280,
82128309
"input_cost_per_request": 0.005,
82138310
"litellm_provider": "perplexity",
8214-
"mode": "chat" ,
8215-
"supports_tool_choice": true
8311+
"mode": "chat"
82168312
},
82178313
"perplexity/llama-2-70b-chat": {
82188314
"max_tokens": 4096,
@@ -8221,8 +8317,7 @@
82218317
"input_cost_per_token": 0.00000070,
82228318
"output_cost_per_token": 0.00000280,
82238319
"litellm_provider": "perplexity",
8224-
"mode": "chat" ,
8225-
"supports_tool_choice": true
8320+
"mode": "chat"
82268321
},
82278322
"perplexity/mistral-7b-instruct": {
82288323
"max_tokens": 4096,
@@ -8231,8 +8326,7 @@
82318326
"input_cost_per_token": 0.00000007,
82328327
"output_cost_per_token": 0.00000028,
82338328
"litellm_provider": "perplexity",
8234-
"mode": "chat" ,
8235-
"supports_tool_choice": true
8329+
"mode": "chat"
82368330
},
82378331
"perplexity/mixtral-8x7b-instruct": {
82388332
"max_tokens": 4096,
@@ -8241,8 +8335,7 @@
82418335
"input_cost_per_token": 0.00000007,
82428336
"output_cost_per_token": 0.00000028,
82438337
"litellm_provider": "perplexity",
8244-
"mode": "chat",
8245-
"supports_tool_choice": true
8338+
"mode": "chat"
82468339
},
82478340
"perplexity/sonar-small-chat": {
82488341
"max_tokens": 16384,
@@ -8251,8 +8344,7 @@
82518344
"input_cost_per_token": 0.00000007,
82528345
"output_cost_per_token": 0.00000028,
82538346
"litellm_provider": "perplexity",
8254-
"mode": "chat",
8255-
"supports_tool_choice": true
8347+
"mode": "chat"
82568348
},
82578349
"perplexity/sonar-small-online": {
82588350
"max_tokens": 12000,
@@ -8262,8 +8354,7 @@
82628354
"output_cost_per_token": 0.00000028,
82638355
"input_cost_per_request": 0.005,
82648356
"litellm_provider": "perplexity",
8265-
"mode": "chat",
8266-
"supports_tool_choice": true
8357+
"mode": "chat"
82678358
},
82688359
"perplexity/sonar-medium-chat": {
82698360
"max_tokens": 16384,
@@ -8272,8 +8363,7 @@
82728363
"input_cost_per_token": 0.0000006,
82738364
"output_cost_per_token": 0.0000018,
82748365
"litellm_provider": "perplexity",
8275-
"mode": "chat",
8276-
"supports_tool_choice": true
8366+
"mode": "chat"
82778367
},
82788368
"perplexity/sonar-medium-online": {
82798369
"max_tokens": 12000,
@@ -8283,8 +8373,7 @@
82838373
"output_cost_per_token": 0.0000018,
82848374
"input_cost_per_request": 0.005,
82858375
"litellm_provider": "perplexity",
8286-
"mode": "chat",
8287-
"supports_tool_choice": true
8376+
"mode": "chat"
82888377
},
82898378
"fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct": {
82908379
"max_tokens": 16384,
@@ -9044,4 +9133,4 @@
90449133
"output_cost_per_second": 0.00,
90459134
"litellm_provider": "assemblyai"
90469135
}
9047-
}
9136+
}

0 commit comments

Comments
 (0)