Skip to content

Commit 84a675c

Browse files
Update model_prices_and_context_window.json to version generated on 2025-03-30 (#1325)
Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com>
Co-authored-by: Luke Hinds <[email protected]>
1 parent 6aefe0b commit 84a675c

File tree

1 file changed

+138
-3
lines changed

1 file changed

+138
-3
lines changed

Diff for: model_cost_data/model_prices_and_context_window.json

+138 -3
Original file line number | Diff line number | Diff line change
@@ -1176,21 +1176,40 @@
11761176
"output_cost_per_pixel": 0.0,
11771177
"litellm_provider": "openai"
11781178
},
1179+
"gpt-4o-transcribe": {
1180+
"mode": "audio_transcription",
1181+
"input_cost_per_token": 0.0000025,
1182+
"input_cost_per_audio_token": 0.000006,
1183+
"output_cost_per_token": 0.00001,
1184+
"litellm_provider": "openai",
1185+
"supported_endpoints": ["/v1/audio/transcriptions"]
1186+
},
1187+
"gpt-4o-mini-transcribe": {
1188+
"mode": "audio_transcription",
1189+
"input_cost_per_token": 0.00000125,
1190+
"input_cost_per_audio_token": 0.000003,
1191+
"output_cost_per_token": 0.000005,
1192+
"litellm_provider": "openai",
1193+
"supported_endpoints": ["/v1/audio/transcriptions"]
1194+
},
11791195
"whisper-1": {
11801196
"mode": "audio_transcription",
11811197
"input_cost_per_second": 0.0001,
11821198
"output_cost_per_second": 0.0001,
1183-
"litellm_provider": "openai"
1199+
"litellm_provider": "openai",
1200+
"supported_endpoints": ["/v1/audio/transcriptions"]
11841201
},
11851202
"tts-1": {
11861203
"mode": "audio_speech",
11871204
"input_cost_per_character": 0.000015,
1188-
"litellm_provider": "openai"
1205+
"litellm_provider": "openai",
1206+
"supported_endpoints": ["/v1/audio/speech"]
11891207
},
11901208
"tts-1-hd": {
11911209
"mode": "audio_speech",
11921210
"input_cost_per_character": 0.000030,
1193-
"litellm_provider": "openai"
1211+
"litellm_provider": "openai",
1212+
"supported_endpoints": ["/v1/audio/speech"]
11941213
},
11951214
"azure/gpt-4o-mini-realtime-preview-2024-12-17": {
11961215
"max_tokens": 4096,
@@ -4595,6 +4614,28 @@
45954614
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash",
45964615
"supports_tool_choice": true
45974616
},
4617+
"gemini-2.0-flash-lite": {
4618+
"max_input_tokens": 1048576,
4619+
"max_output_tokens": 8192,
4620+
"max_images_per_prompt": 3000,
4621+
"max_videos_per_prompt": 10,
4622+
"max_video_length": 1,
4623+
"max_audio_length_hours": 8.4,
4624+
"max_audio_per_prompt": 1,
4625+
"max_pdf_size_mb": 50,
4626+
"input_cost_per_audio_token": 0.000000075,
4627+
"input_cost_per_token": 0.000000075,
4628+
"output_cost_per_token": 0.0000003,
4629+
"litellm_provider": "vertex_ai-language-models",
4630+
"mode": "chat",
4631+
"supports_system_messages": true,
4632+
"supports_function_calling": true,
4633+
"supports_vision": true,
4634+
"supports_response_schema": true,
4635+
"supports_audio_output": true,
4636+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash",
4637+
"supports_tool_choice": true
4638+
},
45984639
"gemini/gemini-2.0-pro-exp-02-05": {
45994640
"max_tokens": 8192,
46004641
"max_input_tokens": 2097152,
@@ -4655,9 +4696,35 @@
46554696
"supports_vision": true,
46564697
"supports_response_schema": true,
46574698
"supports_audio_output": true,
4699+
"supports_audio_input": true,
4700+
"supported_modalities": ["text", "image", "audio", "video"],
46584701
"supports_tool_choice": true,
46594702
"source": "https://ai.google.dev/pricing#2_0flash"
46604703
},
4704+
"gemini/gemini-2.0-flash-lite": {
4705+
"max_input_tokens": 1048576,
4706+
"max_output_tokens": 8192,
4707+
"max_images_per_prompt": 3000,
4708+
"max_videos_per_prompt": 10,
4709+
"max_video_length": 1,
4710+
"max_audio_length_hours": 8.4,
4711+
"max_audio_per_prompt": 1,
4712+
"max_pdf_size_mb": 50,
4713+
"input_cost_per_audio_token": 0.000000075,
4714+
"input_cost_per_token": 0.000000075,
4715+
"output_cost_per_token": 0.0000003,
4716+
"litellm_provider": "gemini",
4717+
"mode": "chat",
4718+
"tpm": 4000000,
4719+
"rpm": 4000,
4720+
"supports_system_messages": true,
4721+
"supports_function_calling": true,
4722+
"supports_vision": true,
4723+
"supports_response_schema": true,
4724+
"supports_audio_output": true,
4725+
"supports_tool_choice": true,
4726+
"source": "https://ai.google.dev/gemini-api/docs/pricing#gemini-2.0-flash-lite"
4727+
},
46614728
"gemini/gemini-2.0-flash-001": {
46624729
"max_tokens": 8192,
46634730
"max_input_tokens": 1048576,
@@ -5153,6 +5220,29 @@
51535220
"supports_function_calling": true,
51545221
"supports_tool_choice": true
51555222
},
5223+
"vertex_ai/mistral-small-2503@001": {
5224+
"max_tokens": 8191,
5225+
"max_input_tokens": 32000,
5226+
"max_output_tokens": 8191,
5227+
"input_cost_per_token": 0.000001,
5228+
"output_cost_per_token": 0.000003,
5229+
"litellm_provider": "vertex_ai-mistral_models",
5230+
"supports_function_calling": true,
5231+
"mode": "chat",
5232+
"supports_tool_choice": true
5233+
},
5234+
"vertex_ai/mistral-small-2503": {
5235+
"max_tokens": 128000,
5236+
"max_input_tokens": 128000,
5237+
"max_output_tokens": 128000,
5238+
"input_cost_per_token": 0.000001,
5239+
"output_cost_per_token": 0.000003,
5240+
"litellm_provider": "vertex_ai-mistral_models",
5241+
"mode": "chat",
5242+
"supports_function_calling": true,
5243+
"supports_vision": true,
5244+
"supports_tool_choice": true
5245+
},
51565246
"vertex_ai/jamba-1.5-mini@001": {
51575247
"max_tokens": 256000,
51585248
"max_input_tokens": 256000,
@@ -5304,6 +5394,51 @@
53045394
"mode": "embedding",
53055395
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models"
53065396
},
5397+
"multimodalembedding": {
5398+
"max_tokens": 2048,
5399+
"max_input_tokens": 2048,
5400+
"output_vector_size": 768,
5401+
"input_cost_per_character": 0.0000002,
5402+
"input_cost_per_image": 0.0001,
5403+
"input_cost_per_video_per_second": 0.0005,
5404+
"input_cost_per_video_per_second_above_8s_interval": 0.0010,
5405+
"input_cost_per_video_per_second_above_15s_interval": 0.0020,
5406+
"input_cost_per_token": 0.0000008,
5407+
"output_cost_per_token": 0,
5408+
"litellm_provider": "vertex_ai-embedding-models",
5409+
"mode": "embedding",
5410+
"supported_endpoints": ["/v1/embeddings"],
5411+
"supported_modalities": ["text", "image", "video"],
5412+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models"
5413+
},
5414+
"multimodalembedding@001": {
5415+
"max_tokens": 2048,
5416+
"max_input_tokens": 2048,
5417+
"output_vector_size": 768,
5418+
"input_cost_per_character": 0.0000002,
5419+
"input_cost_per_image": 0.0001,
5420+
"input_cost_per_video_per_second": 0.0005,
5421+
"input_cost_per_video_per_second_above_8s_interval": 0.0010,
5422+
"input_cost_per_video_per_second_above_15s_interval": 0.0020,
5423+
"input_cost_per_token": 0.0000008,
5424+
"output_cost_per_token": 0,
5425+
"litellm_provider": "vertex_ai-embedding-models",
5426+
"mode": "embedding",
5427+
"supported_endpoints": ["/v1/embeddings"],
5428+
"supported_modalities": ["text", "image", "video"],
5429+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models"
5430+
},
5431+
"text-embedding-large-exp-03-07": {
5432+
"max_tokens": 8192,
5433+
"max_input_tokens": 8192,
5434+
"output_vector_size": 3072,
5435+
"input_cost_per_character": 0.000000025,
5436+
"input_cost_per_token": 0.0000001,
5437+
"output_cost_per_token": 0,
5438+
"litellm_provider": "vertex_ai-embedding-models",
5439+
"mode": "embedding",
5440+
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models"
5441+
},
53075442
"textembedding-gecko": {
53085443
"max_tokens": 3072,
53095444
"max_input_tokens": 3072,

0 commit comments

Comments
 (0)