|
1176 | 1176 | "output_cost_per_pixel": 0.0,
|
1177 | 1177 | "litellm_provider": "openai"
|
1178 | 1178 | },
|
| 1179 | + "gpt-4o-transcribe": { |
| 1180 | + "mode": "audio_transcription", |
| 1181 | + "input_cost_per_token": 0.0000025, |
| 1182 | + "input_cost_per_audio_token": 0.000006, |
| 1183 | + "output_cost_per_token": 0.00001, |
| 1184 | + "litellm_provider": "openai", |
| 1185 | + "supported_endpoints": ["/v1/audio/transcriptions"] |
| 1186 | + }, |
| 1187 | + "gpt-4o-mini-transcribe": { |
| 1188 | + "mode": "audio_transcription", |
| 1189 | + "input_cost_per_token": 0.00000125, |
| 1190 | + "input_cost_per_audio_token": 0.000003, |
| 1191 | + "output_cost_per_token": 0.000005, |
| 1192 | + "litellm_provider": "openai", |
| 1193 | + "supported_endpoints": ["/v1/audio/transcriptions"] |
| 1194 | + }, |
1179 | 1195 | "whisper-1": {
|
1180 | 1196 | "mode": "audio_transcription",
|
1181 | 1197 | "input_cost_per_second": 0.0001,
|
1182 | 1198 | "output_cost_per_second": 0.0001,
|
1183 |
| - "litellm_provider": "openai" |
| 1199 | + "litellm_provider": "openai", |
| 1200 | + "supported_endpoints": ["/v1/audio/transcriptions"] |
1184 | 1201 | },
|
1185 | 1202 | "tts-1": {
|
1186 | 1203 | "mode": "audio_speech",
|
1187 | 1204 | "input_cost_per_character": 0.000015,
|
1188 |
| - "litellm_provider": "openai" |
| 1205 | + "litellm_provider": "openai", |
| 1206 | + "supported_endpoints": ["/v1/audio/speech"] |
1189 | 1207 | },
|
1190 | 1208 | "tts-1-hd": {
|
1191 | 1209 | "mode": "audio_speech",
|
1192 | 1210 | "input_cost_per_character": 0.000030,
|
1193 |
| - "litellm_provider": "openai" |
| 1211 | + "litellm_provider": "openai", |
| 1212 | + "supported_endpoints": ["/v1/audio/speech"] |
1194 | 1213 | },
|
1195 | 1214 | "azure/gpt-4o-mini-realtime-preview-2024-12-17": {
|
1196 | 1215 | "max_tokens": 4096,
|
|
4595 | 4614 | "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash",
|
4596 | 4615 | "supports_tool_choice": true
|
4597 | 4616 | },
|
| 4617 | + "gemini-2.0-flash-lite": { |
| 4618 | + "max_input_tokens": 1048576, |
| 4619 | + "max_output_tokens": 8192, |
| 4620 | + "max_images_per_prompt": 3000, |
| 4621 | + "max_videos_per_prompt": 10, |
| 4622 | + "max_video_length": 1, |
| 4623 | + "max_audio_length_hours": 8.4, |
| 4624 | + "max_audio_per_prompt": 1, |
| 4625 | + "max_pdf_size_mb": 50, |
| 4626 | + "input_cost_per_audio_token": 0.000000075, |
| 4627 | + "input_cost_per_token": 0.000000075, |
| 4628 | + "output_cost_per_token": 0.0000003, |
| 4629 | + "litellm_provider": "vertex_ai-language-models", |
| 4630 | + "mode": "chat", |
| 4631 | + "supports_system_messages": true, |
| 4632 | + "supports_function_calling": true, |
| 4633 | + "supports_vision": true, |
| 4634 | + "supports_response_schema": true, |
| 4635 | + "supports_audio_output": true, |
| 4636 | + "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", |
| 4637 | + "supports_tool_choice": true |
| 4638 | + }, |
4598 | 4639 | "gemini/gemini-2.0-pro-exp-02-05": {
|
4599 | 4640 | "max_tokens": 8192,
|
4600 | 4641 | "max_input_tokens": 2097152,
|
|
4655 | 4696 | "supports_vision": true,
|
4656 | 4697 | "supports_response_schema": true,
|
4657 | 4698 | "supports_audio_output": true,
|
| 4699 | + "supports_audio_input": true, |
| 4700 | + "supported_modalities": ["text", "image", "audio", "video"], |
4658 | 4701 | "supports_tool_choice": true,
|
4659 | 4702 | "source": "https://ai.google.dev/pricing#2_0flash"
|
4660 | 4703 | },
|
| 4704 | + "gemini/gemini-2.0-flash-lite": { |
| 4705 | + "max_input_tokens": 1048576, |
| 4706 | + "max_output_tokens": 8192, |
| 4707 | + "max_images_per_prompt": 3000, |
| 4708 | + "max_videos_per_prompt": 10, |
| 4709 | + "max_video_length": 1, |
| 4710 | + "max_audio_length_hours": 8.4, |
| 4711 | + "max_audio_per_prompt": 1, |
| 4712 | + "max_pdf_size_mb": 50, |
| 4713 | + "input_cost_per_audio_token": 0.000000075, |
| 4714 | + "input_cost_per_token": 0.000000075, |
| 4715 | + "output_cost_per_token": 0.0000003, |
| 4716 | + "litellm_provider": "gemini", |
| 4717 | + "mode": "chat", |
| 4718 | + "tpm": 4000000, |
| 4719 | + "rpm": 4000, |
| 4720 | + "supports_system_messages": true, |
| 4721 | + "supports_function_calling": true, |
| 4722 | + "supports_vision": true, |
| 4723 | + "supports_response_schema": true, |
| 4724 | + "supports_audio_output": true, |
| 4725 | + "supports_tool_choice": true, |
| 4726 | + "source": "https://ai.google.dev/gemini-api/docs/pricing#gemini-2.0-flash-lite" |
| 4727 | + }, |
4661 | 4728 | "gemini/gemini-2.0-flash-001": {
|
4662 | 4729 | "max_tokens": 8192,
|
4663 | 4730 | "max_input_tokens": 1048576,
|
|
5153 | 5220 | "supports_function_calling": true,
|
5154 | 5221 | "supports_tool_choice": true
|
5155 | 5222 | },
|
| 5223 | + "vertex_ai/mistral-small-2503@001": { |
| 5224 | + "max_tokens": 8191, |
| 5225 | + "max_input_tokens": 32000, |
| 5226 | + "max_output_tokens": 8191, |
| 5227 | + "input_cost_per_token": 0.000001, |
| 5228 | + "output_cost_per_token": 0.000003, |
| 5229 | + "litellm_provider": "vertex_ai-mistral_models", |
| 5230 | + "supports_function_calling": true, |
| 5231 | + "mode": "chat", |
| 5232 | + "supports_tool_choice": true |
| 5233 | + }, |
| 5234 | + "vertex_ai/mistral-small-2503": { |
| 5235 | + "max_tokens": 128000, |
| 5236 | + "max_input_tokens": 128000, |
| 5237 | + "max_output_tokens": 128000, |
| 5238 | + "input_cost_per_token": 0.000001, |
| 5239 | + "output_cost_per_token": 0.000003, |
| 5240 | + "litellm_provider": "vertex_ai-mistral_models", |
| 5241 | + "mode": "chat", |
| 5242 | + "supports_function_calling": true, |
| 5243 | + "supports_vision": true, |
| 5244 | + "supports_tool_choice": true |
| 5245 | + }, |
5156 | 5246 | "vertex_ai/jamba-1.5-mini@001": {
|
5157 | 5247 | "max_tokens": 256000,
|
5158 | 5248 | "max_input_tokens": 256000,
|
|
5304 | 5394 | "mode": "embedding",
|
5305 | 5395 | "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models"
|
5306 | 5396 | },
|
| 5397 | + "multimodalembedding": { |
| 5398 | + "max_tokens": 2048, |
| 5399 | + "max_input_tokens": 2048, |
| 5400 | + "output_vector_size": 768, |
| 5401 | + "input_cost_per_character": 0.0000002, |
| 5402 | + "input_cost_per_image": 0.0001, |
| 5403 | + "input_cost_per_video_per_second": 0.0005, |
| 5404 | + "input_cost_per_video_per_second_above_8s_interval": 0.0010, |
| 5405 | + "input_cost_per_video_per_second_above_15s_interval": 0.0020, |
| 5406 | + "input_cost_per_token": 0.0000008, |
| 5407 | + "output_cost_per_token": 0, |
| 5408 | + "litellm_provider": "vertex_ai-embedding-models", |
| 5409 | + "mode": "embedding", |
| 5410 | + "supported_endpoints": ["/v1/embeddings"], |
| 5411 | + "supported_modalities": ["text", "image", "video"], |
| 5412 | + "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models" |
| 5413 | + }, |
| 5414 | + "multimodalembedding@001": { |
| 5415 | + "max_tokens": 2048, |
| 5416 | + "max_input_tokens": 2048, |
| 5417 | + "output_vector_size": 768, |
| 5418 | + "input_cost_per_character": 0.0000002, |
| 5419 | + "input_cost_per_image": 0.0001, |
| 5420 | + "input_cost_per_video_per_second": 0.0005, |
| 5421 | + "input_cost_per_video_per_second_above_8s_interval": 0.0010, |
| 5422 | + "input_cost_per_video_per_second_above_15s_interval": 0.0020, |
| 5423 | + "input_cost_per_token": 0.0000008, |
| 5424 | + "output_cost_per_token": 0, |
| 5425 | + "litellm_provider": "vertex_ai-embedding-models", |
| 5426 | + "mode": "embedding", |
| 5427 | + "supported_endpoints": ["/v1/embeddings"], |
| 5428 | + "supported_modalities": ["text", "image", "video"], |
| 5429 | + "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models" |
| 5430 | + }, |
| 5431 | + "text-embedding-large-exp-03-07": { |
| 5432 | + "max_tokens": 8192, |
| 5433 | + "max_input_tokens": 8192, |
| 5434 | + "output_vector_size": 3072, |
| 5435 | + "input_cost_per_character": 0.000000025, |
| 5436 | + "input_cost_per_token": 0.0000001, |
| 5437 | + "output_cost_per_token": 0, |
| 5438 | + "litellm_provider": "vertex_ai-embedding-models", |
| 5439 | + "mode": "embedding", |
| 5440 | + "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models" |
| 5441 | + }, |
5307 | 5442 | "textembedding-gecko": {
|
5308 | 5443 | "max_tokens": 3072,
|
5309 | 5444 | "max_input_tokens": 3072,
|
|
0 commit comments