{ "sample_spec": { "max_tokens": "LEGACY parameter. Set to max_output_tokens if the provider specifies it; if not, set to max_input_tokens, if the provider specifies it.", "max_input_tokens": "Max input tokens, if the provider specifies it; if not, defaults to max_tokens.", "max_output_tokens": "Max output tokens, if the provider specifies it; if not, defaults to max_tokens.", "input_cost_per_token": 0.0000, "output_cost_per_token": 0.000, "litellm_provider": "one of the providers listed at https://docs.litellm.ai/docs/providers", "mode": "one of chat, embedding, completion, image_generation, audio_transcription, audio_speech, moderation", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_audio_input": true, "supports_audio_output": true, "supports_prompt_caching": true, "supports_response_schema": true, "supports_system_messages": true, "deprecation_date": "date when the model becomes deprecated, in the format YYYY-MM-DD" }, "omni-moderation-latest": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "openai", "mode": "moderation" }, "omni-moderation-latest-intents": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "openai", "mode": "moderation" }, "omni-moderation-2024-09-26": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "openai", "mode": "moderation" }, "gpt-4": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o": { "max_tokens": 16384, "max_input_tokens": 128000, 
"max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000010, "input_cost_per_token_batches": 0.00000125, "output_cost_per_token_batches": 0.00000500, "cache_read_input_token_cost": 0.00000125, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-audio-preview": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.0001, "output_cost_per_token": 0.000010, "output_cost_per_audio_token": 0.0002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-audio-preview-2024-12-17": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.00004, "output_cost_per_token": 0.000010, "output_cost_per_audio_token": 0.00008, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-audio-preview-2024-10-01": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "input_cost_per_audio_token": 0.0001, "output_cost_per_token": 0.000010, "output_cost_per_audio_token": 0.0002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, 
"supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-mini-audio-preview-2024-12-17": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "input_cost_per_audio_token": 0.00001, "output_cost_per_token": 0.0000006, "output_cost_per_audio_token": 0.00002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-mini": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000060, "input_cost_per_token_batches": 0.000000075, "output_cost_per_token_batches": 0.00000030, "cache_read_input_token_cost": 0.000000075, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-mini-2024-07-18": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000060, "input_cost_per_token_batches": 0.000000075, "output_cost_per_token_batches": 0.00000030, "cache_read_input_token_cost": 0.000000075, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "o1": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00006, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "openai", 
"mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_response_schema": true, "supports_tool_choice": true }, "o1-mini": { "max_tokens": 65536, "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055, "litellm_provider": "openai", "mode": "chat", "supports_vision": true, "supports_prompt_caching": true }, "o3-mini": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": false, "supports_vision": false, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "o3-mini-2025-01-31": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": false, "supports_vision": false, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "o1-mini-2024-09-12": { "max_tokens": 65536, "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000015, "litellm_provider": "openai", "mode": "chat", "supports_vision": true, "supports_prompt_caching": true }, "o1-preview": { "max_tokens": 32768, "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "cache_read_input_token_cost": 
0.0000075, "litellm_provider": "openai", "mode": "chat", "supports_vision": true, "supports_prompt_caching": true }, "o1-preview-2024-09-12": { "max_tokens": 32768, "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "openai", "mode": "chat", "supports_vision": true, "supports_prompt_caching": true }, "o1-2024-12-17": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_response_schema": true, "supports_tool_choice": true }, "chatgpt-4o-latest": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-2024-05-13": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015, "input_cost_per_token_batches": 0.0000025, "output_cost_per_token_batches": 0.0000075, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-2024-08-06": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, 
"output_cost_per_token": 0.000010, "input_cost_per_token_batches": 0.00000125, "output_cost_per_token_batches": 0.0000050, "cache_read_input_token_cost": 0.00000125, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-2024-11-20": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000010, "input_cost_per_token_batches": 0.00000125, "output_cost_per_token_batches": 0.0000050, "cache_read_input_token_cost": 0.00000125, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-realtime-preview-2024-10-01": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "input_cost_per_audio_token": 0.0001, "cache_read_input_token_cost": 0.0000025, "cache_creation_input_audio_token_cost": 0.00002, "output_cost_per_token": 0.00002, "output_cost_per_audio_token": 0.0002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-realtime-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "input_cost_per_audio_token": 0.00004, "cache_read_input_token_cost": 0.0000025, "output_cost_per_token": 0.00002, "output_cost_per_audio_token": 0.00008, "litellm_provider": "openai", "mode": "chat", 
"supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-realtime-preview-2024-12-17": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "input_cost_per_audio_token": 0.00004, "cache_read_input_token_cost": 0.0000025, "output_cost_per_token": 0.00002, "output_cost_per_audio_token": 0.00008, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-mini-realtime-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000006, "input_cost_per_audio_token": 0.00001, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_audio_token_cost": 0.0000003, "output_cost_per_token": 0.0000024, "output_cost_per_audio_token": 0.00002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4o-mini-realtime-preview-2024-12-17": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000006, "input_cost_per_audio_token": 0.00001, "cache_read_input_token_cost": 0.0000003, "cache_creation_input_audio_token_cost": 0.0000003, "output_cost_per_token": 0.0000024, "output_cost_per_audio_token": 0.00002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_audio_input": true, "supports_audio_output": true, "supports_system_messages": true, "supports_tool_choice": true }, 
"gpt-4-turbo-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-0314": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006, "litellm_provider": "openai", "mode": "chat", "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-0613": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "deprecation_date": "2025-06-06", "supports_tool_choice": true }, "gpt-4-32k": { "max_tokens": 4096, "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00006, "output_cost_per_token": 0.00012, "litellm_provider": "openai", "mode": "chat", "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-32k-0314": { "max_tokens": 4096, "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00006, "output_cost_per_token": 0.00012, "litellm_provider": "openai", "mode": "chat", "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-32k-0613": { "max_tokens": 4096, "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00006, "output_cost_per_token": 0.00012, "litellm_provider": "openai", "mode": "chat", "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-turbo": { 
"max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-turbo-2024-04-09": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-1106-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-0125-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-4-vision-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "openai", "mode": "chat", "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "deprecation_date": "2024-12-06", "supports_tool_choice": true }, "gpt-4-1106-vision-preview": { 
"max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "openai", "mode": "chat", "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "deprecation_date": "2024-12-06", "supports_tool_choice": true }, "gpt-3.5-turbo": { "max_tokens": 4097, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-3.5-turbo-0301": { "max_tokens": 4097, "max_input_tokens": 4097, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "openai", "mode": "chat", "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-3.5-turbo-0613": { "max_tokens": 4097, "max_input_tokens": 4097, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-3.5-turbo-1106": { "max_tokens": 16385, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.0000010, "output_cost_per_token": 0.0000020, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-3.5-turbo-0125": { "max_tokens": 16385, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, 
"supports_parallel_function_calling": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-3.5-turbo-16k": { "max_tokens": 16385, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004, "litellm_provider": "openai", "mode": "chat", "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "gpt-3.5-turbo-16k-0613": { "max_tokens": 16385, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004, "litellm_provider": "openai", "mode": "chat", "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-3.5-turbo": { "max_tokens": 4096, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006, "input_cost_per_token_batches": 0.0000015, "output_cost_per_token_batches": 0.000003, "litellm_provider": "openai", "mode": "chat", "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-3.5-turbo-0125": { "max_tokens": 4096, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006, "litellm_provider": "openai", "mode": "chat", "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-3.5-turbo-1106": { "max_tokens": 4096, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006, "litellm_provider": "openai", "mode": "chat", "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-3.5-turbo-0613": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000006, "litellm_provider": "openai", "mode": "chat", "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-4-0613": { 
"max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "source": "OpenAI has not yet published pricing for this ft model; this entry will be updated when OpenAI adds it. Defaulting to base model pricing.", "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-4o-2024-08-06": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000375, "output_cost_per_token": 0.000015, "input_cost_per_token_batches": 0.000001875, "output_cost_per_token_batches": 0.000007500, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-4o-2024-11-20": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000375, "cache_creation_input_token_cost": 0.000001875, "output_cost_per_token": 0.000015, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_tool_choice": true }, "ft:gpt-4o-mini-2024-07-18": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000012, "input_cost_per_token_batches": 0.000000150, "output_cost_per_token_batches": 0.000000600, "cache_read_input_token_cost": 0.00000015, "litellm_provider": "openai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": 
true, "supports_tool_choice": true }, "ft:davinci-002": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002, "input_cost_per_token_batches": 0.000001, "output_cost_per_token_batches": 0.000001, "litellm_provider": "text-completion-openai", "mode": "completion" }, "ft:babbage-002": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000004, "input_cost_per_token_batches": 0.0000002, "output_cost_per_token_batches": 0.0000002, "litellm_provider": "text-completion-openai", "mode": "completion" }, "text-embedding-3-large": { "max_tokens": 8191, "max_input_tokens": 8191, "output_vector_size": 3072, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.000000, "input_cost_per_token_batches": 0.000000065, "output_cost_per_token_batches": 0.000000000, "litellm_provider": "openai", "mode": "embedding" }, "text-embedding-3-small": { "max_tokens": 8191, "max_input_tokens": 8191, "output_vector_size": 1536, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0.000000, "input_cost_per_token_batches": 0.000000010, "output_cost_per_token_batches": 0.000000000, "litellm_provider": "openai", "mode": "embedding" }, "text-embedding-ada-002": { "max_tokens": 8191, "max_input_tokens": 8191, "output_vector_size": 1536, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "openai", "mode": "embedding" }, "text-embedding-ada-002-v2": { "max_tokens": 8191, "max_input_tokens": 8191, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "input_cost_per_token_batches": 0.000000050, "output_cost_per_token_batches": 0.000000000, "litellm_provider": "openai", "mode": "embedding" }, "text-moderation-stable": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0.000000, "output_cost_per_token": 0.000000, 
"litellm_provider": "openai", "mode": "moderation" }, "text-moderation-007": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0.000000, "output_cost_per_token": 0.000000, "litellm_provider": "openai", "mode": "moderation" }, "text-moderation-latest": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 0, "input_cost_per_token": 0.000000, "output_cost_per_token": 0.000000, "litellm_provider": "openai", "mode": "moderation" }, "256-x-256/dall-e-2": { "mode": "image_generation", "input_cost_per_pixel": 0.00000024414, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "512-x-512/dall-e-2": { "mode": "image_generation", "input_cost_per_pixel": 0.0000000686, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "1024-x-1024/dall-e-2": { "mode": "image_generation", "input_cost_per_pixel": 0.000000019, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "hd/1024-x-1792/dall-e-3": { "mode": "image_generation", "input_cost_per_pixel": 0.00000006539, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "hd/1792-x-1024/dall-e-3": { "mode": "image_generation", "input_cost_per_pixel": 0.00000006539, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "hd/1024-x-1024/dall-e-3": { "mode": "image_generation", "input_cost_per_pixel": 0.00000007629, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "standard/1024-x-1792/dall-e-3": { "mode": "image_generation", "input_cost_per_pixel": 0.00000004359, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "standard/1792-x-1024/dall-e-3": { "mode": "image_generation", "input_cost_per_pixel": 0.00000004359, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "standard/1024-x-1024/dall-e-3": { "mode": "image_generation", "input_cost_per_pixel": 0.0000000381469, "output_cost_per_pixel": 0.0, "litellm_provider": "openai" }, "whisper-1": { "mode": "audio_transcription", "input_cost_per_second": 
0.0001, "output_cost_per_second": 0.0001, "litellm_provider": "openai" }, "tts-1": { "mode": "audio_speech", "input_cost_per_character": 0.000015, "litellm_provider": "openai" }, "tts-1-hd": { "mode": "audio_speech", "input_cost_per_character": 0.000030, "litellm_provider": "openai" }, "azure/o3-mini-2025-01-31": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055, "litellm_provider": "azure", "mode": "chat", "supports_vision": false, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/tts-1": { "mode": "audio_speech", "input_cost_per_character": 0.000015, "litellm_provider": "azure" }, "azure/tts-1-hd": { "mode": "audio_speech", "input_cost_per_character": 0.000030, "litellm_provider": "azure" }, "azure/whisper-1": { "mode": "audio_transcription", "input_cost_per_second": 0.0001, "output_cost_per_second": 0.0001, "litellm_provider": "azure" }, "azure/o3-mini": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.0000044, "cache_read_input_token_cost": 0.00000055, "litellm_provider": "azure", "mode": "chat", "supports_vision": false, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "azure/o1-mini": { "max_tokens": 65536, "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 0.0000015, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_prompt_caching": true }, "azure/o1-mini-2024-09-12": { "max_tokens": 65536, "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000012, "cache_read_input_token_cost": 
0.0000015, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_prompt_caching": true }, "azure/o1": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/o1-2024-12-17": { "max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/o1-preview": { "max_tokens": 32768, "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_prompt_caching": true }, "azure/o1-preview-2024-09-12": { "max_tokens": 32768, "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_prompt_caching": true }, "azure/gpt-4o": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 
0.000015, "cache_read_input_token_cost": 0.00000125, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/gpt-4o-2024-08-06": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000275, "output_cost_per_token": 0.000011, "cache_read_input_token_cost": 0.00000125, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/gpt-4o-2024-11-20": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000275, "output_cost_per_token": 0.000011, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "azure/gpt-4o-2024-05-13": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/global-standard/gpt-4o-2024-08-06": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000010, "cache_read_input_token_cost": 0.00000125, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, 
"azure/global-standard/gpt-4o-2024-11-20": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.000010, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "azure/global-standard/gpt-4o-mini": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000060, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "azure/gpt-4o-mini": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.000000165, "output_cost_per_token": 0.00000066, "cache_read_input_token_cost": 0.000000075, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/gpt-4o-mini-2024-07-18": { "max_tokens": 16384, "max_input_tokens": 128000, "max_output_tokens": 16384, "input_cost_per_token": 0.000000165, "output_cost_per_token": 0.00000066, "cache_read_input_token_cost": 0.000000075, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_prompt_caching": true, "supports_tool_choice": true }, "azure/gpt-4-turbo-2024-04-09": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "azure", "mode": "chat", 
"supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "azure/gpt-4-0125-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_tool_choice": true }, "azure/gpt-4-1106-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_tool_choice": true }, "azure/gpt-4-0613": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "azure/gpt-4-32k-0613": { "max_tokens": 4096, "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00006, "output_cost_per_token": 0.00012, "litellm_provider": "azure", "mode": "chat", "supports_tool_choice": true }, "azure/gpt-4-32k": { "max_tokens": 4096, "max_input_tokens": 32768, "max_output_tokens": 4096, "input_cost_per_token": 0.00006, "output_cost_per_token": 0.00012, "litellm_provider": "azure", "mode": "chat", "supports_tool_choice": true }, "azure/gpt-4": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "azure/gpt-4-turbo": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, 
"litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_tool_choice": true }, "azure/gpt-4-turbo-vision-preview": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "litellm_provider": "azure", "mode": "chat", "supports_vision": true, "supports_tool_choice": true }, "azure/gpt-35-turbo-16k-0613": { "max_tokens": 4096, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "azure/gpt-35-turbo-1106": { "max_tokens": 4096, "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "deprecation_date": "2025-03-31", "supports_tool_choice": true }, "azure/gpt-35-turbo-0613": { "max_tokens": 4097, "max_input_tokens": 4097, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "deprecation_date": "2025-02-13", "supports_tool_choice": true }, "azure/gpt-35-turbo-0301": { "max_tokens": 4097, "max_input_tokens": 4097, "max_output_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.000002, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "deprecation_date": "2025-02-13", "supports_tool_choice": true }, "azure/gpt-35-turbo-0125": { "max_tokens": 4096, "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, 
"litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "deprecation_date": "2025-03-31", "supports_tool_choice": true }, "azure/gpt-35-turbo-16k": { "max_tokens": 4096, "max_input_tokens": 16385, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004, "litellm_provider": "azure", "mode": "chat", "supports_tool_choice": true }, "azure/gpt-35-turbo": { "max_tokens": 4096, "max_input_tokens": 4097, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "azure/gpt-3.5-turbo-instruct-0914": { "max_tokens": 4097, "max_input_tokens": 4097, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "azure_text", "mode": "completion" }, "azure/gpt-35-turbo-instruct": { "max_tokens": 4097, "max_input_tokens": 4097, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "azure_text", "mode": "completion" }, "azure/gpt-35-turbo-instruct-0914": { "max_tokens": 4097, "max_input_tokens": 4097, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "azure_text", "mode": "completion" }, "azure/mistral-large-latest": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true }, "azure/mistral-large-2402": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "azure", "mode": "chat", "supports_function_calling": true }, "azure/command-r-plus": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": 
"azure", "mode": "chat", "supports_function_calling": true }, "azure/ada": { "max_tokens": 8191, "max_input_tokens": 8191, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "azure", "mode": "embedding" }, "azure/text-embedding-ada-002": { "max_tokens": 8191, "max_input_tokens": 8191, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "azure", "mode": "embedding" }, "azure/text-embedding-3-large": { "max_tokens": 8191, "max_input_tokens": 8191, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.000000, "litellm_provider": "azure", "mode": "embedding" }, "azure/text-embedding-3-small": { "max_tokens": 8191, "max_input_tokens": 8191, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0.000000, "litellm_provider": "azure", "mode": "embedding" }, "azure/standard/1024-x-1024/dall-e-3": { "input_cost_per_pixel": 0.0000000381469, "output_cost_per_token": 0.0, "litellm_provider": "azure", "mode": "image_generation" }, "azure/hd/1024-x-1024/dall-e-3": { "input_cost_per_pixel": 0.00000007629, "output_cost_per_token": 0.0, "litellm_provider": "azure", "mode": "image_generation" }, "azure/standard/1024-x-1792/dall-e-3": { "input_cost_per_pixel": 0.00000004359, "output_cost_per_token": 0.0, "litellm_provider": "azure", "mode": "image_generation" }, "azure/standard/1792-x-1024/dall-e-3": { "input_cost_per_pixel": 0.00000004359, "output_cost_per_token": 0.0, "litellm_provider": "azure", "mode": "image_generation" }, "azure/hd/1024-x-1792/dall-e-3": { "input_cost_per_pixel": 0.00000006539, "output_cost_per_token": 0.0, "litellm_provider": "azure", "mode": "image_generation" }, "azure/hd/1792-x-1024/dall-e-3": { "input_cost_per_pixel": 0.00000006539, "output_cost_per_token": 0.0, "litellm_provider": "azure", "mode": "image_generation" }, "azure/standard/1024-x-1024/dall-e-2": { "input_cost_per_pixel": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "azure", "mode": 
"image_generation" }, "azure_ai/deepseek-r1": { "max_tokens": 8192, "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "input_cost_per_token_cache_hit": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "azure_ai", "mode": "chat", "supports_prompt_caching": true, "supports_tool_choice": true }, "azure_ai/jamba-instruct": { "max_tokens": 4096, "max_input_tokens": 70000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000007, "litellm_provider": "azure_ai", "mode": "chat", "supports_tool_choice": true }, "azure_ai/mistral-large": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000012, "litellm_provider": "azure_ai", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "azure_ai/mistral-small": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "litellm_provider": "azure_ai", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "azure_ai/mistral-large-2407": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "azure_ai", "supports_function_calling": true, "mode": "chat", "source": "https://azuremarketplace.microsoft.com/en/marketplace/apps/000-000.mistral-ai-large-2407-offer?tab=Overview", "supports_tool_choice": true }, "azure_ai/ministral-3b": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000004, "litellm_provider": "azure_ai", "supports_function_calling": true, "mode": "chat", "source": "https://azuremarketplace.microsoft.com/en/marketplace/apps/000-000.ministral-3b-2410-offer?tab=Overview", "supports_tool_choice": true }, 
"azure_ai/Llama-3.2-11B-Vision-Instruct": { "max_tokens": 2048, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000037, "output_cost_per_token": 0.00000037, "litellm_provider": "azure_ai", "supports_function_calling": true, "supports_vision": true, "mode": "chat", "source": "https://azuremarketplace.microsoft.com/en/marketplace/apps/metagenai.meta-llama-3-2-11b-vision-instruct-offer?tab=Overview", "supports_tool_choice": true }, "azure_ai/Llama-3.3-70B-Instruct": { "max_tokens": 2048, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000071, "output_cost_per_token": 0.00000071, "litellm_provider": "azure_ai", "supports_function_calling": true, "mode": "chat", "source": "https://azuremarketplace.microsoft.com/en/marketplace/apps/metagenai.llama-3-3-70b-instruct-offer?tab=Overview", "supports_tool_choice": true }, "azure_ai/Llama-3.2-90B-Vision-Instruct": { "max_tokens": 2048, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000204, "output_cost_per_token": 0.00000204, "litellm_provider": "azure_ai", "supports_function_calling": true, "supports_vision": true, "mode": "chat", "source": "https://azuremarketplace.microsoft.com/en/marketplace/apps/metagenai.meta-llama-3-2-90b-vision-instruct-offer?tab=Overview", "supports_tool_choice": true }, "azure_ai/Meta-Llama-3-70B-Instruct": { "max_tokens": 2048, "max_input_tokens": 8192, "max_output_tokens": 2048, "input_cost_per_token": 0.0000011, "output_cost_per_token": 0.00000037, "litellm_provider": "azure_ai", "mode": "chat", "supports_tool_choice": true }, "azure_ai/Meta-Llama-3.1-8B-Instruct": { "max_tokens": 2048, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.00000061, "litellm_provider": "azure_ai", "mode": "chat", "source":"https://azuremarketplace.microsoft.com/en-us/marketplace/apps/metagenai.meta-llama-3-1-8b-instruct-offer?tab=PlansAndPrice", 
"supports_tool_choice": true }, "azure_ai/Meta-Llama-3.1-70B-Instruct": { "max_tokens": 2048, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000268, "output_cost_per_token": 0.00000354, "litellm_provider": "azure_ai", "mode": "chat", "source":"https://azuremarketplace.microsoft.com/en-us/marketplace/apps/metagenai.meta-llama-3-1-70b-instruct-offer?tab=PlansAndPrice", "supports_tool_choice": true }, "azure_ai/Meta-Llama-3.1-405B-Instruct": { "max_tokens": 2048, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000533, "output_cost_per_token": 0.000016, "litellm_provider": "azure_ai", "mode": "chat", "source":"https://azuremarketplace.microsoft.com/en-us/marketplace/apps/metagenai.meta-llama-3-1-405b-instruct-offer?tab=PlansAndPrice", "supports_tool_choice": true }, "azure_ai/Phi-3.5-mini-instruct": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3.5-vision-instruct": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": true, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3.5-MoE-instruct": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000016, "output_cost_per_token": 0.00000064, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3-mini-4k-instruct": { "max_tokens": 4096, 
"max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3-mini-128k-instruct": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000052, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3-small-8k-instruct": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3-small-128k-instruct": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3-medium-4k-instruct": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000017, "output_cost_per_token": 0.00000068, "litellm_provider": "azure_ai", "mode": "chat", "supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/Phi-3-medium-128k-instruct": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000017, "output_cost_per_token": 0.00000068, "litellm_provider": "azure_ai", "mode": "chat", 
"supports_vision": false, "source": "https://azure.microsoft.com/en-us/pricing/details/phi-3/", "supports_tool_choice": true }, "azure_ai/cohere-rerank-v3-multilingual": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "max_query_tokens": 2048, "input_cost_per_token": 0.0, "input_cost_per_query": 0.002, "output_cost_per_token": 0.0, "litellm_provider": "azure_ai", "mode": "rerank" }, "azure_ai/cohere-rerank-v3-english": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "max_query_tokens": 2048, "input_cost_per_token": 0.0, "input_cost_per_query": 0.002, "output_cost_per_token": 0.0, "litellm_provider": "azure_ai", "mode": "rerank" }, "azure_ai/Cohere-embed-v3-english": { "max_tokens": 512, "max_input_tokens": 512, "output_vector_size": 1024, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0, "litellm_provider": "azure_ai", "mode": "embedding", "source":"https://azuremarketplace.microsoft.com/en-us/marketplace/apps/cohere.cohere-embed-v3-english-offer?tab=PlansAndPrice" }, "azure_ai/Cohere-embed-v3-multilingual": { "max_tokens": 512, "max_input_tokens": 512, "output_vector_size": 1024, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0, "litellm_provider": "azure_ai", "mode": "embedding", "source":"https://azuremarketplace.microsoft.com/en-us/marketplace/apps/cohere.cohere-embed-v3-multilingual-offer?tab=PlansAndPrice" }, "babbage-002": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000004, "litellm_provider": "text-completion-openai", "mode": "completion" }, "davinci-002": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002, "litellm_provider": "text-completion-openai", "mode": "completion" }, "gpt-3.5-turbo-instruct": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, 
"input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "text-completion-openai", "mode": "completion" }, "gpt-3.5-turbo-instruct-0914": { "max_tokens": 4097, "max_input_tokens": 8192, "max_output_tokens": 4097, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "text-completion-openai", "mode": "completion" }, "claude-instant-1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000163, "output_cost_per_token": 0.00000551, "litellm_provider": "anthropic", "mode": "chat" }, "mistral/mistral-tiny": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025, "litellm_provider": "mistral", "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-small": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "litellm_provider": "mistral", "supports_function_calling": true, "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-small-latest": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "litellm_provider": "mistral", "supports_function_calling": true, "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-medium": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000027, "output_cost_per_token": 0.0000081, "litellm_provider": "mistral", "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-medium-latest": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000027, "output_cost_per_token": 
0.0000081, "litellm_provider": "mistral", "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-medium-2312": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000027, "output_cost_per_token": 0.0000081, "litellm_provider": "mistral", "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-large-latest": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-large-2411": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-large-2402": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000004, "output_cost_per_token": 0.000012, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-large-2407": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000009, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/pixtral-large-latest": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, 
"supports_assistant_prefill": true, "supports_vision": true, "supports_tool_choice": true }, "mistral/pixtral-large-2411": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_vision": true, "supports_tool_choice": true }, "mistral/pixtral-12b-2409": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_vision": true, "supports_tool_choice": true }, "mistral/open-mistral-7b": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025, "litellm_provider": "mistral", "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/open-mixtral-8x7b": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000007, "output_cost_per_token": 0.0000007, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/open-mixtral-8x22b": { "max_tokens": 8191, "max_input_tokens": 65536, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "mistral", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/codestral-latest": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "litellm_provider": "mistral", "mode": "chat", "supports_assistant_prefill": 
true, "supports_tool_choice": true }, "mistral/codestral-2405": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "litellm_provider": "mistral", "mode": "chat", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/open-mistral-nemo": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003, "litellm_provider": "mistral", "mode": "chat", "source": "https://mistral.ai/technology/", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/open-mistral-nemo-2407": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003, "litellm_provider": "mistral", "mode": "chat", "source": "https://mistral.ai/technology/", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/open-codestral-mamba": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025, "litellm_provider": "mistral", "mode": "chat", "source": "https://mistral.ai/technology/", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/codestral-mamba-latest": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025, "litellm_provider": "mistral", "mode": "chat", "source": "https://mistral.ai/technology/", "supports_assistant_prefill": true, "supports_tool_choice": true }, "mistral/mistral-embed": { "max_tokens": 8192, "max_input_tokens": 8192, "input_cost_per_token": 0.0000001, "litellm_provider": "mistral", "mode": "embedding" }, "deepseek/deepseek-reasoner": { "max_tokens": 8192, "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 
0.00000055, "input_cost_per_token_cache_hit": 0.00000014, "output_cost_per_token": 0.00000219, "litellm_provider": "deepseek", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true, "supports_prompt_caching": true }, "deepseek/deepseek-chat": { "max_tokens": 8192, "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.00000027, "input_cost_per_token_cache_hit": 0.00000007, "cache_read_input_token_cost": 0.00000007, "cache_creation_input_token_cost": 0.0, "output_cost_per_token": 0.0000011, "litellm_provider": "deepseek", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true, "supports_prompt_caching": true }, "codestral/codestral-latest": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000000, "output_cost_per_token": 0.000000, "litellm_provider": "codestral", "mode": "chat", "source": "https://docs.mistral.ai/capabilities/code_generation/", "supports_assistant_prefill": true, "supports_tool_choice": true }, "codestral/codestral-2405": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000000, "output_cost_per_token": 0.000000, "litellm_provider": "codestral", "mode": "chat", "source": "https://docs.mistral.ai/capabilities/code_generation/", "supports_assistant_prefill": true, "supports_tool_choice": true }, "text-completion-codestral/codestral-latest": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000000, "output_cost_per_token": 0.000000, "litellm_provider": "text-completion-codestral", "mode": "completion", "source": "https://docs.mistral.ai/capabilities/code_generation/" }, "text-completion-codestral/codestral-2405": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000000, "output_cost_per_token": 
0.000000, "litellm_provider": "text-completion-codestral", "mode": "completion", "source": "https://docs.mistral.ai/capabilities/code_generation/" }, "xai/grok-beta": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015, "litellm_provider": "xai", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "xai/grok-2-vision-1212": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000002, "input_cost_per_image": 0.000002, "output_cost_per_token": 0.00001, "litellm_provider": "xai", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "xai/grok-2-vision-latest": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000002, "input_cost_per_image": 0.000002, "output_cost_per_token": 0.00001, "litellm_provider": "xai", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "xai/grok-2-vision": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000002, "input_cost_per_image": 0.000002, "output_cost_per_token": 0.00001, "litellm_provider": "xai", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "xai/grok-vision-beta": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000005, "input_cost_per_image": 0.000005, "output_cost_per_token": 0.000015, "litellm_provider": "xai", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "xai/grok-2-1212": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001, "litellm_provider": 
"xai", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "xai/grok-2": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001, "litellm_provider": "xai", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "xai/grok-2-latest": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.00001, "litellm_provider": "xai", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "deepseek/deepseek-coder": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000014, "input_cost_per_token_cache_hit": 0.000000014, "output_cost_per_token": 0.00000028, "litellm_provider": "deepseek", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true, "supports_prompt_caching": true }, "groq/deepseek-r1-distill-llama-70b": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.00000099, "litellm_provider": "groq", "mode": "chat", "supports_system_messages": false, "supports_function_calling": false, "supports_response_schema": false, "supports_tool_choice": true }, "groq/llama-3.3-70b-versatile": { "max_tokens": 8192, "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000079, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.3-70b-specdec": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000099, "litellm_provider": "groq", "mode": "chat", "supports_tool_choice": 
true }, "groq/llama2-70b-4096": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000080, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama3-8b-8192": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.2-1b-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000004, "output_cost_per_token": 0.00000004, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.2-3b-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000006, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.2-11b-text-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.2-11b-vision-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, 
"groq/llama-3.2-90b-text-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.2-90b-vision-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "groq/llama3-70b-8192": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000079, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.1-8b-instant": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000008, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.1-70b-versatile": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000079, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama-3.1-405b-reasoning": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000079, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/mixtral-8x7b-32768": { 
"max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000024, "output_cost_per_token": 0.00000024, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/gemma-7b-it": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000007, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/gemma2-9b-it": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000020, "output_cost_per_token": 0.00000020, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama3-groq-70b-8192-tool-use-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000089, "output_cost_per_token": 0.00000089, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "groq/llama3-groq-8b-8192-tool-use-preview": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000019, "output_cost_per_token": 0.00000019, "litellm_provider": "groq", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_tool_choice": true }, "cerebras/llama3.1-8b": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "cerebras", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "cerebras/llama3.1-70b": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, 
"input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006, "litellm_provider": "cerebras", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "friendliai/meta-llama-3.1-8b-instruct": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "friendliai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_system_messages": true, "supports_response_schema": true, "supports_tool_choice": true }, "friendliai/meta-llama-3.1-70b-instruct": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006, "litellm_provider": "friendliai", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_system_messages": true, "supports_response_schema": true, "supports_tool_choice": true }, "claude-instant-1.2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000000163, "output_cost_per_token": 0.000000551, "litellm_provider": "anthropic", "mode": "chat", "supports_tool_choice": true }, "claude-2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "anthropic", "mode": "chat" }, "claude-2.1": { "max_tokens": 8191, "max_input_tokens": 200000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "anthropic", "mode": "chat", "supports_tool_choice": true }, "claude-3-haiku-20240307": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "cache_creation_input_token_cost": 0.0000003, "cache_read_input_token_cost": 0.00000003, 
"litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 264, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2025-03-01", "supports_tool_choice": true }, "claude-3-5-haiku-20241022": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "cache_creation_input_token_cost": 0.00000125, "cache_read_input_token_cost": 0.0000001, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, "tool_use_system_prompt_tokens": 264, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2025-10-01", "supports_tool_choice": true }, "claude-3-opus-20240229": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "cache_creation_input_token_cost": 0.00001875, "cache_read_input_token_cost": 0.0000015, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 395, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2025-03-01", "supports_tool_choice": true }, "claude-3-sonnet-20240229": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 159, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2025-07-21", "supports_tool_choice": true }, "claude-3-5-sonnet-20240620": { "max_tokens": 8192, 
"max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_creation_input_token_cost": 0.00000375, "cache_read_input_token_cost": 0.0000003, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 159, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2025-06-01", "supports_tool_choice": true }, "claude-3-5-sonnet-20241022": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "cache_creation_input_token_cost": 0.00000375, "cache_read_input_token_cost": 0.0000003, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 159, "supports_assistant_prefill": true, "supports_pdf_input": true, "supports_prompt_caching": true, "supports_response_schema": true, "deprecation_date": "2025-10-01", "supports_tool_choice": true }, "text-bison": { "max_tokens": 2048, "max_input_tokens": 8192, "max_output_tokens": 2048, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "text-bison@001": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "text-bison@002": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, 
"litellm_provider": "vertex_ai-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "text-bison32k": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "text-bison32k@002": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "text-unicorn": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.000028, "litellm_provider": "vertex_ai-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "text-unicorn@001": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.000028, "litellm_provider": "vertex_ai-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "chat-bison": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-chat-models", "mode": "chat", "source": 
"https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "chat-bison@001": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "chat-bison@002": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "deprecation_date": "2025-04-09", "supports_tool_choice": true }, "chat-bison-32k": { "max_tokens": 8192, "max_input_tokens": 32000, "max_output_tokens": 8192, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "chat-bison-32k@002": { "max_tokens": 8192, "max_input_tokens": 32000, "max_output_tokens": 8192, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "code-bison": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 
1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-text-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "code-bison@001": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "code-bison@002": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "code-bison32k": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "code-bison-32k@002": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": 
"https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "code-gecko@001": { "max_tokens": 64, "max_input_tokens": 2048, "max_output_tokens": 64, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "code-gecko@002": { "max_tokens": 64, "max_input_tokens": 2048, "max_output_tokens": 64, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "code-gecko": { "max_tokens": 64, "max_input_tokens": 2048, "max_output_tokens": 64, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "code-gecko-latest": { "max_tokens": 64, "max_input_tokens": 2048, "max_output_tokens": 64, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "vertex_ai-code-text-models", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "codechat-bison@latest": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "codechat-bison": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, 
"input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "codechat-bison@001": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "codechat-bison@002": { "max_tokens": 1024, "max_input_tokens": 6144, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "codechat-bison-32k": { "max_tokens": 8192, "max_input_tokens": 32000, "max_output_tokens": 8192, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": "vertex_ai-code-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "codechat-bison-32k@002": { "max_tokens": 8192, "max_input_tokens": 32000, "max_output_tokens": 8192, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "input_cost_per_character": 0.00000025, "output_cost_per_character": 0.0000005, "litellm_provider": 
"vertex_ai-code-chat-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini-pro": { "max_tokens": 8192, "max_input_tokens": 32760, "max_output_tokens": 8192, "input_cost_per_image": 0.0025, "input_cost_per_video_per_second": 0.002, "input_cost_per_token": 0.0000005, "input_cost_per_character": 0.000000125, "output_cost_per_token": 0.0000015, "output_cost_per_character": 0.000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing", "supports_tool_choice": true }, "gemini-1.0-pro": { "max_tokens": 8192, "max_input_tokens": 32760, "max_output_tokens": 8192, "input_cost_per_image": 0.0025, "input_cost_per_video_per_second": 0.002, "input_cost_per_token": 0.0000005, "input_cost_per_character": 0.000000125, "output_cost_per_token": 0.0000015, "output_cost_per_character": 0.000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#google_models", "supports_tool_choice": true }, "gemini-1.0-pro-001": { "max_tokens": 8192, "max_input_tokens": 32760, "max_output_tokens": 8192, "input_cost_per_image": 0.0025, "input_cost_per_video_per_second": 0.002, "input_cost_per_token": 0.0000005, "input_cost_per_character": 0.000000125, "output_cost_per_token": 0.0000015, "output_cost_per_character": 0.000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "deprecation_date": "2025-04-09", "supports_tool_choice": true }, "gemini-1.0-ultra": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 2048, "input_cost_per_image": 0.0025, "input_cost_per_video_per_second": 0.002, 
"input_cost_per_token": 0.0000005, "input_cost_per_character": 0.000000125, "output_cost_per_token": 0.0000015, "output_cost_per_character": 0.000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": true, "source": "As of Jun, 2024. There is no available doc on vertex ai pricing gemini-1.0-ultra-001. Using gemini-1.0-pro pricing. Got max_tokens info here: https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini-1.0-ultra-001": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 2048, "input_cost_per_image": 0.0025, "input_cost_per_video_per_second": 0.002, "input_cost_per_token": 0.0000005, "input_cost_per_character": 0.000000125, "output_cost_per_token": 0.0000015, "output_cost_per_character": 0.000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": true, 
"source": "As of Jun, 2024. There is no available doc on vertex ai pricing gemini-1.0-ultra-001. Using gemini-1.0-pro pricing. Got max_tokens info here: https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini-1.0-pro-002": { "max_tokens": 8192, "max_input_tokens": 32760, "max_output_tokens": 8192, "input_cost_per_image": 0.0025, "input_cost_per_video_per_second": 0.002, "input_cost_per_token": 0.0000005, "input_cost_per_character": 0.000000125, "output_cost_per_token": 0.0000015, "output_cost_per_character": 0.000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "deprecation_date": "2025-04-09", "supports_tool_choice": true }, "gemini-1.5-pro": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "input_cost_per_image": 0.00032875, "input_cost_per_audio_per_second": 0.00003125, "input_cost_per_video_per_second": 0.00032875, "input_cost_per_token": 0.00000125, "input_cost_per_character": 0.0000003125, "input_cost_per_image_above_128k_tokens": 0.0006575, "input_cost_per_video_per_second_above_128k_tokens": 0.0006575, "input_cost_per_audio_per_second_above_128k_tokens": 0.0000625, "input_cost_per_token_above_128k_tokens": 0.0000025, "input_cost_per_character_above_128k_tokens": 0.000000625, "output_cost_per_token": 0.000005, "output_cost_per_character": 0.00000125, "output_cost_per_token_above_128k_tokens": 0.00001, "output_cost_per_character_above_128k_tokens": 0.0000025, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_vision": true, "supports_pdf_input": true, "supports_system_messages": true, "supports_function_calling": true, "supports_tool_choice": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "gemini-1.5-pro-002": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "input_cost_per_image": 
0.00032875, "input_cost_per_audio_per_second": 0.00003125, "input_cost_per_video_per_second": 0.00032875, "input_cost_per_token": 0.00000125, "input_cost_per_character": 0.0000003125, "input_cost_per_image_above_128k_tokens": 0.0006575, "input_cost_per_video_per_second_above_128k_tokens": 0.0006575, "input_cost_per_audio_per_second_above_128k_tokens": 0.0000625, "input_cost_per_token_above_128k_tokens": 0.0000025, "input_cost_per_character_above_128k_tokens": 0.000000625, "output_cost_per_token": 0.000005, "output_cost_per_character": 0.00000125, "output_cost_per_token_above_128k_tokens": 0.00001, "output_cost_per_character_above_128k_tokens": 0.0000025, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_vision": true, "supports_system_messages": true, "supports_function_calling": true, "supports_tool_choice": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-1.5-pro", "deprecation_date": "2025-09-24" }, "gemini-1.5-pro-001": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_image": 0.00032875, "input_cost_per_audio_per_second": 0.00003125, "input_cost_per_video_per_second": 0.00032875, "input_cost_per_token": 0.00000125, "input_cost_per_character": 0.0000003125, "input_cost_per_image_above_128k_tokens": 0.0006575, "input_cost_per_video_per_second_above_128k_tokens": 0.0006575, "input_cost_per_audio_per_second_above_128k_tokens": 0.0000625, "input_cost_per_token_above_128k_tokens": 0.0000025, "input_cost_per_character_above_128k_tokens": 0.000000625, "output_cost_per_token": 0.000005, "output_cost_per_character": 0.00000125, "output_cost_per_token_above_128k_tokens": 0.00001, "output_cost_per_character_above_128k_tokens": 0.0000025, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_vision": true, "supports_system_messages": true, "supports_function_calling": true, "supports_tool_choice": true, 
"supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "deprecation_date": "2025-05-24" }, "gemini-1.5-pro-preview-0514": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_image": 0.00032875, "input_cost_per_audio_per_second": 0.00003125, "input_cost_per_video_per_second": 0.00032875, "input_cost_per_token": 0.000000078125, "input_cost_per_character": 0.0000003125, "input_cost_per_image_above_128k_tokens": 0.0006575, "input_cost_per_video_per_second_above_128k_tokens": 0.0006575, "input_cost_per_audio_per_second_above_128k_tokens": 0.0000625, "input_cost_per_token_above_128k_tokens": 0.00000015625, "input_cost_per_character_above_128k_tokens": 0.000000625, "output_cost_per_token": 0.0000003125, "output_cost_per_character": 0.00000125, "output_cost_per_token_above_128k_tokens": 0.000000625, "output_cost_per_character_above_128k_tokens": 0.0000025, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_tool_choice": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "gemini-1.5-pro-preview-0215": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_image": 0.00032875, "input_cost_per_audio_per_second": 0.00003125, "input_cost_per_video_per_second": 0.00032875, "input_cost_per_token": 0.000000078125, "input_cost_per_character": 0.0000003125, "input_cost_per_image_above_128k_tokens": 0.0006575, "input_cost_per_video_per_second_above_128k_tokens": 0.0006575, "input_cost_per_audio_per_second_above_128k_tokens": 0.0000625, "input_cost_per_token_above_128k_tokens": 0.00000015625, "input_cost_per_character_above_128k_tokens": 0.000000625, "output_cost_per_token": 0.0000003125, "output_cost_per_character": 0.00000125, 
"output_cost_per_token_above_128k_tokens": 0.000000625, "output_cost_per_character_above_128k_tokens": 0.0000025, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_tool_choice": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "gemini-1.5-pro-preview-0409": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_image": 0.00032875, "input_cost_per_audio_per_second": 0.00003125, "input_cost_per_video_per_second": 0.00032875, "input_cost_per_token": 0.000000078125, "input_cost_per_character": 0.0000003125, "input_cost_per_image_above_128k_tokens": 0.0006575, "input_cost_per_video_per_second_above_128k_tokens": 0.0006575, "input_cost_per_audio_per_second_above_128k_tokens": 0.0000625, "input_cost_per_token_above_128k_tokens": 0.00000015625, "input_cost_per_character_above_128k_tokens": 0.000000625, "output_cost_per_token": 0.0000003125, "output_cost_per_character": 0.00000125, "output_cost_per_token_above_128k_tokens": 0.000000625, "output_cost_per_character_above_128k_tokens": 0.0000025, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "gemini-1.5-flash": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0.00002, "input_cost_per_video_per_second": 0.00002, "input_cost_per_audio_per_second": 0.000002, "input_cost_per_token": 0.000000075, "input_cost_per_character": 0.00000001875, "input_cost_per_token_above_128k_tokens": 
0.000001, "input_cost_per_character_above_128k_tokens": 0.00000025, "input_cost_per_image_above_128k_tokens": 0.00004, "input_cost_per_video_per_second_above_128k_tokens": 0.00004, "input_cost_per_audio_per_second_above_128k_tokens": 0.000004, "output_cost_per_token": 0.0000003, "output_cost_per_character": 0.000000075, "output_cost_per_token_above_128k_tokens": 0.0000006, "output_cost_per_character_above_128k_tokens": 0.00000015, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini-1.5-flash-exp-0827": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0.00002, "input_cost_per_video_per_second": 0.00002, "input_cost_per_audio_per_second": 0.000002, "input_cost_per_token": 0.000000004688, "input_cost_per_character": 0.00000001875, "input_cost_per_token_above_128k_tokens": 0.000001, "input_cost_per_character_above_128k_tokens": 0.00000025, "input_cost_per_image_above_128k_tokens": 0.00004, "input_cost_per_video_per_second_above_128k_tokens": 0.00004, "input_cost_per_audio_per_second_above_128k_tokens": 0.000004, "output_cost_per_token": 0.0000000046875, "output_cost_per_character": 0.00000001875, "output_cost_per_token_above_128k_tokens": 0.000000009375, "output_cost_per_character_above_128k_tokens": 0.0000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "source": 
"https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini-1.5-flash-002": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0.00002, "input_cost_per_video_per_second": 0.00002, "input_cost_per_audio_per_second": 0.000002, "input_cost_per_token": 0.000000075, "input_cost_per_character": 0.00000001875, "input_cost_per_token_above_128k_tokens": 0.000001, "input_cost_per_character_above_128k_tokens": 0.00000025, "input_cost_per_image_above_128k_tokens": 0.00004, "input_cost_per_video_per_second_above_128k_tokens": 0.00004, "input_cost_per_audio_per_second_above_128k_tokens": 0.000004, "output_cost_per_token": 0.0000003, "output_cost_per_character": 0.000000075, "output_cost_per_token_above_128k_tokens": 0.0000006, "output_cost_per_character_above_128k_tokens": 0.00000015, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-1.5-flash", "deprecation_date": "2025-09-24", "supports_tool_choice": true }, "gemini-1.5-flash-001": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0.00002, "input_cost_per_video_per_second": 0.00002, "input_cost_per_audio_per_second": 0.000002, "input_cost_per_token": 0.000000075, "input_cost_per_character": 0.00000001875, "input_cost_per_token_above_128k_tokens": 0.000001, "input_cost_per_character_above_128k_tokens": 0.00000025, 
"input_cost_per_image_above_128k_tokens": 0.00004, "input_cost_per_video_per_second_above_128k_tokens": 0.00004, "input_cost_per_audio_per_second_above_128k_tokens": 0.000004, "output_cost_per_token": 0.0000003, "output_cost_per_character": 0.000000075, "output_cost_per_token_above_128k_tokens": 0.0000006, "output_cost_per_character_above_128k_tokens": 0.00000015, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "deprecation_date": "2025-05-24", "supports_tool_choice": true }, "gemini-1.5-flash-preview-0514": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0.00002, "input_cost_per_video_per_second": 0.00002, "input_cost_per_audio_per_second": 0.000002, "input_cost_per_token": 0.000000075, "input_cost_per_character": 0.00000001875, "input_cost_per_token_above_128k_tokens": 0.000001, "input_cost_per_character_above_128k_tokens": 0.00000025, "input_cost_per_image_above_128k_tokens": 0.00004, "input_cost_per_video_per_second_above_128k_tokens": 0.00004, "input_cost_per_audio_per_second_above_128k_tokens": 0.000004, "output_cost_per_token": 0.0000000046875, "output_cost_per_character": 0.00000001875, "output_cost_per_token_above_128k_tokens": 0.000000009375, "output_cost_per_character_above_128k_tokens": 0.0000000375, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, 
"gemini-pro-experimental": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0, "input_cost_per_character": 0, "output_cost_per_character": 0, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": false, "supports_tool_choice": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/multimodal/gemini-experimental" }, "gemini-flash-experimental": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0, "output_cost_per_token": 0, "input_cost_per_character": 0, "output_cost_per_character": 0, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_function_calling": false, "supports_tool_choice": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/multimodal/gemini-experimental" }, "gemini-pro-vision": { "max_tokens": 2048, "max_input_tokens": 16384, "max_output_tokens": 2048, "max_images_per_prompt": 16, "max_videos_per_prompt": 1, "max_video_length": 2, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "input_cost_per_image": 0.0025, "litellm_provider": "vertex_ai-vision-models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini-1.0-pro-vision": { "max_tokens": 2048, "max_input_tokens": 16384, "max_output_tokens": 2048, "max_images_per_prompt": 16, "max_videos_per_prompt": 1, "max_video_length": 2, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "input_cost_per_image": 0.0025, "litellm_provider": "vertex_ai-vision-models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, 
"gemini-1.0-pro-vision-001": { "max_tokens": 2048, "max_input_tokens": 16384, "max_output_tokens": 2048, "max_images_per_prompt": 16, "max_videos_per_prompt": 1, "max_video_length": 2, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "input_cost_per_image": 0.0025, "litellm_provider": "vertex_ai-vision-models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "deprecation_date": "2025-04-09", "supports_tool_choice": true }, "medlm-medium": { "max_tokens": 8192, "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_character": 0.0000005, "output_cost_per_character": 0.000001, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "medlm-large": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_character": 0.000005, "output_cost_per_character": 0.000015, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini-2.0-flash-exp": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0, "input_cost_per_video_per_second": 0, "input_cost_per_audio_per_second": 0, "input_cost_per_token": 0, "input_cost_per_character": 0, "input_cost_per_token_above_128k_tokens": 0, "input_cost_per_character_above_128k_tokens": 0, "input_cost_per_image_above_128k_tokens": 0, "input_cost_per_video_per_second_above_128k_tokens": 0, "input_cost_per_audio_per_second_above_128k_tokens": 0, 
"output_cost_per_token": 0, "output_cost_per_character": 0, "output_cost_per_token_above_128k_tokens": 0, "output_cost_per_character_above_128k_tokens": 0, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing", "supports_tool_choice": true }, "gemini/gemini-2.0-flash": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_audio_token": 0.0000007, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "litellm_provider": "gemini", "mode": "chat", "rpm": 10000, "tpm": 10000000, "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, "supports_tool_choice": true, "source": "https://ai.google.dev/pricing#2_0flash" }, "gemini-2.0-flash-001": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_audio_token": 0.000001, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, "supports_tool_choice": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "gemini-2.0-pro-exp-02-05": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, 
"max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_audio_token": 0.000001, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, "supports_tool_choice": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "gemini-2.0-flash-thinking-exp": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0, "input_cost_per_video_per_second": 0, "input_cost_per_audio_per_second": 0, "input_cost_per_token": 0, "input_cost_per_character": 0, "input_cost_per_token_above_128k_tokens": 0, "input_cost_per_character_above_128k_tokens": 0, "input_cost_per_image_above_128k_tokens": 0, "input_cost_per_video_per_second_above_128k_tokens": 0, "input_cost_per_audio_per_second_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_character": 0, "output_cost_per_token_above_128k_tokens": 0, "output_cost_per_character_above_128k_tokens": 0, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, "gemini-2.0-flash-thinking-exp-01-21": { "max_tokens": 65536, "max_input_tokens": 1048576, "max_output_tokens": 65536, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, 
"max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_image": 0, "input_cost_per_video_per_second": 0, "input_cost_per_audio_per_second": 0, "input_cost_per_token": 0, "input_cost_per_character": 0, "input_cost_per_token_above_128k_tokens": 0, "input_cost_per_character_above_128k_tokens": 0, "input_cost_per_image_above_128k_tokens": 0, "input_cost_per_video_per_second_above_128k_tokens": 0, "input_cost_per_audio_per_second_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_character": 0, "output_cost_per_token_above_128k_tokens": 0, "output_cost_per_character_above_128k_tokens": 0, "litellm_provider": "vertex_ai-language-models", "mode": "chat", "supports_system_messages": true, "supports_function_calling": false, "supports_vision": true, "supports_response_schema": false, "supports_audio_output": false, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, "gemini/gemini-2.0-flash-001": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_audio_token": 0.0000007, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000004, "litellm_provider": "gemini", "mode": "chat", "rpm": 10000, "tpm": 10000000, "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": false, "supports_tool_choice": true, "source": "https://ai.google.dev/pricing#2_0flash" }, "gemini/gemini-2.0-flash-exp": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, 
"input_cost_per_image": 0, "input_cost_per_video_per_second": 0, "input_cost_per_audio_per_second": 0, "input_cost_per_token": 0, "input_cost_per_character": 0, "input_cost_per_token_above_128k_tokens": 0, "input_cost_per_character_above_128k_tokens": 0, "input_cost_per_image_above_128k_tokens": 0, "input_cost_per_video_per_second_above_128k_tokens": 0, "input_cost_per_audio_per_second_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_character": 0, "output_cost_per_token_above_128k_tokens": 0, "output_cost_per_character_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, "tpm": 4000000, "rpm": 10, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, "gemini/gemini-2.0-flash-lite-preview-02-05": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_audio_token": 0.000000075, "input_cost_per_token": 0.000000075, "output_cost_per_token": 0.0000003, "litellm_provider": "gemini", "mode": "chat", "rpm": 60000, "tpm": 10000000, "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": false, "supports_tool_choice": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash-lite" }, "gemini/gemini-2.0-flash-thinking-exp": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, 
"input_cost_per_image": 0, "input_cost_per_video_per_second": 0, "input_cost_per_audio_per_second": 0, "input_cost_per_token": 0, "input_cost_per_character": 0, "input_cost_per_token_above_128k_tokens": 0, "input_cost_per_character_above_128k_tokens": 0, "input_cost_per_image_above_128k_tokens": 0, "input_cost_per_video_per_second_above_128k_tokens": 0, "input_cost_per_audio_per_second_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_character": 0, "output_cost_per_token_above_128k_tokens": 0, "output_cost_per_character_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_audio_output": true, "tpm": 4000000, "rpm": 10, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash", "supports_tool_choice": true }, "vertex_ai/claude-3-sonnet": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-sonnet@20240229": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-5-sonnet": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, 
"supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-5-sonnet@20240620": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-5-sonnet-v2": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-5-sonnet-v2@20241022": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-haiku": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-haiku@20240307": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-5-haiku": { 
"max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-5-haiku@20241022": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-opus": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/claude-3-opus@20240229": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "litellm_provider": "vertex_ai-anthropic_models", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_tool_choice": true }, "vertex_ai/meta/llama3-405b-instruct-maas": { "max_tokens": 32000, "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "vertex_ai-llama_models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models", "supports_tool_choice": true }, "vertex_ai/meta/llama3-70b-instruct-maas": { "max_tokens": 32000, "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "vertex_ai-llama_models", 
"mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models", "supports_tool_choice": true }, "vertex_ai/meta/llama3-8b-instruct-maas": { "max_tokens": 32000, "max_input_tokens": 32000, "max_output_tokens": 32000, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "vertex_ai-llama_models", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing#partner-models", "supports_tool_choice": true }, "vertex_ai/meta/llama-3.2-90b-vision-instruct-maas": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "vertex_ai-llama_models", "mode": "chat", "supports_system_messages": true, "supports_vision": true, "source": "https://console.cloud.google.com/vertex-ai/publishers/meta/model-garden/llama-3.2-90b-vision-instruct-maas", "supports_tool_choice": true }, "vertex_ai/mistral-large@latest": { "max_tokens": 8191, "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/mistral-large@2411-001": { "max_tokens": 8191, "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/mistral-large-2411": { "max_tokens": 8191, "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/mistral-large@2407": { "max_tokens": 8191, "max_input_tokens": 128000, "max_output_tokens": 8191, 
"input_cost_per_token": 0.000002, "output_cost_per_token": 0.000006, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/mistral-nemo@latest": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/jamba-1.5-mini@001": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004, "litellm_provider": "vertex_ai-ai21_models", "mode": "chat", "supports_tool_choice": true }, "vertex_ai/jamba-1.5-large@001": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "litellm_provider": "vertex_ai-ai21_models", "mode": "chat", "supports_tool_choice": true }, "vertex_ai/jamba-1.5": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004, "litellm_provider": "vertex_ai-ai21_models", "mode": "chat", "supports_tool_choice": true }, "vertex_ai/jamba-1.5-mini": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004, "litellm_provider": "vertex_ai-ai21_models", "mode": "chat", "supports_tool_choice": true }, "vertex_ai/jamba-1.5-large": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "litellm_provider": "vertex_ai-ai21_models", "mode": "chat", "supports_tool_choice": true }, "vertex_ai/mistral-nemo@2407": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, 
"input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/codestral@latest": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/codestral@2405": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/codestral-2501": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000006, "litellm_provider": "vertex_ai-mistral_models", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "vertex_ai/imagegeneration@006": { "output_cost_per_image": 0.020, "litellm_provider": "vertex_ai-image-models", "mode": "image_generation", "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "vertex_ai/imagen-3.0-generate-001": { "output_cost_per_image": 0.04, "litellm_provider": "vertex_ai-image-models", "mode": "image_generation", "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "vertex_ai/imagen-3.0-fast-generate-001": { "output_cost_per_image": 0.02, "litellm_provider": "vertex_ai-image-models", "mode": "image_generation", "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "text-embedding-004": { "max_tokens": 2048, "max_input_tokens": 2048, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, 
"litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models" }, "text-embedding-005": { "max_tokens": 2048, "max_input_tokens": 2048, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models" }, "text-multilingual-embedding-002": { "max_tokens": 2048, "max_input_tokens": 2048, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models" }, "textembedding-gecko": { "max_tokens": 3072, "max_input_tokens": 3072, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "textembedding-gecko-multilingual": { "max_tokens": 3072, "max_input_tokens": 3072, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "textembedding-gecko-multilingual@001": { "max_tokens": 3072, "max_input_tokens": 3072, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": 
"https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "textembedding-gecko@001": { "max_tokens": 3072, "max_input_tokens": 3072, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "textembedding-gecko@003": { "max_tokens": 3072, "max_input_tokens": 3072, "output_vector_size": 768, "input_cost_per_character": 0.000000025, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "text-embedding-preview-0409": { "max_tokens": 3072, "max_input_tokens": 3072, "output_vector_size": 768, "input_cost_per_token": 0.00000000625, "input_cost_per_token_batch_requests": 0.000000005, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/pricing" }, "text-multilingual-embedding-preview-0409":{ "max_tokens": 3072, "max_input_tokens": 3072, "output_vector_size": 768, "input_cost_per_token": 0.00000000625, "output_cost_per_token": 0, "litellm_provider": "vertex_ai-embedding-models", "mode": "embedding", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "palm/chat-bison": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "palm", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "palm/chat-bison-001": { "max_tokens": 4096, "max_input_tokens": 8192, "max_output_tokens": 4096, 
"input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "palm", "mode": "chat", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "palm/text-bison": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "palm", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "palm/text-bison-001": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "palm", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "palm/text-bison-safety-off": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "palm", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "palm/text-bison-safety-recitation-off": { "max_tokens": 1024, "max_input_tokens": 8192, "max_output_tokens": 1024, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000125, "litellm_provider": "palm", "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, "gemini/gemini-1.5-flash-002": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "cache_read_input_token_cost": 0.00000001875, "cache_creation_input_token_cost": 0.000001, "input_cost_per_token": 0.000000075, "input_cost_per_token_above_128k_tokens": 0.00000015, 
"output_cost_per_token": 0.0000003, "output_cost_per_token_above_128k_tokens": 0.0000006, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_prompt_caching": true, "tpm": 4000000, "rpm": 2000, "source": "https://ai.google.dev/pricing", "deprecation_date": "2025-09-24", "supports_tool_choice": true }, "gemini/gemini-1.5-flash-001": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "cache_read_input_token_cost": 0.00000001875, "cache_creation_input_token_cost": 0.000001, "input_cost_per_token": 0.000000075, "input_cost_per_token_above_128k_tokens": 0.00000015, "output_cost_per_token": 0.0000003, "output_cost_per_token_above_128k_tokens": 0.0000006, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_prompt_caching": true, "tpm": 4000000, "rpm": 2000, "source": "https://ai.google.dev/pricing", "deprecation_date": "2025-05-24", "supports_tool_choice": true }, "gemini/gemini-1.5-flash": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0.000000075, "input_cost_per_token_above_128k_tokens": 0.00000015, "output_cost_per_token": 0.0000003, "output_cost_per_token_above_128k_tokens": 0.0000006, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 2000, "source": 
"https://ai.google.dev/pricing", "supports_tool_choice": true }, "gemini/gemini-1.5-flash-latest": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0.000000075, "input_cost_per_token_above_128k_tokens": 0.00000015, "output_cost_per_token": 0.0000003, "output_cost_per_token_above_128k_tokens": 0.0000006, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_prompt_caching": true, "tpm": 4000000, "rpm": 2000, "source": "https://ai.google.dev/pricing", "supports_tool_choice": true }, "gemini/gemini-1.5-flash-8b": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_token_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_prompt_caching": true, "tpm": 4000000, "rpm": 4000, "source": "https://ai.google.dev/pricing", "supports_tool_choice": true }, "gemini/gemini-1.5-flash-8b-exp-0924": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_token_above_128k_tokens": 0, 
"litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "supports_prompt_caching": true, "tpm": 4000000, "rpm": 4000, "source": "https://ai.google.dev/pricing", "supports_tool_choice": true }, "gemini/gemini-exp-1114": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_token_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_tool_choice": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing", "metadata": { "notes": "Rate limits not documented for gemini-exp-1114. Assuming same as gemini-1.5-pro.", "supports_tool_choice": true } }, "gemini/gemini-exp-1206": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_token_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_tool_choice": true, "supports_vision": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing", "metadata": { "notes": "Rate limits not documented for gemini-exp-1206. 
Assuming same as gemini-1.5-pro.", "supports_tool_choice": true } }, "gemini/gemini-1.5-flash-exp-0827": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_token_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 2000, "source": "https://ai.google.dev/pricing", "supports_tool_choice": true }, "gemini/gemini-1.5-flash-8b-exp-0827": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, "max_video_length": 1, "max_audio_length_hours": 8.4, "max_audio_per_prompt": 1, "max_pdf_size_mb": 30, "input_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_token_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 4000, "source": "https://ai.google.dev/pricing", "supports_tool_choice": true }, "gemini/gemini-pro": { "max_tokens": 8192, "max_input_tokens": 32760, "max_output_tokens": 8192, "input_cost_per_token": 0.00000035, "input_cost_per_token_above_128k_tokens": 0.0000007, "output_cost_per_token": 0.00000105, "output_cost_per_token_above_128k_tokens": 0.0000021, "litellm_provider": "gemini", "mode": "chat", "supports_function_calling": true, "rpd": 30000, "tpm": 120000, "rpm": 360, "source": "https://ai.google.dev/gemini-api/docs/models/gemini", "supports_tool_choice": true }, "gemini/gemini-1.5-pro": { 
"max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "input_cost_per_token": 0.0000035, "input_cost_per_token_above_128k_tokens": 0.000007, "output_cost_per_token": 0.0000105, "output_cost_per_token_above_128k_tokens": 0.000021, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing" }, "gemini/gemini-1.5-pro-002": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "input_cost_per_token": 0.0000035, "input_cost_per_token_above_128k_tokens": 0.000007, "output_cost_per_token": 0.0000105, "output_cost_per_token_above_128k_tokens": 0.000021, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true, "supports_response_schema": true, "supports_prompt_caching": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing", "deprecation_date": "2025-09-24" }, "gemini/gemini-1.5-pro-001": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "input_cost_per_token": 0.0000035, "input_cost_per_token_above_128k_tokens": 0.000007, "output_cost_per_token": 0.0000105, "output_cost_per_token_above_128k_tokens": 0.000021, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true, "supports_response_schema": true, "supports_prompt_caching": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing", "deprecation_date": "2025-05-24" }, "gemini/gemini-1.5-pro-exp-0801": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "input_cost_per_token": 0.0000035, "input_cost_per_token_above_128k_tokens": 0.000007, 
"output_cost_per_token": 0.0000105, "output_cost_per_token_above_128k_tokens": 0.000021, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing" }, "gemini/gemini-1.5-pro-exp-0827": { "max_tokens": 8192, "max_input_tokens": 2097152, "max_output_tokens": 8192, "input_cost_per_token": 0, "input_cost_per_token_above_128k_tokens": 0, "output_cost_per_token": 0, "output_cost_per_token_above_128k_tokens": 0, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing" }, "gemini/gemini-1.5-pro-latest": { "max_tokens": 8192, "max_input_tokens": 1048576, "max_output_tokens": 8192, "input_cost_per_token": 0.0000035, "input_cost_per_token_above_128k_tokens": 0.000007, "output_cost_per_token": 0.00000105, "output_cost_per_token_above_128k_tokens": 0.000021, "litellm_provider": "gemini", "mode": "chat", "supports_system_messages": true, "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true, "supports_response_schema": true, "tpm": 4000000, "rpm": 1000, "source": "https://ai.google.dev/pricing" }, "gemini/gemini-pro-vision": { "max_tokens": 2048, "max_input_tokens": 30720, "max_output_tokens": 2048, "input_cost_per_token": 0.00000035, "input_cost_per_token_above_128k_tokens": 0.0000007, "output_cost_per_token": 0.00000105, "output_cost_per_token_above_128k_tokens": 0.0000021, "litellm_provider": "gemini", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "rpd": 30000, "tpm": 120000, "rpm": 360, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", 
"supports_tool_choice": true }, "gemini/gemini-gemma-2-27b-it": { "max_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000105, "litellm_provider": "gemini", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "gemini/gemini-gemma-2-9b-it": { "max_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000105, "litellm_provider": "gemini", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models", "supports_tool_choice": true }, "command-r": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "litellm_provider": "cohere_chat", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "command-r-08-2024": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000006, "litellm_provider": "cohere_chat", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "command-r7b-12-2024": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000000375, "litellm_provider": "cohere_chat", "mode": "chat", "supports_function_calling": true, "source": "https://docs.cohere.com/v2/docs/command-r7b", "supports_tool_choice": true }, "command-light": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006, "litellm_provider": "cohere_chat", "mode": "chat", "supports_tool_choice": true }, "command-r-plus": { 
"max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "litellm_provider": "cohere_chat", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "command-r-plus-08-2024": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.00001, "litellm_provider": "cohere_chat", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "command-nightly": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002, "litellm_provider": "cohere", "mode": "completion" }, "command": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000002, "litellm_provider": "cohere", "mode": "completion" }, "rerank-v3.5": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "max_query_tokens": 2048, "input_cost_per_token": 0.0, "input_cost_per_query": 0.002, "output_cost_per_token": 0.0, "litellm_provider": "cohere", "mode": "rerank" }, "rerank-english-v3.0": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "max_query_tokens": 2048, "input_cost_per_token": 0.0, "input_cost_per_query": 0.002, "output_cost_per_token": 0.0, "litellm_provider": "cohere", "mode": "rerank" }, "rerank-multilingual-v3.0": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "max_query_tokens": 2048, "input_cost_per_token": 0.0, "input_cost_per_query": 0.002, "output_cost_per_token": 0.0, "litellm_provider": "cohere", "mode": "rerank" }, "rerank-english-v2.0": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "max_query_tokens": 2048, "input_cost_per_token": 0.0, "input_cost_per_query": 0.002, "output_cost_per_token": 0.0, 
"litellm_provider": "cohere", "mode": "rerank" }, "rerank-multilingual-v2.0": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "max_query_tokens": 2048, "input_cost_per_token": 0.0, "input_cost_per_query": 0.002, "output_cost_per_token": 0.0, "litellm_provider": "cohere", "mode": "rerank" }, "embed-english-light-v3.0": { "max_tokens": 1024, "max_input_tokens": 1024, "input_cost_per_token": 0.00000010, "output_cost_per_token": 0.00000, "litellm_provider": "cohere", "mode": "embedding" }, "embed-multilingual-v3.0": { "max_tokens": 1024, "max_input_tokens": 1024, "input_cost_per_token": 0.00000010, "output_cost_per_token": 0.00000, "litellm_provider": "cohere", "mode": "embedding" }, "embed-english-v2.0": { "max_tokens": 4096, "max_input_tokens": 4096, "input_cost_per_token": 0.00000010, "output_cost_per_token": 0.00000, "litellm_provider": "cohere", "mode": "embedding" }, "embed-english-light-v2.0": { "max_tokens": 1024, "max_input_tokens": 1024, "input_cost_per_token": 0.00000010, "output_cost_per_token": 0.00000, "litellm_provider": "cohere", "mode": "embedding" }, "embed-multilingual-v2.0": { "max_tokens": 768, "max_input_tokens": 768, "input_cost_per_token": 0.00000010, "output_cost_per_token": 0.00000, "litellm_provider": "cohere", "mode": "embedding" }, "embed-english-v3.0": { "max_tokens": 1024, "max_input_tokens": 1024, "input_cost_per_token": 0.00000010, "input_cost_per_image": 0.0001, "output_cost_per_token": 0.00000, "litellm_provider": "cohere", "mode": "embedding", "supports_image_input": true, "supports_embedding_image_input": true, "metadata": { "notes": "'supports_image_input' is a deprecated field. Use 'supports_embedding_image_input' instead." 
} }, "replicate/meta/llama-2-13b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000005, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-2-13b-chat": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000005, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-2-70b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000275, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-2-70b-chat": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000275, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-2-7b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-2-7b-chat": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-3-70b": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000275, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-3-70b-instruct": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000065, 
"output_cost_per_token": 0.00000275, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-3-8b": { "max_tokens": 8086, "max_input_tokens": 8086, "max_output_tokens": 8086, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/meta/llama-3-8b-instruct": { "max_tokens": 8086, "max_input_tokens": 8086, "max_output_tokens": 8086, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/mistralai/mistral-7b-v0.1": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/mistralai/mistral-7b-instruct-v0.2": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000005, "output_cost_per_token": 0.00000025, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "replicate/mistralai/mixtral-8x7b-instruct-v0.1": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.000001, "litellm_provider": "replicate", "mode": "chat", "supports_tool_choice": true }, "openrouter/deepseek/deepseek-r1": { "max_tokens": 8192, "max_input_tokens": 65336, "max_output_tokens": 8192, "input_cost_per_token": 0.00000055, "input_cost_per_token_cache_hit": 0.00000014, "output_cost_per_token": 0.00000219, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_tool_choice": true, "supports_prompt_caching": true }, "openrouter/deepseek/deepseek-chat": { "max_tokens": 8192, "max_input_tokens": 65536, "max_output_tokens": 8192, 
"input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000028, "litellm_provider": "openrouter", "supports_prompt_caching": true, "mode": "chat", "supports_tool_choice": true }, "openrouter/deepseek/deepseek-coder": { "max_tokens": 8192, "max_input_tokens": 66000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000014, "output_cost_per_token": 0.00000028, "litellm_provider": "openrouter", "supports_prompt_caching": true, "mode": "chat", "supports_tool_choice": true }, "openrouter/microsoft/wizardlm-2-8x22b:nitro": { "max_tokens": 65536, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/google/gemini-pro-1.5": { "max_tokens": 8192, "max_input_tokens": 1000000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000025, "output_cost_per_token": 0.0000075, "input_cost_per_image": 0.00265, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "openrouter/mistralai/mixtral-8x22b-instruct": { "max_tokens": 65536, "input_cost_per_token": 0.00000065, "output_cost_per_token": 0.00000065, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/cohere/command-r-plus": { "max_tokens": 128000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/databricks/dbrx-instruct": { "max_tokens": 32768, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/anthropic/claude-3-haiku": { "max_tokens": 200000, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "input_cost_per_image": 0.0004, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, 
"supports_tool_choice": true }, "openrouter/anthropic/claude-3-5-haiku": { "max_tokens": 200000, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "openrouter/anthropic/claude-3-haiku-20240307": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 264, "supports_tool_choice": true }, "openrouter/anthropic/claude-3-5-haiku-20241022": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "tool_use_system_prompt_tokens": 264, "supports_tool_choice": true }, "openrouter/anthropic/claude-3.5-sonnet": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 159, "supports_assistant_prefill": true, "supports_tool_choice": true }, "openrouter/anthropic/claude-3.5-sonnet:beta": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 159, "supports_tool_choice": true }, "openrouter/anthropic/claude-3-sonnet": { "max_tokens": 200000, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "input_cost_per_image": 0.0048, "litellm_provider": "openrouter", "mode": 
"chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "openrouter/mistralai/mistral-large": { "max_tokens": 32000, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/cognitivecomputations/dolphin-mixtral-8x7b": { "max_tokens": 32769, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/google/gemini-pro-vision": { "max_tokens": 45875, "input_cost_per_token": 0.000000125, "output_cost_per_token": 0.000000375, "input_cost_per_image": 0.0025, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "openrouter/fireworks/firellava-13b": { "max_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/meta-llama/llama-3-8b-instruct:free": { "max_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/meta-llama/llama-3-8b-instruct:extended": { "max_tokens": 16384, "input_cost_per_token": 0.000000225, "output_cost_per_token": 0.00000225, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/meta-llama/llama-3-70b-instruct:nitro": { "max_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/meta-llama/llama-3-70b-instruct": { "max_tokens": 8192, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000079, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/openai/o1": { 
"max_tokens": 100000, "max_input_tokens": 200000, "max_output_tokens": 100000, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.00006, "cache_read_input_token_cost": 0.0000075, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_prompt_caching": true, "supports_system_messages": true, "supports_response_schema": true, "supports_tool_choice": true }, "openrouter/openai/o1-mini": { "max_tokens": 65536, "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000012, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_tool_choice": true }, "openrouter/openai/o1-mini-2024-09-12": { "max_tokens": 65536, "max_input_tokens": 128000, "max_output_tokens": 65536, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000012, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_tool_choice": true }, "openrouter/openai/o1-preview": { "max_tokens": 32768, "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_tool_choice": true }, "openrouter/openai/o1-preview-2024-09-12": { "max_tokens": 32768, "max_input_tokens": 128000, "max_output_tokens": 32768, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000060, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": false, "supports_tool_choice": true }, "openrouter/openai/gpt-4o": { 
"max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "openrouter/openai/gpt-4o-2024-05-13": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000015, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "openrouter/openai/gpt-4-vision-preview": { "max_tokens": 130000, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00003, "input_cost_per_image": 0.01445, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_tool_choice": true }, "openrouter/openai/gpt-3.5-turbo": { "max_tokens": 4095, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000002, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/openai/gpt-3.5-turbo-16k": { "max_tokens": 16383, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000004, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/openai/gpt-4": { "max_tokens": 8192, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.00006, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/anthropic/claude-instant-v1": { "max_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000163, "output_cost_per_token": 0.00000551, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/anthropic/claude-2": { "max_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.00001102, 
"output_cost_per_token": 0.00003268, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/anthropic/claude-3-opus": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "litellm_provider": "openrouter", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "tool_use_system_prompt_tokens": 395, "supports_tool_choice": true }, "openrouter/google/palm-2-chat-bison": { "max_tokens": 25804, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/google/palm-2-codechat-bison": { "max_tokens": 20070, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/meta-llama/llama-2-13b-chat": { "max_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/meta-llama/llama-2-70b-chat": { "max_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.0000015, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/meta-llama/codellama-34b-instruct": { "max_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/nousresearch/nous-hermes-llama2-13b": { "max_tokens": 4096, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/mancer/weaver": { "max_tokens": 8000, "input_cost_per_token": 0.000005625, "output_cost_per_token": 0.000005625, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": 
true }, "openrouter/gryphe/mythomax-l2-13b": { "max_tokens": 8192, "input_cost_per_token": 0.000001875, "output_cost_per_token": 0.000001875, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/jondurbin/airoboros-l2-70b-2.1": { "max_tokens": 4096, "input_cost_per_token": 0.000013875, "output_cost_per_token": 0.000013875, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/undi95/remm-slerp-l2-13b": { "max_tokens": 6144, "input_cost_per_token": 0.000001875, "output_cost_per_token": 0.000001875, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/pygmalionai/mythalion-13b": { "max_tokens": 4096, "input_cost_per_token": 0.000001875, "output_cost_per_token": 0.000001875, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/mistralai/mistral-7b-instruct": { "max_tokens": 8192, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/mistralai/mistral-7b-instruct:free": { "max_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "openrouter/qwen/qwen-2.5-coder-32b-instruct": { "max_tokens": 33792, "max_input_tokens": 33792, "max_output_tokens": 33792, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018, "litellm_provider": "openrouter", "mode": "chat", "supports_tool_choice": true }, "j2-ultra": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000015, "litellm_provider": "ai21", "mode": "completion" }, "jamba-1.5-mini@001": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004, "litellm_provider": 
"ai21", "mode": "chat", "supports_tool_choice": true }, "jamba-1.5-large@001": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "litellm_provider": "ai21", "mode": "chat", "supports_tool_choice": true }, "jamba-1.5": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004, "litellm_provider": "ai21", "mode": "chat", "supports_tool_choice": true }, "jamba-1.5-mini": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000004, "litellm_provider": "ai21", "mode": "chat", "supports_tool_choice": true }, "jamba-1.5-large": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "litellm_provider": "ai21", "mode": "chat", "supports_tool_choice": true }, "j2-mid": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00001, "output_cost_per_token": 0.00001, "litellm_provider": "ai21", "mode": "completion" }, "j2-light": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003, "litellm_provider": "ai21", "mode": "completion" }, "dolphin": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005, "litellm_provider": "nlp_cloud", "mode": "completion" }, "chatdolphin": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005, "litellm_provider": "nlp_cloud", "mode": "chat" }, "luminous-base": { "max_tokens": 2048, "input_cost_per_token": 0.00003, "output_cost_per_token": 0.000033, 
"litellm_provider": "aleph_alpha", "mode": "completion" }, "luminous-base-control": { "max_tokens": 2048, "input_cost_per_token": 0.0000375, "output_cost_per_token": 0.00004125, "litellm_provider": "aleph_alpha", "mode": "chat" }, "luminous-extended": { "max_tokens": 2048, "input_cost_per_token": 0.000045, "output_cost_per_token": 0.0000495, "litellm_provider": "aleph_alpha", "mode": "completion" }, "luminous-extended-control": { "max_tokens": 2048, "input_cost_per_token": 0.00005625, "output_cost_per_token": 0.000061875, "litellm_provider": "aleph_alpha", "mode": "chat" }, "luminous-supreme": { "max_tokens": 2048, "input_cost_per_token": 0.000175, "output_cost_per_token": 0.0001925, "litellm_provider": "aleph_alpha", "mode": "completion" }, "luminous-supreme-control": { "max_tokens": 2048, "input_cost_per_token": 0.00021875, "output_cost_per_token": 0.000240625, "litellm_provider": "aleph_alpha", "mode": "chat" }, "ai21.j2-mid-v1": { "max_tokens": 8191, "max_input_tokens": 8191, "max_output_tokens": 8191, "input_cost_per_token": 0.0000125, "output_cost_per_token": 0.0000125, "litellm_provider": "bedrock", "mode": "chat" }, "ai21.j2-ultra-v1": { "max_tokens": 8191, "max_input_tokens": 8191, "max_output_tokens": 8191, "input_cost_per_token": 0.0000188, "output_cost_per_token": 0.0000188, "litellm_provider": "bedrock", "mode": "chat" }, "ai21.jamba-instruct-v1:0": { "max_tokens": 4096, "max_input_tokens": 70000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000007, "litellm_provider": "bedrock", "mode": "chat", "supports_system_messages": true }, "ai21.jamba-1-5-large-v1:0": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000008, "litellm_provider": "bedrock", "mode": "chat" }, "ai21.jamba-1-5-mini-v1:0": { "max_tokens": 256000, "max_input_tokens": 256000, "max_output_tokens": 256000, "input_cost_per_token": 0.0000002, 
"output_cost_per_token": 0.0000004, "litellm_provider": "bedrock", "mode": "chat" }, "amazon.titan-text-lite-v1": { "max_tokens": 4000, "max_input_tokens": 42000, "max_output_tokens": 4000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000004, "litellm_provider": "bedrock", "mode": "chat" }, "amazon.titan-text-express-v1": { "max_tokens": 8000, "max_input_tokens": 42000, "max_output_tokens": 8000, "input_cost_per_token": 0.0000013, "output_cost_per_token": 0.0000017, "litellm_provider": "bedrock", "mode": "chat" }, "amazon.titan-text-premier-v1:0": { "max_tokens": 32000, "max_input_tokens": 42000, "max_output_tokens": 32000, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "litellm_provider": "bedrock", "mode": "chat" }, "amazon.titan-embed-text-v1": { "max_tokens": 8192, "max_input_tokens": 8192, "output_vector_size": 1536, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0, "litellm_provider": "bedrock", "mode": "embedding" }, "amazon.titan-embed-text-v2:0": { "max_tokens": 8192, "max_input_tokens": 8192, "output_vector_size": 1024, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0, "litellm_provider": "bedrock", "mode": "embedding" }, "amazon.titan-embed-image-v1": { "max_tokens": 128, "max_input_tokens": 128, "output_vector_size": 1024, "input_cost_per_token": 0.0000008, "input_cost_per_image": 0.00006, "output_cost_per_token": 0.0, "litellm_provider": "bedrock", "supports_image_input": true, "supports_embedding_image_input": true, "mode": "embedding", "source": "https://us-east-1.console.aws.amazon.com/bedrock/home?region=us-east-1#/providers?model=amazon.titan-image-generator-v1", "metadata": { "notes": "'supports_image_input' is a deprecated field. Use 'supports_embedding_image_input' instead." 
} }, "mistral.mistral-7b-instruct-v0:2": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000002, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "mistral.mixtral-8x7b-instruct-v0:1": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000007, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "mistral.mistral-large-2402-v1:0": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "mistral.mistral-large-2407-v1:0": { "max_tokens": 8191, "max_input_tokens": 128000, "max_output_tokens": 8191, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000009, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "mistral.mistral-small-2402-v1:0": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000003, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000007, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000045, "output_cost_per_token": 0.0000007, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, 
"bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000091, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000002, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.0000002, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.00000026, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/mistral.mistral-large-2402-v1:0": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "bedrock/us-west-2/mistral.mistral-large-2402-v1:0": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": true }, "bedrock/eu-west-3/mistral.mistral-large-2402-v1:0": { "max_tokens": 8191, "max_input_tokens": 32000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000104, "output_cost_per_token": 0.0000312, "litellm_provider": "bedrock", "mode": "chat", 
"supports_function_calling": true, "supports_tool_choice": true }, "amazon.nova-micro-v1:0": { "max_tokens": 4096, "max_input_tokens": 300000, "max_output_tokens": 4096, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.00000014, "litellm_provider": "bedrock_converse", "mode": "chat", "supports_function_calling": true, "supports_prompt_caching": true }, "us.amazon.nova-micro-v1:0": { "max_tokens": 4096, "max_input_tokens": 300000, "max_output_tokens": 4096, "input_cost_per_token": 0.000000035, "output_cost_per_token": 0.00000014, "litellm_provider": "bedrock_converse", "mode": "chat", "supports_function_calling": true, "supports_prompt_caching": true, "supports_response_schema": true }, "amazon.nova-lite-v1:0": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024, "litellm_provider": "bedrock_converse", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_pdf_input": true, "supports_prompt_caching": true }, "us.amazon.nova-lite-v1:0": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.00000024, "litellm_provider": "bedrock_converse", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_pdf_input": true, "supports_prompt_caching": true }, "amazon.nova-pro-v1:0": { "max_tokens": 4096, "max_input_tokens": 300000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032, "litellm_provider": "bedrock_converse", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_pdf_input": true, "supports_prompt_caching": true }, "us.amazon.nova-pro-v1:0": { "max_tokens": 4096, "max_input_tokens": 300000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000032, "litellm_provider": "bedrock_converse", "mode": 
"chat", "supports_function_calling": true, "supports_vision": true, "supports_pdf_input": true, "supports_prompt_caching": true }, "anthropic.claude-3-sonnet-20240229-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "anthropic.claude-3-5-sonnet-20240620-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "anthropic.claude-3-5-sonnet-20241022-v2:0": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "anthropic.claude-3-haiku-20240307-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "anthropic.claude-3-5-haiku-20241022-v1:0": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.000004, "litellm_provider": "bedrock", "mode": "chat", "supports_assistant_prefill": true, "supports_function_calling": true, "supports_response_schema": true, 
"supports_prompt_caching": true, "supports_tool_choice": true }, "anthropic.claude-3-opus-20240229-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "us.anthropic.claude-3-sonnet-20240229-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "us.anthropic.claude-3-5-sonnet-20240620-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "us.anthropic.claude-3-5-sonnet-20241022-v2:0": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "us.anthropic.claude-3-haiku-20240307-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, 
"us.anthropic.claude-3-5-haiku-20241022-v1:0": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.000004, "litellm_provider": "bedrock", "mode": "chat", "supports_assistant_prefill": true, "supports_function_calling": true, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "us.anthropic.claude-3-opus-20240229-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "eu.anthropic.claude-3-sonnet-20240229-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "eu.anthropic.claude-3-5-sonnet-20240620-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "eu.anthropic.claude-3-5-sonnet-20241022-v2:0": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "eu.anthropic.claude-3-haiku-20240307-v1:0": { 
"max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "eu.anthropic.claude-3-5-haiku-20241022-v1:0": { "max_tokens": 8192, "max_input_tokens": 200000, "max_output_tokens": 8192, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000125, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_assistant_prefill": true, "supports_prompt_caching": true, "supports_response_schema": true, "supports_tool_choice": true }, "eu.anthropic.claude-3-opus-20240229-v1:0": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.000015, "output_cost_per_token": 0.000075, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "supports_vision": true, "supports_tool_choice": true }, "anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-east-1/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 
0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0455, "output_cost_per_second": 0.0455, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02527, "output_cost_per_second": 0.02527, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/eu-central-1/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0415, "output_cost_per_second": 0.0415, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02305, "output_cost_per_second": 0.02305, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-east-1/1-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-east-1/6-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-west-2/1-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, 
"max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-west-2/6-month-commitment/anthropic.claude-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972, "litellm_provider": "bedrock", "mode": "chat" }, "anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0455, "output_cost_per_second": 0.0455, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02527, "output_cost_per_second": 0.02527, "litellm_provider": 
"bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0415, "output_cost_per_second": 0.0415, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02305, "output_cost_per_second": 0.02305, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/1-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/6-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/1-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/6-month-commitment/anthropic.claude-v2": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972, "litellm_provider": "bedrock", "mode": 
"chat", "supports_tool_choice": true }, "anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0455, "output_cost_per_second": 0.0455, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02527, "output_cost_per_second": 0.02527, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.000008, "output_cost_per_token": 0.000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, 
"bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0415, "output_cost_per_second": 0.0415, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.02305, "output_cost_per_second": 0.02305, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.0175, "output_cost_per_second": 0.0175, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00972, "output_cost_per_second": 0.00972, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, 
"bedrock/us-east-1/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.011, "output_cost_per_second": 0.011, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00611, "output_cost_per_second": 0.00611, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.011, "output_cost_per_second": 0.011, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.00611, "output_cost_per_second": 0.00611, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/us-west-2/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000024, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000223, "output_cost_per_token": 0.00000755, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, 
"bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.01475, "output_cost_per_second": 0.01475, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.008194, "output_cost_per_second": 0.008194, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_token": 0.00000248, "output_cost_per_token": 0.00000838, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.01635, "output_cost_per_second": 0.01635, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1": { "max_tokens": 8191, "max_input_tokens": 100000, "max_output_tokens": 8191, "input_cost_per_second": 0.009083, "output_cost_per_second": 0.009083, "litellm_provider": "bedrock", "mode": "chat", "supports_tool_choice": true }, "cohere.command-text-v14": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.0000020, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/*/1-month-commitment/cohere.command-text-v14": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.011, "output_cost_per_second": 0.011, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/*/6-month-commitment/cohere.command-text-v14": { 
"max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.0066027, "output_cost_per_second": 0.0066027, "litellm_provider": "bedrock", "mode": "chat" }, "cohere.command-light-text-v14": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/*/1-month-commitment/cohere.command-light-text-v14": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.001902, "output_cost_per_second": 0.001902, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/*/6-month-commitment/cohere.command-light-text-v14": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_second": 0.0011416, "output_cost_per_second": 0.0011416, "litellm_provider": "bedrock", "mode": "chat" }, "cohere.command-r-plus-v1:0": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000030, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", "mode": "chat" }, "cohere.command-r-v1:0": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000015, "litellm_provider": "bedrock", "mode": "chat" }, "cohere.embed-english-v3": { "max_tokens": 512, "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "bedrock", "mode": "embedding" }, "cohere.embed-multilingual-v3": { "max_tokens": 512, "max_input_tokens": 512, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "bedrock", "mode": "embedding" }, "meta.llama3-3-70b-instruct-v1:0": { "max_tokens": 4096, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000072, "output_cost_per_token": 0.00000072, "litellm_provider": 
"bedrock_converse", "mode": "chat" }, "meta.llama2-13b-chat-v1": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000075, "output_cost_per_token": 0.000001, "litellm_provider": "bedrock", "mode": "chat" }, "meta.llama2-70b-chat-v1": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000195, "output_cost_per_token": 0.00000256, "litellm_provider": "bedrock", "mode": "chat" }, "meta.llama3-8b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-east-1/meta.llama3-8b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-west-1/meta.llama3-8b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000006, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/ap-south-1/meta.llama3-8b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000036, "output_cost_per_token": 0.00000072, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/ca-central-1/meta.llama3-8b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000069, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/eu-west-1/meta.llama3-8b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000032, "output_cost_per_token": 0.00000065, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/eu-west-2/meta.llama3-8b-instruct-v1:0": { 
"max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000039, "output_cost_per_token": 0.00000078, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/sa-east-1/meta.llama3-8b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.00000101, "litellm_provider": "bedrock", "mode": "chat" }, "meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-east-1/meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/us-west-1/meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000265, "output_cost_per_token": 0.0000035, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/ap-south-1/meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000318, "output_cost_per_token": 0.0000042, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/ca-central-1/meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000305, "output_cost_per_token": 0.00000403, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/eu-west-1/meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000286, "output_cost_per_token": 0.00000378, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/eu-west-2/meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, 
"max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000345, "output_cost_per_token": 0.00000455, "litellm_provider": "bedrock", "mode": "chat" }, "bedrock/sa-east-1/meta.llama3-70b-instruct-v1:0": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000445, "output_cost_per_token": 0.00000588, "litellm_provider": "bedrock", "mode": "chat" }, "meta.llama3-1-8b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000022, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "us.meta.llama3-1-8b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000022, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "meta.llama3-1-70b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000099, "output_cost_per_token": 0.00000099, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "us.meta.llama3-1-70b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 2048, "input_cost_per_token": 0.00000099, "output_cost_per_token": 0.00000099, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "meta.llama3-1-405b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000532, "output_cost_per_token": 0.000016, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "us.meta.llama3-1-405b-instruct-v1:0": { "max_tokens": 128000, 
"max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000532, "output_cost_per_token": 0.000016, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "meta.llama3-2-1b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "us.meta.llama3-2-1b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "eu.meta.llama3-2-1b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "meta.llama3-2-3b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "us.meta.llama3-2-3b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "eu.meta.llama3-2-3b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000019, "output_cost_per_token": 0.00000019, "litellm_provider": "bedrock", "mode": "chat", 
"supports_function_calling": true, "supports_tool_choice": false }, "meta.llama3-2-11b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000035, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "us.meta.llama3-2-11b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000035, "output_cost_per_token": 0.00000035, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "meta.llama3-2-90b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "us.meta.llama3-2-90b-instruct-v1:0": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 4096, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000002, "litellm_provider": "bedrock", "mode": "chat", "supports_function_calling": true, "supports_tool_choice": false }, "512-x-512/50-steps/stability.stable-diffusion-xl-v0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.018, "litellm_provider": "bedrock", "mode": "image_generation" }, "512-x-512/max-steps/stability.stable-diffusion-xl-v0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.036, "litellm_provider": "bedrock", "mode": "image_generation" }, "max-x-max/50-steps/stability.stable-diffusion-xl-v0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.036, "litellm_provider": "bedrock", "mode": "image_generation" }, "max-x-max/max-steps/stability.stable-diffusion-xl-v0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.072, 
"litellm_provider": "bedrock", "mode": "image_generation" }, "1024-x-1024/50-steps/stability.stable-diffusion-xl-v1": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.04, "litellm_provider": "bedrock", "mode": "image_generation" }, "1024-x-1024/max-steps/stability.stable-diffusion-xl-v1": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.08, "litellm_provider": "bedrock", "mode": "image_generation" }, "stability.sd3-large-v1:0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.08, "litellm_provider": "bedrock", "mode": "image_generation" }, "stability.sd3-5-large-v1:0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.08, "litellm_provider": "bedrock", "mode": "image_generation" }, "stability.stable-image-core-v1:0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.04, "litellm_provider": "bedrock", "mode": "image_generation" }, "stability.stable-image-core-v1:1": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.04, "litellm_provider": "bedrock", "mode": "image_generation" }, "stability.stable-image-ultra-v1:0": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.14, "litellm_provider": "bedrock", "mode": "image_generation" }, "stability.stable-image-ultra-v1:1": { "max_tokens": 77, "max_input_tokens": 77, "output_cost_per_image": 0.14, "litellm_provider": "bedrock", "mode": "image_generation" }, "sagemaker/meta-textgeneration-llama-2-7b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000, "output_cost_per_token": 0.000, "litellm_provider": "sagemaker", "mode": "completion" }, "sagemaker/meta-textgeneration-llama-2-7b-f": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000, "output_cost_per_token": 0.000, "litellm_provider": "sagemaker", "mode": "chat" }, "sagemaker/meta-textgeneration-llama-2-13b": { 
"max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000, "output_cost_per_token": 0.000, "litellm_provider": "sagemaker", "mode": "completion" }, "sagemaker/meta-textgeneration-llama-2-13b-f": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000, "output_cost_per_token": 0.000, "litellm_provider": "sagemaker", "mode": "chat" }, "sagemaker/meta-textgeneration-llama-2-70b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000, "output_cost_per_token": 0.000, "litellm_provider": "sagemaker", "mode": "completion" }, "sagemaker/meta-textgeneration-llama-2-70b-b-f": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000, "output_cost_per_token": 0.000, "litellm_provider": "sagemaker", "mode": "chat" }, "together-ai-up-to-4b": { "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "together_ai", "mode": "chat" }, "together-ai-4.1b-8b": { "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "together_ai", "mode": "chat" }, "together-ai-8.1b-21b": { "max_tokens": 1000, "input_cost_per_token": 0.0000003, "output_cost_per_token": 0.0000003, "litellm_provider": "together_ai", "mode": "chat" }, "together-ai-21.1b-41b": { "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000008, "litellm_provider": "together_ai", "mode": "chat" }, "together-ai-41.1b-80b": { "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "together_ai", "mode": "chat" }, "together-ai-81.1b-110b": { "input_cost_per_token": 0.0000018, "output_cost_per_token": 0.0000018, "litellm_provider": "together_ai", "mode": "chat" }, "together-ai-embedding-up-to-150m": { "input_cost_per_token": 0.000000008, "output_cost_per_token": 0.0, "litellm_provider": "together_ai", "mode": "embedding" }, 
"together-ai-embedding-151m-to-350m": { "input_cost_per_token": 0.000000016, "output_cost_per_token": 0.0, "litellm_provider": "together_ai", "mode": "embedding" }, "together_ai/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo": { "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.00000018, "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "mode": "chat", "supports_tool_choice": true }, "together_ai/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo": { "input_cost_per_token": 0.00000088, "output_cost_per_token": 0.00000088, "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "mode": "chat", "supports_tool_choice": true }, "together_ai/meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo": { "input_cost_per_token": 0.0000035, "output_cost_per_token": 0.0000035, "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo": { "input_cost_per_token": 0.00000088, "output_cost_per_token": 0.00000088, "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "mode": "chat", "supports_tool_choice": true }, "together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo-Free": { "input_cost_per_token": 0, "output_cost_per_token": 0, "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "mode": "chat", "supports_tool_choice": true }, "together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1": { "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000006, "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, 
"supports_response_schema": true, "mode": "chat", "supports_tool_choice": true }, "together_ai/mistralai/Mistral-7B-Instruct-v0.1": { "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_response_schema": true, "mode": "chat", "supports_tool_choice": true }, "together_ai/togethercomputer/CodeLlama-34b-Instruct": { "litellm_provider": "together_ai", "supports_function_calling": true, "supports_parallel_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "ollama/codegemma": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion" }, "ollama/codegeex4": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat", "supports_function_calling": false }, "ollama/deepseek-coder-v2-instruct": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat", "supports_function_calling": true }, "ollama/deepseek-coder-v2-base": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion", "supports_function_calling": true }, "ollama/deepseek-coder-v2-lite-instruct": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat", "supports_function_calling": true }, "ollama/deepseek-coder-v2-lite-base": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion", 
"supports_function_calling": true }, "ollama/internlm2_5-20b-chat": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat", "supports_function_calling": true }, "ollama/llama2": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/llama2:7b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/llama2:13b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/llama2:70b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/llama2-uncensored": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion" }, "ollama/llama3": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/llama3:8b": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/llama3:70b": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/llama3.1": { "max_tokens": 32768, "max_input_tokens": 8192, 
"max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat", "supports_function_calling": true }, "ollama/mistral-large-instruct-2407": { "max_tokens": 65536, "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/mistral": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion" }, "ollama/mistral-7B-Instruct-v0.1": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/mistral-7B-Instruct-v0.2": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/mixtral-8x7B-Instruct-v0.1": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/mixtral-8x22B-Instruct-v0.1": { "max_tokens": 65536, "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "chat" }, "ollama/codellama": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion" }, "ollama/orca-mini": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion" }, "ollama/vicuna": { "max_tokens": 2048, "max_input_tokens": 2048, "max_output_tokens": 2048, 
"input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "ollama", "mode": "completion" }, "deepinfra/lizpreciatior/lzlv_70b_fp16_hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000090, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/Gryphe/MythoMax-L2-13b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000022, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/mistralai/Mistral-7B-Instruct-v0.1": { "max_tokens": 8191, "max_input_tokens": 32768, "max_output_tokens": 8191, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/meta-llama/Llama-2-70b-chat-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000090, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b": { "max_tokens": 8191, "max_input_tokens": 32768, "max_output_tokens": 8191, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000027, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/codellama/CodeLlama-34b-Instruct-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000060, "output_cost_per_token": 0.00000060, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/deepinfra/mixtral": { "max_tokens": 4096, "max_input_tokens": 32000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000027, "litellm_provider": "deepinfra", "mode": 
"completion" }, "deepinfra/Phind/Phind-CodeLlama-34B-v2": { "max_tokens": 4096, "max_input_tokens": 16384, "max_output_tokens": 4096, "input_cost_per_token": 0.00000060, "output_cost_per_token": 0.00000060, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1": { "max_tokens": 8191, "max_input_tokens": 32768, "max_output_tokens": 8191, "input_cost_per_token": 0.00000027, "output_cost_per_token": 0.00000027, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/deepinfra/airoboros-70b": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000090, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/01-ai/Yi-34B-Chat": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000060, "output_cost_per_token": 0.00000060, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/01-ai/Yi-6B-200K": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013, "litellm_provider": "deepinfra", "mode": "completion" }, "deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000090, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/meta-llama/Llama-2-13b-chat-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000022, "output_cost_per_token": 0.00000022, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/amazon/MistralLite": { "max_tokens": 8191, "max_input_tokens": 32768, "max_output_tokens": 8191, 
"input_cost_per_token": 0.00000020, "output_cost_per_token": 0.00000020, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/meta-llama/Llama-2-7b-chat-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/meta-llama/Meta-Llama-3-8B-Instruct": { "max_tokens": 8191, "max_input_tokens": 8191, "max_output_tokens": 4096, "input_cost_per_token": 0.00000008, "output_cost_per_token": 0.00000008, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/meta-llama/Meta-Llama-3-70B-Instruct": { "max_tokens": 8191, "max_input_tokens": 8191, "max_output_tokens": 4096, "input_cost_per_token": 0.00000059, "output_cost_per_token": 0.00000079, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "deepinfra", "mode": "chat", "supports_function_calling": true, "supports_parallel_function_calling": true, "supports_tool_choice": true }, "deepinfra/01-ai/Yi-34B-200K": { "max_tokens": 4096, "max_input_tokens": 200000, "max_output_tokens": 4096, "input_cost_per_token": 0.00000060, "output_cost_per_token": 0.00000060, "litellm_provider": "deepinfra", "mode": "completion" }, "deepinfra/openchat/openchat_3.5": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000013, "output_cost_per_token": 0.00000013, "litellm_provider": "deepinfra", "mode": "chat", "supports_tool_choice": true }, "perplexity/codellama-34b-instruct": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000035, 
"output_cost_per_token": 0.00000140, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/codellama-70b-instruct": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000280, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/llama-3.1-70b-instruct": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/llama-3.1-8b-instruct": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/llama-3.1-sonar-huge-128k-online": { "max_tokens": 127072, "max_input_tokens": 127072, "max_output_tokens": 127072, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000005, "litellm_provider": "perplexity", "mode": "chat", "deprecation_date": "2025-02-22", "supports_tool_choice": true }, "perplexity/llama-3.1-sonar-large-128k-online": { "max_tokens": 127072, "max_input_tokens": 127072, "max_output_tokens": 127072, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001, "litellm_provider": "perplexity", "mode": "chat", "deprecation_date": "2025-02-22", "supports_tool_choice": true }, "perplexity/llama-3.1-sonar-large-128k-chat": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001, "litellm_provider": "perplexity", "mode": "chat", "deprecation_date": "2025-02-22", "supports_tool_choice": true }, "perplexity/llama-3.1-sonar-small-128k-chat": { "max_tokens": 131072, "max_input_tokens": 131072, "max_output_tokens": 131072, 
"input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "perplexity", "mode": "chat", "deprecation_date": "2025-02-22", "supports_tool_choice": true }, "perplexity/llama-3.1-sonar-small-128k-online": { "max_tokens": 127072, "max_input_tokens": 127072, "max_output_tokens": 127072, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "perplexity", "mode": "chat" , "deprecation_date": "2025-02-22", "supports_tool_choice": true }, "perplexity/pplx-7b-chat": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/pplx-70b-chat": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000280, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/pplx-7b-online": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000000, "output_cost_per_token": 0.00000028, "input_cost_per_request": 0.005, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/pplx-70b-online": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000000, "output_cost_per_token": 0.00000280, "input_cost_per_request": 0.005, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/llama-2-70b-chat": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000070, "output_cost_per_token": 0.00000280, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/mistral-7b-instruct": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, 
"input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028, "litellm_provider": "perplexity", "mode": "chat" , "supports_tool_choice": true }, "perplexity/mixtral-8x7b-instruct": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028, "litellm_provider": "perplexity", "mode": "chat", "supports_tool_choice": true }, "perplexity/sonar-small-chat": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000007, "output_cost_per_token": 0.00000028, "litellm_provider": "perplexity", "mode": "chat", "supports_tool_choice": true }, "perplexity/sonar-small-online": { "max_tokens": 12000, "max_input_tokens": 12000, "max_output_tokens": 12000, "input_cost_per_token": 0, "output_cost_per_token": 0.00000028, "input_cost_per_request": 0.005, "litellm_provider": "perplexity", "mode": "chat", "supports_tool_choice": true }, "perplexity/sonar-medium-chat": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000018, "litellm_provider": "perplexity", "mode": "chat", "supports_tool_choice": true }, "perplexity/sonar-medium-online": { "max_tokens": 12000, "max_input_tokens": 12000, "max_output_tokens": 12000, "input_cost_per_token": 0, "output_cost_per_token": 0.0000018, "input_cost_per_request": 0.005, "litellm_provider": "perplexity", "mode": "chat", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, 
"fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instruct": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/llama-v3p1-8b-instruct": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000001, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instruct": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "accounts/fireworks/models/llama-v3p2-90b-vision-instruct": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_vision": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing" }, "fireworks_ai/accounts/fireworks/models/firefunction-v2": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": 
"https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/mixtral-8x22b-instruct-hf": { "max_tokens": 65536, "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/qwen2-72b-instruct": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/qwen2p5-coder-32b-instruct": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/yi-large": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000003, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/deepseek-coder-v2-instruct": { "max_tokens": 65536, "max_input_tokens": 65536, "max_output_tokens": 8192, "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_function_calling": true, 
"supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/accounts/fireworks/models/deepseek-v3": { "max_tokens": 8192, "max_input_tokens": 128000, "max_output_tokens": 8192, "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "fireworks_ai", "mode": "chat", "supports_response_schema": true, "source": "https://fireworks.ai/pricing", "supports_tool_choice": true }, "fireworks_ai/nomic-ai/nomic-embed-text-v1.5": { "max_tokens": 8192, "max_input_tokens": 8192, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0.000000, "litellm_provider": "fireworks_ai-embedding-models", "mode": "embedding", "source": "https://fireworks.ai/pricing" }, "fireworks_ai/nomic-ai/nomic-embed-text-v1": { "max_tokens": 8192, "max_input_tokens": 8192, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0.000000, "litellm_provider": "fireworks_ai-embedding-models", "mode": "embedding", "source": "https://fireworks.ai/pricing" }, "fireworks_ai/WhereIsAI/UAE-Large-V1": { "max_tokens": 512, "max_input_tokens": 512, "input_cost_per_token": 0.000000016, "output_cost_per_token": 0.000000, "litellm_provider": "fireworks_ai-embedding-models", "mode": "embedding", "source": "https://fireworks.ai/pricing" }, "fireworks_ai/thenlper/gte-large": { "max_tokens": 512, "max_input_tokens": 512, "input_cost_per_token": 0.000000016, "output_cost_per_token": 0.000000, "litellm_provider": "fireworks_ai-embedding-models", "mode": "embedding", "source": "https://fireworks.ai/pricing" }, "fireworks_ai/thenlper/gte-base": { "max_tokens": 512, "max_input_tokens": 512, "input_cost_per_token": 0.000000008, "output_cost_per_token": 0.000000, "litellm_provider": "fireworks_ai-embedding-models", "mode": "embedding", "source": "https://fireworks.ai/pricing" }, "fireworks-ai-up-to-16b": { "input_cost_per_token": 0.0000002, "output_cost_per_token": 0.0000002, "litellm_provider": "fireworks_ai" }, 
"fireworks-ai-16.1b-to-80b": { "input_cost_per_token": 0.0000009, "output_cost_per_token": 0.0000009, "litellm_provider": "fireworks_ai" }, "fireworks-ai-moe-up-to-56b": { "input_cost_per_token": 0.0000005, "output_cost_per_token": 0.0000005, "litellm_provider": "fireworks_ai" }, "fireworks-ai-56b-to-176b": { "input_cost_per_token": 0.0000012, "output_cost_per_token": 0.0000012, "litellm_provider": "fireworks_ai" }, "fireworks-ai-default": { "input_cost_per_token": 0.0, "output_cost_per_token": 0.0, "litellm_provider": "fireworks_ai" }, "fireworks-ai-embedding-up-to-150m": { "input_cost_per_token": 0.000000008, "output_cost_per_token": 0.000000, "litellm_provider": "fireworks_ai-embedding-models" }, "fireworks-ai-embedding-150m-to-350m": { "input_cost_per_token": 0.000000016, "output_cost_per_token": 0.000000, "litellm_provider": "fireworks_ai-embedding-models" }, "anyscale/mistralai/Mistral-7B-Instruct-v0.1": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "anyscale", "mode": "chat", "supports_function_calling": true, "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/mistralai-Mistral-7B-Instruct-v0.1" }, "anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "anyscale", "mode": "chat", "supports_function_calling": true, "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/mistralai-Mixtral-8x7B-Instruct-v0.1" }, "anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1": { "max_tokens": 65536, "max_input_tokens": 65536, "max_output_tokens": 65536, "input_cost_per_token": 0.00000090, "output_cost_per_token": 0.00000090, "litellm_provider": "anyscale", "mode": "chat", "supports_function_calling": true, "source": 
"https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/mistralai-Mixtral-8x22B-Instruct-v0.1" }, "anyscale/HuggingFaceH4/zephyr-7b-beta": { "max_tokens": 16384, "max_input_tokens": 16384, "max_output_tokens": 16384, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "anyscale", "mode": "chat" }, "anyscale/google/gemma-7b-it": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "anyscale", "mode": "chat", "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/google-gemma-7b-it" }, "anyscale/meta-llama/Llama-2-7b-chat-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "anyscale", "mode": "chat" }, "anyscale/meta-llama/Llama-2-13b-chat-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000025, "output_cost_per_token": 0.00000025, "litellm_provider": "anyscale", "mode": "chat" }, "anyscale/meta-llama/Llama-2-70b-chat-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001, "litellm_provider": "anyscale", "mode": "chat" }, "anyscale/codellama/CodeLlama-34b-Instruct-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001, "litellm_provider": "anyscale", "mode": "chat" }, "anyscale/codellama/CodeLlama-70b-Instruct-hf": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000001, "litellm_provider": "anyscale", "mode": "chat", "source" : 
"https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/codellama-CodeLlama-70b-Instruct-hf" }, "anyscale/meta-llama/Meta-Llama-3-8B-Instruct": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000015, "output_cost_per_token": 0.00000015, "litellm_provider": "anyscale", "mode": "chat", "source": "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/meta-llama-Meta-Llama-3-8B-Instruct" }, "anyscale/meta-llama/Meta-Llama-3-70B-Instruct": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000100, "output_cost_per_token": 0.00000100, "litellm_provider": "anyscale", "mode": "chat", "source" : "https://docs.anyscale.com/preview/endpoints/text-generation/supported-models/meta-llama-Meta-Llama-3-70B-Instruct" }, "cloudflare/@cf/meta/llama-2-7b-chat-fp16": { "max_tokens": 3072, "max_input_tokens": 3072, "max_output_tokens": 3072, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923, "litellm_provider": "cloudflare", "mode": "chat" }, "cloudflare/@cf/meta/llama-2-7b-chat-int8": { "max_tokens": 2048, "max_input_tokens": 2048, "max_output_tokens": 2048, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923, "litellm_provider": "cloudflare", "mode": "chat" }, "cloudflare/@cf/mistral/mistral-7b-instruct-v0.1": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923, "litellm_provider": "cloudflare", "mode": "chat" }, "cloudflare/@hf/thebloke/codellama-7b-instruct-awq": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.000001923, "output_cost_per_token": 0.000001923, "litellm_provider": "cloudflare", "mode": "chat" }, "voyage/voyage-01": { "max_tokens": 4096, "max_input_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 
0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-lite-01": { "max_tokens": 4096, "max_input_tokens": 4096, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-large-2": { "max_tokens": 16000, "max_input_tokens": 16000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-finance-2": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-lite-02-instruct": { "max_tokens": 4000, "max_input_tokens": 4000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-law-2": { "max_tokens": 16000, "max_input_tokens": 16000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-code-2": { "max_tokens": 16000, "max_input_tokens": 16000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-2": { "max_tokens": 4000, "max_input_tokens": 4000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-3-large": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-3": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.00000006, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-3-lite": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.00000002, "output_cost_per_token": 0.000000, 
"litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-code-3": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.00000018, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/voyage-multimodal-3": { "max_tokens": 32000, "max_input_tokens": 32000, "input_cost_per_token": 0.00000012, "output_cost_per_token": 0.000000, "litellm_provider": "voyage", "mode": "embedding" }, "voyage/rerank-2": { "max_tokens": 16000, "max_input_tokens": 16000, "max_output_tokens": 16000, "max_query_tokens": 16000, "input_cost_per_token": 0.00000005, "input_cost_per_query": 0.00000005, "output_cost_per_token": 0.0, "litellm_provider": "voyage", "mode": "rerank" }, "voyage/rerank-2-lite": { "max_tokens": 8000, "max_input_tokens": 8000, "max_output_tokens": 8000, "max_query_tokens": 8000, "input_cost_per_token": 0.00000002, "input_cost_per_query": 0.00000002, "output_cost_per_token": 0.0, "litellm_provider": "voyage", "mode": "rerank" }, "databricks/databricks-meta-llama-3-1-405b-instruct": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.000005, "input_dbu_cost_per_token": 0.000071429, "output_cost_per_token": 0.00001500002, "output_db_cost_per_token": 0.000214286, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. 
Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-meta-llama-3-1-70b-instruct": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000100002, "input_dbu_cost_per_token": 0.000014286, "output_cost_per_token": 0.00000299999, "output_dbu_cost_per_token": 0.000042857, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/meta-llama-3.3-70b-instruct": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000100002, "input_dbu_cost_per_token": 0.000014286, "output_cost_per_token": 0.00000299999, "output_dbu_cost_per_token": 0.000042857, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-dbrx-instruct": { "max_tokens": 32768, "max_input_tokens": 32768, "max_output_tokens": 32768, "input_cost_per_token": 0.00000074998, "input_dbu_cost_per_token": 0.000010714, "output_cost_per_token": 0.00000224901, "output_dbu_cost_per_token": 0.000032143, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. 
Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-meta-llama-3-70b-instruct": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.00000100002, "input_dbu_cost_per_token": 0.000014286, "output_cost_per_token": 0.00000299999, "output_dbu_cost_per_token": 0.000042857, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-llama-2-70b-chat": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000050001, "input_dbu_cost_per_token": 0.000007143, "output_cost_per_token": 0.0000015, "output_dbu_cost_per_token": 0.000021429, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-mixtral-8x7b-instruct": { "max_tokens": 4096, "max_input_tokens": 4096, "max_output_tokens": 4096, "input_cost_per_token": 0.00000050001, "input_dbu_cost_per_token": 0.000007143, "output_cost_per_token": 0.00000099902, "output_dbu_cost_per_token": 0.000014286, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. 
Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-mpt-30b-instruct": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000099902, "input_dbu_cost_per_token": 0.000014286, "output_cost_per_token": 0.00000099902, "output_dbu_cost_per_token": 0.000014286, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-mpt-7b-instruct": { "max_tokens": 8192, "max_input_tokens": 8192, "max_output_tokens": 8192, "input_cost_per_token": 0.00000050001, "input_dbu_cost_per_token": 0.000007143, "output_cost_per_token": 0.0, "output_dbu_cost_per_token": 0.0, "litellm_provider": "databricks", "mode": "chat", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."}, "supports_tool_choice": true }, "databricks/databricks-bge-large-en": { "max_tokens": 512, "max_input_tokens": 512, "output_vector_size": 1024, "input_cost_per_token": 0.00000010003, "input_dbu_cost_per_token": 0.000001429, "output_cost_per_token": 0.0, "output_dbu_cost_per_token": 0.0, "litellm_provider": "databricks", "mode": "embedding", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. 
Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."} }, "databricks/databricks-gte-large-en": { "max_tokens": 8192, "max_input_tokens": 8192, "output_vector_size": 1024, "input_cost_per_token": 0.00000012999, "input_dbu_cost_per_token": 0.000001857, "output_cost_per_token": 0.0, "output_dbu_cost_per_token": 0.0, "litellm_provider": "databricks", "mode": "embedding", "source": "https://www.databricks.com/product/pricing/foundation-model-serving", "metadata": {"notes": "Input/output cost per token is dbu cost * $0.070, based on databricks Llama 3.1 70B conversion. Number provided for reference, '*_dbu_cost_per_token' used in actual calculation."} }, "sambanova/Meta-Llama-3.1-8B-Instruct": { "max_tokens": 16000, "max_input_tokens": 16000, "max_output_tokens": 16000, "input_cost_per_token": 0.0000001, "output_cost_per_token": 0.0000002, "litellm_provider": "sambanova", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "sambanova/Meta-Llama-3.1-70B-Instruct": { "max_tokens": 128000, "max_input_tokens": 128000, "max_output_tokens": 128000, "input_cost_per_token": 0.0000006, "output_cost_per_token": 0.0000012, "litellm_provider": "sambanova", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "sambanova/Meta-Llama-3.1-405B-Instruct": { "max_tokens": 16000, "max_input_tokens": 16000, "max_output_tokens": 16000, "input_cost_per_token": 0.000005, "output_cost_per_token": 0.000010, "litellm_provider": "sambanova", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "sambanova/Meta-Llama-3.2-1B-Instruct": { "max_tokens": 16000, "max_input_tokens": 16000, "max_output_tokens": 16000, "input_cost_per_token": 0.0000004, "output_cost_per_token": 0.0000008, "litellm_provider": "sambanova", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "sambanova/Meta-Llama-3.2-3B-Instruct": { "max_tokens": 4000, "max_input_tokens": 4000, 
"max_output_tokens": 4000, "input_cost_per_token": 0.0000008, "output_cost_per_token": 0.0000016, "litellm_provider": "sambanova", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "sambanova/Qwen2.5-Coder-32B-Instruct": { "max_tokens": 8000, "max_input_tokens": 8000, "max_output_tokens": 8000, "input_cost_per_token": 0.0000015, "output_cost_per_token": 0.000003, "litellm_provider": "sambanova", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "sambanova/Qwen2.5-72B-Instruct": { "max_tokens": 8000, "max_input_tokens": 8000, "max_output_tokens": 8000, "input_cost_per_token": 0.000002, "output_cost_per_token": 0.000004, "litellm_provider": "sambanova", "supports_function_calling": true, "mode": "chat", "supports_tool_choice": true }, "assemblyai/nano": { "mode": "audio_transcription", "input_cost_per_second": 0.00010278, "output_cost_per_second": 0.00, "litellm_provider": "assemblyai" }, "assemblyai/best": { "mode": "audio_transcription", "input_cost_per_second": 0.00003333, "output_cost_per_second": 0.00, "litellm_provider": "assemblyai" } }