Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
9 changes: 8 additions & 1 deletion pricing_table.md
Original file line number Diff line number Diff line change
Expand Up @@ -1237,4 +1237,11 @@
| xai/grok-3-mini-fast | $0.6 | $4 | 131,072 | 131072 |
| vertex_ai/imagen-4.0-generate-preview-06-06 | -- | -- | nan | nan |
| vertex_ai/imagen-4.0-ultra-generate-preview-06-06 | -- | -- | nan | nan |
| vertex_ai/imagen-4.0-fast-generate-preview-06-06 | -- | -- | nan | nan |
| vertex_ai/imagen-4.0-fast-generate-preview-06-06 | -- | -- | nan | nan |
| gemini/gemini-2.5-pro | $1.25 | $10 | 1,048,576 | 65535 |
| gemini-2.5-flash | $0.3 | $2.5 | 1,048,576 | 65535 |
| gemini-2.5-flash-lite-preview-06-17 | $0.1 | $0.4 | 1,048,576 | 65535 |
| openrouter/deepseek/deepseek-r1-0528 | $0.5 | $2.15 | 65,336 | 8192 |
| openrouter/google/gemini-2.5-pro | $1.25 | $10 | 1,048,576 | 8192 |
| openrouter/google/gemini-2.5-flash | $0.3 | $2.5 | 1,048,576 | 8192 |
| openrouter/anthropic/claude-sonnet-4 | $3 | $15 | 200,000 | 8192 |
202 changes: 202 additions & 0 deletions tokencost/model_prices.json
Original file line number Diff line number Diff line change
Expand Up @@ -16919,5 +16919,207 @@
"litellm_provider": "vertex_ai-image-models",
"mode": "image_generation",
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing"
},
"gemini/gemini-2.5-pro": {
"max_tokens": 65535,
"max_input_tokens": 1048576,
"max_output_tokens": 65535,
"max_images_per_prompt": 3000,
"max_videos_per_prompt": 10,
"max_video_length": 1,
"max_audio_length_hours": 8.4,
"max_audio_per_prompt": 1,
"max_pdf_size_mb": 30,
"input_cost_per_token": 1.25e-06,
"input_cost_per_token_above_200k_tokens": 2.5e-06,
"output_cost_per_token": 1e-05,
"output_cost_per_token_above_200k_tokens": 1.5e-05,
"litellm_provider": "gemini",
"mode": "chat",
"rpm": 5,
"tpm": 250000,
"supports_system_messages": true,
"supports_function_calling": true,
"supports_vision": true,
"supports_audio_input": true,
"supports_video_input": true,
"supports_pdf_input": true,
"supports_response_schema": true,
"supports_tool_choice": true,
"supported_endpoints": [
"/v1/chat/completions",
"/v1/completions"
],
"supported_modalities": [
"text",
"image",
"audio",
"video"
],
"supported_output_modalities": [
"text"
],
"source": "https://cloud.google.com/vertex-ai/generative-ai/pricing",
"supports_web_search": true
},
"gemini-2.5-flash": {
"max_tokens": 65535,
"max_input_tokens": 1048576,
"max_output_tokens": 65535,
"max_images_per_prompt": 3000,
"max_videos_per_prompt": 10,
"max_video_length": 1,
"max_audio_length_hours": 8.4,
"max_audio_per_prompt": 1,
"max_pdf_size_mb": 30,
"input_cost_per_audio_token": 1e-06,
"input_cost_per_token": 3e-07,
"output_cost_per_token": 2.5e-06,
"output_cost_per_reasoning_token": 2.5e-06,
"litellm_provider": "vertex_ai-language-models",
"mode": "chat",
"supports_reasoning": true,
"supports_system_messages": true,
"supports_function_calling": true,
"supports_vision": true,
"supports_response_schema": true,
"supports_audio_output": false,
"supports_tool_choice": true,
"supported_endpoints": [
"/v1/chat/completions",
"/v1/completions",
"/v1/batch"
],
"supported_modalities": [
"text",
"image",
"audio",
"video"
],
"supported_output_modalities": [
"text"
],
"source": "https://ai.google.dev/gemini-api/docs/models#gemini-2.5-flash-preview",
"supports_parallel_function_calling": true,
"supports_web_search": true,
"supports_url_context": true
},
"gemini-2.5-flash-lite-preview-06-17": {
"max_tokens": 65535,
"max_input_tokens": 1048576,
"max_output_tokens": 65535,
"max_images_per_prompt": 3000,
"max_videos_per_prompt": 10,
"max_video_length": 1,
"max_audio_length_hours": 8.4,
"max_audio_per_prompt": 1,
"max_pdf_size_mb": 30,
"input_cost_per_audio_token": 1e-06,
"input_cost_per_token": 1e-07,
"output_cost_per_token": 4e-07,
"output_cost_per_reasoning_token": 4e-07,
"litellm_provider": "vertex_ai-language-models",
"mode": "chat",
"supports_reasoning": true,
"supports_system_messages": true,
"supports_function_calling": true,
"supports_vision": true,
"supports_response_schema": true,
"supports_audio_output": false,
"supports_tool_choice": true,
"supported_endpoints": [
"/v1/chat/completions",
"/v1/completions",
"/v1/batch"
],
"supported_modalities": [
"text",
"image",
"audio",
"video"
],
"supported_output_modalities": [
"text"
],
"source": "https://ai.google.dev/gemini-api/docs/models#gemini-2.5-flash-preview",
"supports_parallel_function_calling": true,
"supports_web_search": true,
"supports_url_context": true
},
"openrouter/deepseek/deepseek-r1-0528": {
"max_tokens": 8192,
"max_input_tokens": 65336,
"max_output_tokens": 8192,
"input_cost_per_token": 5e-07,
"input_cost_per_token_cache_hit": 1.4e-07,
"output_cost_per_token": 2.15e-06,
"litellm_provider": "openrouter",
"mode": "chat",
"supports_function_calling": true,
"supports_assistant_prefill": true,
"supports_reasoning": true,
"supports_tool_choice": true,
"supports_prompt_caching": true
},
"openrouter/google/gemini-2.5-pro": {
"max_tokens": 8192,
"max_input_tokens": 1048576,
"max_output_tokens": 8192,
"max_images_per_prompt": 3000,
"max_videos_per_prompt": 10,
"max_video_length": 1,
"max_audio_length_hours": 8.4,
"max_audio_per_prompt": 1,
"max_pdf_size_mb": 30,
"input_cost_per_audio_token": 7e-07,
"input_cost_per_token": 1.25e-06,
"output_cost_per_token": 1e-05,
"litellm_provider": "openrouter",
"mode": "chat",
"supports_system_messages": true,
"supports_function_calling": true,
"supports_vision": true,
"supports_response_schema": true,
"supports_audio_output": true,
"supports_tool_choice": true
},
"openrouter/google/gemini-2.5-flash": {
"max_tokens": 8192,
"max_input_tokens": 1048576,
"max_output_tokens": 8192,
"max_images_per_prompt": 3000,
"max_videos_per_prompt": 10,
"max_video_length": 1,
"max_audio_length_hours": 8.4,
"max_audio_per_prompt": 1,
"max_pdf_size_mb": 30,
"input_cost_per_audio_token": 7e-07,
"input_cost_per_token": 3e-07,
"output_cost_per_token": 2.5e-06,
"litellm_provider": "openrouter",
"mode": "chat",
"supports_system_messages": true,
"supports_function_calling": true,
"supports_vision": true,
"supports_response_schema": true,
"supports_audio_output": true,
"supports_tool_choice": true
},
"openrouter/anthropic/claude-sonnet-4": {
"supports_computer_use": true,
"max_tokens": 8192,
"max_input_tokens": 200000,
"max_output_tokens": 8192,
"input_cost_per_token": 3e-06,
"output_cost_per_token": 1.5e-05,
"input_cost_per_image": 0.0048,
"litellm_provider": "openrouter",
"mode": "chat",
"supports_function_calling": true,
"supports_vision": true,
"supports_reasoning": true,
"tool_use_system_prompt_tokens": 159,
"supports_assistant_prefill": true,
"supports_tool_choice": true
}
}