Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
6 changes: 5 additions & 1 deletion pricing_table.md
Original file line number Diff line number Diff line change
Expand Up @@ -1065,4 +1065,8 @@
| mistral/mistral-medium-2505 | $0.4 | $2 | 131,072 | 8191 |
| embed-v4.0 | $0.12 | $0 | 1,024 | nan |
| cerebras/qwen-3-32b | $0.4 | $0.8 | 128,000 | 128000 |
| gemini-embedding-001 | $0.15 | $0 | 2,048 | nan |
| gemini-embedding-001 | $0.15 | $0 | 2,048 | nan |
| claude-4-opus-20250514 | $15 | $75 | 200,000 | 32000 |
| claude-4-sonnet-20250514 | $3 | $15 | 200,000 | 64000 |
| fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct | $0.9 | $0.9 | 16,384 | 16384 |
| fireworks_ai/accounts/fireworks/models/deepseek-r1-0528 | $3 | $8 | 160,000 | 160000 |
122 changes: 100 additions & 22 deletions tokencost/model_prices.json
Original file line number Diff line number Diff line change
Expand Up @@ -6780,10 +6780,10 @@
"output_cost_per_token": 1e-07,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instruct": {
"max_tokens": 16384,
Expand All @@ -6793,10 +6793,10 @@
"output_cost_per_token": 1e-07,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instruct": {
"max_tokens": 16384,
Expand All @@ -6806,11 +6806,11 @@
"output_cost_per_token": 2e-07,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_vision": true,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"accounts/fireworks/models/llama-v3p2-90b-vision-instruct": {
"max_tokens": 16384,
Expand Down Expand Up @@ -6859,10 +6859,10 @@
"output_cost_per_token": 9e-07,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/accounts/fireworks/models/yi-large": {
"max_tokens": 32768,
Expand All @@ -6872,10 +6872,10 @@
"output_cost_per_token": 3e-06,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/accounts/fireworks/models/deepseek-coder-v2-instruct": {
"max_tokens": 65536,
Expand All @@ -6885,10 +6885,10 @@
"output_cost_per_token": 1.2e-06,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/nomic-ai/nomic-embed-text-v1.5": {
"max_tokens": 8192,
Expand Down Expand Up @@ -7984,10 +7984,10 @@
"output_cost_per_token": 9e-07,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"omni-moderation-latest": {
"max_tokens": 32768,
Expand Down Expand Up @@ -8662,7 +8662,7 @@
"mode": "chat",
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"voyage/voyage-3-large": {
"max_tokens": 32000,
Expand Down Expand Up @@ -9468,10 +9468,10 @@
"output_cost_per_token": 1e-07,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_function_calling": true,
"supports_function_calling": false,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"assemblyai/nano": {
"mode": "audio_transcription",
Expand Down Expand Up @@ -12947,7 +12947,7 @@
"mode": "chat",
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/accounts/fireworks/models/deepseek-r1-basic": {
"max_tokens": 20480,
Expand All @@ -12959,7 +12959,7 @@
"mode": "chat",
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/accounts/fireworks/models/llama-v3p1-405b-instruct": {
"max_tokens": 16384,
Expand All @@ -12971,7 +12971,8 @@
"mode": "chat",
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": true,
"supports_function_calling": true
},
"fireworks_ai/accounts/fireworks/models/llama4-maverick-instruct-basic": {
"max_tokens": 131072,
Expand All @@ -12983,7 +12984,7 @@
"mode": "chat",
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks_ai/accounts/fireworks/models/llama4-scout-instruct-basic": {
"max_tokens": 131072,
Expand All @@ -12995,7 +12996,7 @@
"mode": "chat",
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": true
"supports_tool_choice": false
},
"fireworks-ai-up-to-4b": {
"input_cost_per_token": 2e-07,
Expand Down Expand Up @@ -14151,5 +14152,82 @@
"litellm_provider": "vertex_ai-embedding-models",
"mode": "embedding",
"source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models"
},
"claude-4-opus-20250514": {
"max_tokens": 32000,
"max_input_tokens": 200000,
"max_output_tokens": 32000,
"input_cost_per_token": 1.5e-05,
"output_cost_per_token": 7.5e-05,
"search_context_cost_per_query": {
"search_context_size_low": 0.01,
"search_context_size_medium": 0.01,
"search_context_size_high": 0.01
},
"cache_creation_input_token_cost": 1.875e-05,
"cache_read_input_token_cost": 1.5e-06,
"litellm_provider": "anthropic",
"mode": "chat",
"supports_function_calling": true,
"supports_vision": true,
"tool_use_system_prompt_tokens": 159,
"supports_assistant_prefill": true,
"supports_pdf_input": true,
"supports_prompt_caching": true,
"supports_response_schema": true,
"supports_tool_choice": true,
"supports_reasoning": true,
"supports_computer_use": true
},
"claude-4-sonnet-20250514": {
"max_tokens": 64000,
"max_input_tokens": 200000,
"max_output_tokens": 64000,
"input_cost_per_token": 3e-06,
"output_cost_per_token": 1.5e-05,
"search_context_cost_per_query": {
"search_context_size_low": 0.01,
"search_context_size_medium": 0.01,
"search_context_size_high": 0.01
},
"cache_creation_input_token_cost": 3.75e-06,
"cache_read_input_token_cost": 3e-07,
"litellm_provider": "anthropic",
"mode": "chat",
"supports_function_calling": true,
"supports_vision": true,
"tool_use_system_prompt_tokens": 159,
"supports_assistant_prefill": true,
"supports_pdf_input": true,
"supports_prompt_caching": true,
"supports_response_schema": true,
"supports_tool_choice": true,
"supports_reasoning": true,
"supports_computer_use": true
},
"fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct": {
"max_tokens": 16384,
"max_input_tokens": 16384,
"max_output_tokens": 16384,
"input_cost_per_token": 9e-07,
"output_cost_per_token": 9e-07,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"supports_tool_choice": false,
"supports_vision": true,
"supports_response_schema": true,
"source": "https://fireworks.ai/pricing"
},
"fireworks_ai/accounts/fireworks/models/deepseek-r1-0528": {
"max_tokens": 160000,
"max_input_tokens": 160000,
"max_output_tokens": 160000,
"input_cost_per_token": 3e-06,
"output_cost_per_token": 8e-06,
"litellm_provider": "fireworks_ai",
"mode": "chat",
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": false,
"supports_response_schema": true
}
}