Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
26 changes: 15 additions & 11 deletions pricing_table.md
Original file line number Diff line number Diff line change
Expand Up @@ -729,9 +729,9 @@
| rerank-v3.5 | $0 | $0 | 4,096 | 4096 |
| openrouter/deepseek/deepseek-chat | $0.14 | $0.28 | 65,536 | 8192 |
| openrouter/openai/o1 | $15 | $60 | 200,000 | 100000 |
| amazon.nova-micro-v1:0 | $0.04 | $0.14 | 300,000 | 4096 |
| amazon.nova-lite-v1:0 | $0.06 | $0.24 | 128,000 | 4096 |
| amazon.nova-pro-v1:0 | $0.8 | $3.2 | 300,000 | 4096 |
| amazon.nova-micro-v1:0 | $0.04 | $0.14 | 300,000 | 10000 |
| amazon.nova-lite-v1:0 | $0.06 | $0.24 | 128,000 | 10000 |
| amazon.nova-pro-v1:0 | $0.8 | $3.2 | 300,000 | 10000 |
| meta.llama3-3-70b-instruct-v1:0 | $0.72 | $0.72 | 128,000 | 4096 |
| together_ai/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo | $0.18 | $0.18 | nan | nan |
| together_ai/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo | $0.88 | $0.88 | nan | nan |
Expand Down Expand Up @@ -780,9 +780,9 @@
| openrouter/deepseek/deepseek-r1 | $0.55 | $2.19 | 65,336 | 8192 |
| ai21.jamba-1-5-large-v1:0 | $2 | $8 | 256,000 | 256000 |
| ai21.jamba-1-5-mini-v1:0 | $0.2 | $0.4 | 256,000 | 256000 |
| us.amazon.nova-micro-v1:0 | $0.04 | $0.14 | 300,000 | 4096 |
| us.amazon.nova-lite-v1:0 | $0.06 | $0.24 | 128,000 | 4096 |
| us.amazon.nova-pro-v1:0 | $0.8 | $3.2 | 300,000 | 4096 |
| us.amazon.nova-micro-v1:0 | $0.04 | $0.14 | 300,000 | 10000 |
| us.amazon.nova-lite-v1:0 | $0.06 | $0.24 | 128,000 | 10000 |
| us.amazon.nova-pro-v1:0 | $0.8 | $3.2 | 300,000 | 10000 |
| stability.sd3-5-large-v1:0 | -- | -- | 77 | nan |
| stability.stable-image-core-v1:0 | -- | -- | 77 | nan |
| stability.stable-image-core-v1:1 | -- | -- | 77 | nan |
Expand Down Expand Up @@ -846,10 +846,10 @@
| vertex_ai/imagen-3.0-generate-002 | -- | -- | nan | nan |
| jamba-large-1.6 | $2 | $8 | 256,000 | 256000 |
| jamba-mini-1.6 | $0.2 | $0.4 | 256,000 | 256000 |
| eu.amazon.nova-micro-v1:0 | $0.05 | $0.18 | 300,000 | 4096 |
| eu.amazon.nova-lite-v1:0 | $0.08 | $0.31 | 128,000 | 4096 |
| eu.amazon.nova-micro-v1:0 | $0.05 | $0.18 | 300,000 | 10000 |
| eu.amazon.nova-lite-v1:0 | $0.08 | $0.31 | 128,000 | 10000 |
| 1024-x-1024/50-steps/bedrock/amazon.nova-canvas-v1:0 | -- | -- | 2,600 | nan |
| eu.amazon.nova-pro-v1:0 | $1.05 | $4.2 | 300,000 | 4096 |
| eu.amazon.nova-pro-v1:0 | $1.05 | $4.2 | 300,000 | 10000 |
| us.deepseek.r1-v1:0 | $1.35 | $5.4 | 128,000 | 4096 |
| snowflake/deepseek-r1 | -- | -- | 32,768 | 8192 |
| snowflake/snowflake-arctic | -- | -- | 4,096 | 8192 |
Expand Down Expand Up @@ -975,7 +975,7 @@
| mistralai/mistral-small-3.1-24b-instruct | $0.1 | $0.3 | nan | nan |
| openrouter/openai/o3-mini | $1.1 | $4.4 | 128,000 | 65536 |
| openrouter/openai/o3-mini-high | $1.1 | $4.4 | 128,000 | 65536 |
| us.amazon.nova-premier-v1:0 | $2.5 | $12.5 | 1,000,000 | 4096 |
| us.amazon.nova-premier-v1:0 | $2.5 | $12.5 | 1,000,000 | 10000 |
| meta.llama4-maverick-17b-instruct-v1:0 | $0.24 | $0.97 | 128,000 | 4096 |
| us.meta.llama4-maverick-17b-instruct-v1:0 | $0.24 | $0.97 | 128,000 | 4096 |
| meta.llama4-scout-17b-instruct-v1:0 | $0.17 | $0.66 | 128,000 | 4096 |
Expand Down Expand Up @@ -1069,4 +1069,8 @@
| claude-4-opus-20250514 | $15 | $75 | 200,000 | 32000 |
| claude-4-sonnet-20250514 | $3 | $15 | 200,000 | 64000 |
| fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct | $0.9 | $0.9 | 16,384 | 16384 |
| fireworks_ai/accounts/fireworks/models/deepseek-r1-0528 | $3 | $8 | 160,000 | 160000 |
| fireworks_ai/accounts/fireworks/models/deepseek-r1-0528 | $3 | $8 | 160,000 | 160000 |
| codex-mini-latest | $1.5 | $6 | 200,000 | 100000 |
| azure/codex-mini-latest | $1.5 | $6 | 200,000 | 100000 |
| gemini-2.5-pro-preview-06-05 | $1.25 | $10 | 1,048,576 | 65535 |
| gemini/gemini-2.5-pro-preview-06-05 | $1.25 | $10 | 1,048,576 | 65535 |
178 changes: 158 additions & 20 deletions tokencost/model_prices.json
Original file line number Diff line number Diff line change
Expand Up @@ -8561,9 +8561,9 @@
"supports_tool_choice": true
},
"amazon.nova-micro-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 300000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 3.5e-08,
"output_cost_per_token": 1.4e-07,
"litellm_provider": "bedrock_converse",
Expand All @@ -8573,9 +8573,9 @@
"supports_response_schema": true
},
"amazon.nova-lite-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 128000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 6e-08,
"output_cost_per_token": 2.4e-07,
"litellm_provider": "bedrock_converse",
Expand All @@ -8587,9 +8587,9 @@
"supports_response_schema": true
},
"amazon.nova-pro-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 300000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 8e-07,
"output_cost_per_token": 3.2e-06,
"litellm_provider": "bedrock_converse",
Expand Down Expand Up @@ -9374,9 +9374,9 @@
"mode": "chat"
},
"us.amazon.nova-micro-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 300000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 3.5e-08,
"output_cost_per_token": 1.4e-07,
"litellm_provider": "bedrock_converse",
Expand All @@ -9386,9 +9386,9 @@
"supports_response_schema": true
},
"us.amazon.nova-lite-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 128000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 6e-08,
"output_cost_per_token": 2.4e-07,
"litellm_provider": "bedrock_converse",
Expand All @@ -9400,9 +9400,9 @@
"supports_response_schema": true
},
"us.amazon.nova-pro-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 300000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 8e-07,
"output_cost_per_token": 3.2e-06,
"litellm_provider": "bedrock_converse",
Expand Down Expand Up @@ -10452,9 +10452,9 @@
"supports_tool_choice": true
},
"eu.amazon.nova-micro-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 300000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 4.6e-08,
"output_cost_per_token": 1.84e-07,
"litellm_provider": "bedrock_converse",
Expand All @@ -10464,9 +10464,9 @@
"supports_response_schema": true
},
"eu.amazon.nova-lite-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 128000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 7.8e-08,
"output_cost_per_token": 3.12e-07,
"litellm_provider": "bedrock_converse",
Expand All @@ -10484,9 +10484,9 @@
"mode": "image_generation"
},
"eu.amazon.nova-pro-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 300000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 1.05e-06,
"output_cost_per_token": 4.2e-06,
"litellm_provider": "bedrock_converse",
Expand Down Expand Up @@ -12778,9 +12778,9 @@
"supports_tool_choice": true
},
"us.amazon.nova-premier-v1:0": {
"max_tokens": 4096,
"max_tokens": 10000,
"max_input_tokens": 1000000,
"max_output_tokens": 4096,
"max_output_tokens": 10000,
"input_cost_per_token": 2.5e-06,
"output_cost_per_token": 1.25e-05,
"litellm_provider": "bedrock_converse",
Expand Down Expand Up @@ -14234,5 +14234,143 @@
"source": "https://fireworks.ai/pricing",
"supports_tool_choice": false,
"supports_response_schema": true
},
"codex-mini-latest": {
"max_tokens": 100000,
"max_input_tokens": 200000,
"max_output_tokens": 100000,
"input_cost_per_token": 1.5e-06,
"output_cost_per_token": 6e-06,
"cache_read_input_token_cost": 3.75e-07,
"litellm_provider": "openai",
"mode": "responses",
"supports_pdf_input": true,
"supports_function_calling": true,
"supports_parallel_function_calling": true,
"supports_vision": true,
"supports_prompt_caching": true,
"supports_system_messages": true,
"supports_response_schema": true,
"supports_tool_choice": true,
"supports_reasoning": true,
"supported_modalities": [
"text",
"image"
],
"supported_output_modalities": [
"text"
],
"supported_endpoints": [
"/v1/responses"
]
},
"azure/codex-mini-latest": {
"max_tokens": 100000,
"max_input_tokens": 200000,
"max_output_tokens": 100000,
"input_cost_per_token": 1.5e-06,
"output_cost_per_token": 6e-06,
"cache_read_input_token_cost": 3.75e-07,
"litellm_provider": "azure",
"mode": "responses",
"supports_pdf_input": true,
"supports_function_calling": true,
"supports_parallel_function_calling": true,
"supports_vision": true,
"supports_prompt_caching": true,
"supports_system_messages": true,
"supports_response_schema": true,
"supports_tool_choice": true,
"supports_reasoning": true,
"supported_modalities": [
"text",
"image"
],
"supported_output_modalities": [
"text"
],
"supported_endpoints": [
"/v1/responses"
]
},
"gemini-2.5-pro-preview-06-05": {
"max_tokens": 65535,
"max_input_tokens": 1048576,
"max_output_tokens": 65535,
"max_images_per_prompt": 3000,
"max_videos_per_prompt": 10,
"max_video_length": 1,
"max_audio_length_hours": 8.4,
"max_audio_per_prompt": 1,
"max_pdf_size_mb": 30,
"input_cost_per_audio_token": 1.25e-06,
"input_cost_per_token": 1.25e-06,
"input_cost_per_token_above_200k_tokens": 2.5e-06,
"output_cost_per_token": 1e-05,
"output_cost_per_token_above_200k_tokens": 1.5e-05,
"litellm_provider": "vertex_ai-language-models",
"mode": "chat",
"supports_reasoning": true,
"supports_system_messages": true,
"supports_function_calling": true,
"supports_vision": true,
"supports_response_schema": true,
"supports_audio_output": false,
"supports_tool_choice": true,
"supported_endpoints": [
"/v1/chat/completions",
"/v1/completions",
"/v1/batch"
],
"supported_modalities": [
"text",
"image",
"audio",
"video"
],
"supported_output_modalities": [
"text"
],
"source": "https://ai.google.dev/gemini-api/docs/models#gemini-2.5-flash-preview",
"supports_parallel_function_calling": true,
"supports_web_search": true
},
"gemini/gemini-2.5-pro-preview-06-05": {
"max_tokens": 65535,
"max_input_tokens": 1048576,
"max_output_tokens": 65535,
"max_images_per_prompt": 3000,
"max_videos_per_prompt": 10,
"max_video_length": 1,
"max_audio_length_hours": 8.4,
"max_audio_per_prompt": 1,
"max_pdf_size_mb": 30,
"input_cost_per_audio_token": 7e-07,
"input_cost_per_token": 1.25e-06,
"input_cost_per_token_above_200k_tokens": 2.5e-06,
"output_cost_per_token": 1e-05,
"output_cost_per_token_above_200k_tokens": 1.5e-05,
"litellm_provider": "gemini",
"mode": "chat",
"rpm": 10000,
"tpm": 10000000,
"supports_system_messages": true,
"supports_function_calling": true,
"supports_vision": true,
"supports_response_schema": true,
"supports_audio_output": false,
"supports_tool_choice": true,
"supported_modalities": [
"text",
"image",
"audio",
"video"
],
"supported_output_modalities": [
"text"
],
"source": "https://ai.google.dev/gemini-api/docs/pricing#gemini-2.5-pro-preview",
"supports_web_search": true,
"supports_url_context": true
}
}