Skip to content
Merged
Show file tree
Hide file tree
Changes from 1 commit
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
54 changes: 45 additions & 9 deletions pricing_table.md
Original file line number Diff line number Diff line change
Expand Up @@ -151,7 +151,7 @@
| groq/llama2-70b-4096 | $0.7 | $0.8 | 4,096 | 4096 |
| groq/llama3-8b-8192 | $0.05 | $0.08 | 8,192 | 8192 |
| groq/llama3-70b-8192 | $0.59 | $0.79 | 8,192 | 8192 |
| groq/llama-3.1-8b-instant | $0.05 | $0.08 | 8,192 | 8192 |
| groq/llama-3.1-8b-instant | $0.05 | $0.08 | 128,000 | 8192 |
| groq/llama-3.1-70b-versatile | $0.59 | $0.79 | 8,192 | 8192 |
| groq/llama-3.1-405b-reasoning | $0.59 | $0.79 | 8,192 | 8192 |
| groq/mixtral-8x7b-32768 | $0.24 | $0.24 | 32,768 | 32768 |
Expand Down Expand Up @@ -714,7 +714,7 @@
| mistral/pixtral-large-2411 | $2 | $6 | 128,000 | 128000 |
| deepseek/deepseek-chat | $0.27 | $1.1 | 65,536 | 8192 |
| deepseek/deepseek-coder | $0.14 | $0.28 | 128,000 | 4096 |
| groq/llama-3.3-70b-versatile | $0.59 | $0.79 | 128,000 | 8192 |
| groq/llama-3.3-70b-versatile | $0.59 | $0.79 | 128,000 | 32768 |
| groq/llama-3.3-70b-specdec | $0.59 | $0.99 | 8,192 | 8192 |
| friendliai/meta-llama-3.1-8b-instruct | $0.1 | $0.1 | 8,192 | 8192 |
| friendliai/meta-llama-3.1-70b-instruct | $0.6 | $0.6 | 8,192 | 8192 |
Expand Down Expand Up @@ -746,12 +746,12 @@
| voyage/rerank-2 | $0.05 | $0 | 16,000 | 16000 |
| voyage/rerank-2-lite | $0.02 | $0 | 8,000 | 8000 |
| databricks/meta-llama-3.3-70b-instruct | $1 | $3 | 128,000 | 128000 |
| sambanova/Meta-Llama-3.1-8B-Instruct | $0.1 | $0.2 | 16,000 | 16000 |
| sambanova/Meta-Llama-3.1-8B-Instruct | $0.1 | $0.2 | 16,384 | 16384 |
| sambanova/Meta-Llama-3.1-70B-Instruct | $0.6 | $1.2 | 128,000 | 128000 |
| sambanova/Meta-Llama-3.1-405B-Instruct | $5 | $10 | 16,000 | 16000 |
| sambanova/Meta-Llama-3.2-1B-Instruct | $0.4 | $0.8 | 16,000 | 16000 |
| sambanova/Meta-Llama-3.2-3B-Instruct | $0.8 | $1.6 | 4,000 | 4000 |
| sambanova/Meta-Llama-3.3-70B-Instruct | $0.6 | $1.2 | 128,000 | 128000 |
| sambanova/Meta-Llama-3.1-405B-Instruct | $5 | $10 | 16,384 | 16384 |
| sambanova/Meta-Llama-3.2-1B-Instruct | $0.04 | $0.08 | 16,384 | 16384 |
| sambanova/Meta-Llama-3.2-3B-Instruct | $0.08 | $0.16 | 4,096 | 4096 |
| sambanova/Meta-Llama-3.3-70B-Instruct | $0.6 | $1.2 | 131,072 | 131072 |
| sambanova/Qwen2.5-Coder-32B-Instruct | $1.5 | $3 | 8,000 | 8000 |
| sambanova/Qwen2.5-72B-Instruct | $2 | $4 | 8,000 | 8000 |
| o3-mini | $1.1 | $4.4 | 200,000 | 100000 |
Expand All @@ -768,7 +768,7 @@
| xai/grok-2-1212 | $2 | $10 | 131,072 | 131072 |
| xai/grok-2 | $2 | $10 | 131,072 | 131072 |
| xai/grok-2-latest | $2 | $10 | 131,072 | 131072 |
| groq/deepseek-r1-distill-llama-70b | $0.75 | $0.99 | 131,072 | 131072 |
| groq/deepseek-r1-distill-llama-70b | $0.75 | $0.99 | 128,000 | 128000 |
| gemini/gemini-2.0-flash | $0.1 | $0.4 | 1,048,576 | 8192 |
| gemini-2.0-flash-001 | $0.15 | $0.6 | 1,048,576 | 8192 |
| gemini-2.0-flash-thinking-exp | $0 | $0 | 1,048,576 | 8192 |
Expand Down Expand Up @@ -1022,4 +1022,40 @@
| nscale/stabilityai/stable-diffusion-xl-base-1.0 | -- | -- | nan | nan |
| azure/gpt-4o-mini-tts | $2.5 | $10 | nan | nan |
| azure_ai/embed-v-4-0 | $0.12 | $0 | 128,000 | nan |
| eu.anthropic.claude-3-7-sonnet-20250219-v1:0 | $3 | $15 | 200,000 | 8192 |
| eu.anthropic.claude-3-7-sonnet-20250219-v1:0 | $3 | $15 | 200,000 | 8192 |
| xai/grok-3 | $3 | $15 | 131,072 | 131072 |
| groq/llama-guard-3-8b | $0.2 | $0.2 | 8,192 | 8192 |
| groq/meta-llama/llama-4-scout-17b-16e-instruct | $0.11 | $0.34 | 131,072 | 8192 |
| groq/meta-llama/llama-4-maverick-17b-128e-instruct | $0.2 | $0.6 | 131,072 | 8192 |
| groq/mistral-saba-24b | $0.79 | $0.79 | 32,000 | 32000 |
| groq/qwen-qwq-32b | $0.29 | $0.39 | 128,000 | 128000 |
| groq/playai-tts | -- | -- | 10,000 | 10000 |
| claude-opus-4-20250514 | $15 | $75 | 200,000 | 128000 |
| claude-sonnet-4-20250514 | $3 | $15 | 200,000 | 128000 |
| gemini/gemini-2.5-flash-preview-tts | $0.15 | $0.6 | 1,048,576 | 65535 |
| gemini/gemini-2.5-flash-preview-05-20 | $0.15 | $0.6 | 1,048,576 | 65535 |
| gemini-2.5-flash-preview-05-20 | $0.15 | $0.6 | 1,048,576 | 65535 |
| gemini-2.0-flash-preview-image-generation | $0.1 | $0.4 | 1,048,576 | 8192 |
| gemini-2.5-pro-preview-tts | $1.25 | $10 | 1,048,576 | 65535 |
| gemini/gemini-2.0-flash-preview-image-generation | $0.1 | $0.4 | 1,048,576 | 8192 |
| gemini/gemini-2.5-pro-preview-tts | $1.25 | $10 | 1,048,576 | 65535 |
| vertex_ai/claude-opus-4@20250514 | $15 | $75 | 200,000 | 128000 |
| vertex_ai/claude-sonnet-4@20250514 | $3 | $15 | 200,000 | 128000 |
| anthropic.claude-opus-4-20250514-v1:0 | $15 | $75 | 200,000 | 128000 |
| anthropic.claude-sonnet-4-20250514-v1:0 | $3 | $15 | 200,000 | 128000 |
| us.anthropic.claude-opus-4-20250514-v1:0 | $15 | $75 | 200,000 | 128000 |
| us.anthropic.claude-sonnet-4-20250514-v1:0 | $3 | $15 | 200,000 | 128000 |
| eu.anthropic.claude-opus-4-20250514-v1:0 | $15 | $75 | 200,000 | 128000 |
| eu.anthropic.claude-sonnet-4-20250514-v1:0 | $3 | $15 | 200,000 | 128000 |
| databricks/databricks-llama-4-maverick | $5 | $15 | 128,000 | 128000 |
| sambanova/Llama-4-Maverick-17B-128E-Instruct | $0.63 | $1.8 | 131,072 | 131072 |
| sambanova/Llama-4-Scout-17B-16E-Instruct | $0.4 | $0.7 | 8,192 | 8192 |
| sambanova/Meta-Llama-Guard-3-8B | $0.3 | $0.3 | 16,384 | 16384 |
| sambanova/Qwen3-32B | $0.4 | $0.8 | 8,192 | 8192 |
| sambanova/QwQ-32B | $0.5 | $1 | 16,384 | 16384 |
| sambanova/Qwen2-Audio-7B-Instruct | $0.5 | $100 | 4,096 | 4096 |
| sambanova/DeepSeek-R1-Distill-Llama-70B | $0.7 | $1.4 | 131,072 | 131072 |
| sambanova/DeepSeek-R1 | $5 | $7 | 32,768 | 32768 |
| sambanova/DeepSeek-V3-0324 | $3 | $4.5 | 32,768 | 32768 |
| featherless_ai/featherless-ai/Qwerky-72B | -- | -- | 32,768 | 4096 |
| featherless_ai/featherless-ai/Qwerky-QwQ-32B | -- | -- | 32,768 | 4096 |
Loading