vertex_ai-language-models, gemini, openrouter | ▶gemini-2.5-pro-exp-03-25 (4 endpoints) | 1048k | $0.00–$1.25 >200k: $0.00–$2.50 | $0.00–$10.00 >200k: $0.00–$15.00 | 83.8% | – | – | – |
vertex_ai-language-models | gemini-2.5-pro-exp-03-25ℹ️ | 1048k | $0.00 >200k: $0.00 | $0.00 >200k: $0.00 | 83.8% | – | – | – |
gemini | gemini/gemini-2.5-pro-exp-03-25ℹ️ gemini-2.5-pro-exp-03-25 | 1048k | $0.00 >200k: $0.00 | $0.00 >200k: $0.00 | 83.8% | – | – | – |
openrouter | google/gemini-2.5-pro-exp-03-25 gemini-2.5-pro-exp-03-25 | 1048k | $0.00 | $0.00 | 83.8% | – | – | – |
gemini | gemini/gemini-2.5-pro-preview-03-25ℹ️ gemini-2.5-pro-exp-03-25 | 1048k | $1.25 >200k: $2.50 | $10.00 >200k: $15.00 | 83.8% | – | – | – |
openai, azure, openrouter | ▶o3 (5 endpoints) | 200k | $10.00 | $40.00 | 81.8% | 97.8% | 83.9% | – |
openai | o3 | 200k | $10.00 | $40.00 | 81.8% | 97.8% | 83.9% | – |
azure | azure/o3 o3 | 200k | $10.00 | $40.00 | 81.8% | 97.8% | 83.9% | – |
openrouter | openai/o3 o3 | 200k | $10.00 | $40.00 | 81.8% | 97.8% | 83.9% | – |
openai | o3-2025-04-16 | 200k | $10.00 | $40.00 | 81.8% | 97.8% | 83.9% | – |
azure | azure/o3-2025-04-16 o3-2025-04-16 | 200k | $10.00 | $40.00 | 81.8% | 97.8% | 83.9% | – |
openai, azure, openrouter | ▶o4-mini (6 endpoints) | 200k | $1.10 | $4.40 | 79.6% | 97.8% | 81.7% | – |
openai | o4-mini | 200k | $1.10 | $4.40 | 79.6% | 97.8% | 81.7% | – |
azure | azure/o4-mini o4-mini | 200k | $1.10 | $4.40 | 79.6% | 97.8% | 81.7% | – |
openrouter | openai/o4-mini o4-mini | 200k | $1.10 | $4.40 | 79.6% | 97.8% | 81.7% | – |
openai | o4-mini-2025-04-16 | 200k | $1.10 | $4.40 | 79.6% | 97.8% | 81.7% | – |
azure | azure/o4-mini-2025-04-16 o4-mini-2025-04-16 | 200k | $1.10 | $4.40 | 79.6% | 97.8% | 81.7% | – |
openrouter | openai/o4-mini-high o4-mini-high | 200k | $1.10 | $4.40 | 79.6% | 97.8% | 81.7% | – |
openai, azure, openrouter | ▶o3-mini (8 endpoints) | 200k | $1.10–$1.21 | $4.40–$4.84 | 77% | 96.5% | 76.9% | – |
openai | o3-mini | 200k | $1.10 | $4.40 | 77% | 96.5% | 76.9% | – |
azure | azure/o3-mini o3-mini | 200k | $1.10 | $4.40 | 77% | 96.5% | 76.9% | – |
openrouter | openai/o3-mini o3-mini | 200k | $1.10 | $4.40 | 77% | 96.5% | 76.9% | – |
openai | o3-mini-2025-01-31 | 200k | $1.10 | $4.40 | 77% | 96.5% | 76.9% | – |
azure | azure/o3-mini-2025-01-31 o3-mini-2025-01-31 | 200k | $1.10 | $4.40 | 77% | 96.5% | 76.9% | – |
openrouter | openai/o3-mini-high o3-mini-high | 200k | $1.10 | $4.40 | 77% | 96.5% | 76.9% | – |
azure | azure/us/o3-mini-2025-01-31 o3-mini-2025-01-31 | 200k | $1.21 | $4.84 | 77% | 96.5% | 76.9% | – |
azure | azure/eu/o3-mini-2025-01-31 o3-mini-2025-01-31 | 200k | $1.21 | $4.84 | 77% | 96.5% | 76.9% | – |
openai, azure, openrouter | ▶o1 (7 endpoints) | 200k | $15.00–$16.50 | $60.00–$66.00 | 76.8% | 94.7% | 73.3% | – |
openai | o1 | 200k | $15.00 | $60.00 | 76.8% | 94.7% | 73.3% | – |
azure | azure/o1 o1 | 200k | $15.00 | $60.00 | 76.8% | 94.7% | 73.3% | – |
openrouter | openai/o1 o1 | 200k | $15.00 | $60.00 | 76.8% | 94.7% | 73.3% | – |
openai | o1-2024-12-17 | 200k | $15.00 | $60.00 | 76.8% | 94.7% | 73.3% | – |
azure | azure/o1-2024-12-17 o1-2024-12-17 | 200k | $15.00 | $60.00 | 76.8% | 94.7% | 73.3% | – |
azure | azure/us/o1-2024-12-17 o1-2024-12-17 | 200k | $16.50 | $66.00 | 76.8% | 94.7% | 73.3% | – |
azure | azure/eu/o1-2024-12-17 o1-2024-12-17 | 200k | $16.50 | $66.00 | 76.8% | 94.7% | 73.3% | – |
xai, openrouter | ▶grok-3-mini-beta (3 endpoints) | 131k | $0.30 | $0.50 | 76.3% | 90.9% | 77.8% | – |
xai | xai/grok-3-mini-betaℹ️ grok-3-mini-beta | 131k | $0.30 | $0.50 | 76.3% | 90.9% | 77.8% | – |
openrouter | x-ai/grok-3-mini-beta grok-3-mini-beta | 131k | $0.30 | $0.50 | 76.3% | 90.9% | 77.8% | – |
xai | grok-3-mini-beta | 131k | $0.30 | $0.50 | 76.3% | 90.9% | 77.8% | – |
xai, openrouter | ▶grok-3-beta (3 endpoints) | 131k | $3.00 | $15.00 | 75.8% | 88.7% | 55.6% | – |
xai | xai/grok-3-betaℹ️ grok-3-beta | 131k | $3.00 | $15.00 | 75.8% | 88.7% | 55.6% | – |
openrouter | x-ai/grok-3-beta grok-3-beta | 131k | $3.00 | $15.00 | 75.8% | 88.7% | 55.6% | – |
xai | grok-3-beta | 131k | $3.00 | $15.00 | 75.8% | 88.7% | 55.6% | – |
lambda, openrouter, azure_ai, bedrock_converse, fireworks_ai, deepseek, sambanova | ▶deepseek-r1 (8 endpoints) | 32k–164k | $0.00–$5.00 | $0.00–$8.00 | 71.7% | 93.1% | 53.3% | – |
lambda | deepseek-r1-671b deepseek-r1 | 164k | $0.54 | $2.18 | 71.7% | 93.1% | 53.3% | – |
openrouter | deepseek/deepseek-r1:free deepseek-r1 | 163k | $0.00 | $0.00 | 71.7% | 93.1% | 53.3% | – |
openrouter | deepseek/deepseek-r1 deepseek-r1 | 163k | $0.50 | $2.18 | 71.7% | 93.1% | 53.3% | – |
azure_ai | azure_ai/deepseek-r1ℹ️ deepseek-r1 | 128k | $1.35 | $5.40 | 71.7% | 93.1% | 53.3% | – |
bedrock_converse | us.deepseek.r1-v1:0 deepseek-r1 | 128k | $1.35 | $5.40 | 71.7% | 93.1% | 53.3% | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/deepseek-r1ℹ️ deepseek-r1 | 128k | $3.00 | $8.00 | 71.7% | 93.1% | 53.3% | – |
deepseek | deepseek/deepseek-reasoner deepseek-r1 | 65k | $0.55 | $2.19 | 71.7% | 93.1% | 53.3% | – |
sambanova | sambanova/DeepSeek-R1ℹ️ deepseek-r1 | 32k | $5.00 | $7.00 | 71.7% | 93.1% | 53.3% | – |
openai, azure, openrouter | ▶gpt-4.5-preview (4 endpoints) | 128k | $75.00 | $150.00 | 68.7% | 78.6% | 37.8% | – |
openai | gpt-4.5-preview | 128k | $75.00 | $150.00 | 68.7% | 78.6% | 37.8% | – |
azure | azure/gpt-4.5-preview gpt-4.5-preview | 128k | $75.00 | $150.00 | 68.7% | 78.6% | 37.8% | – |
openrouter | openai/gpt-4.5-preview gpt-4.5-preview | 128k | $75.00 | $150.00 | 68.7% | 78.6% | 37.8% | – |
openai | gpt-4.5-preview-2025-02-27 | 128k | $75.00 | $150.00 | 68.7% | 78.6% | 37.8% | – |
openrouter, fireworks_ai, azure_ai, deepseek, sambanova | ▶deepseek-v3 (8 endpoints) | 32k–163k | $0.00–$3.00 | $0.00–$4.56 | 67.6% | 75.5% | 37.8% | – |
openrouter | deepseek/deepseek-chat-v3-0324:free deepseek-v3 | 163k | $0.00 | $0.00 | 56.5% | 64.9% | 15.8% | – |
openrouter | deepseek/deepseek-chat-v3-0324 deepseek-v3 | 163k | $0.30 | $0.88 | 56.5% | 64.9% | 15.8% | – |
openrouter | deepseek/deepseek-chat deepseek-v3 | 163k | $0.38 | $0.89 | 56.5% | 64.9% | 15.8% | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/deepseek-v3ℹ️ deepseek-v3 | 128k | $0.90 | $0.90 | 56.5% | 64.9% | 15.8% | – |
azure_ai | azure_ai/deepseek-v3-0324ℹ️ deepseek-v3-0324 | 128k | $1.14 | $4.56 | 67.6% | 75.5% | 37.8% | – |
azure_ai | azure_ai/deepseek-v3ℹ️ deepseek-v3 | 128k | $1.14 | $4.56 | 56.5% | 64.9% | 15.8% | – |
deepseek | deepseek/deepseek-chat deepseek-v3 | 65k | $0.27 | $1.10 | 56.5% | 64.9% | 15.8% | – |
sambanova | sambanova/DeepSeek-V3-0324ℹ️ deepseek-v3-0324 | 32k | $3.00 | $4.50 | 67.6% | 75.5% | 37.8% | – |
openrouter, lambda | ▶llama-4-maverick (3 endpoints) | 128k–1048k | $0.00–$0.20 | $0.00–$0.60 | 67% | 73% | 20.6% | – |
openrouter | meta-llama/llama-4-maverick llama-4-maverick | 1048k | $0.16 | $0.60 | 67% | 73% | 20.6% | – |
lambda | llama-4-maverick-17b-128e-instruct-fp8 llama-4-maverick | 1000k | $0.20 | $0.60 | 67% | 73% | 20.6% | – |
openrouter | meta-llama/llama-4-maverick:free llama-4-maverick | 128k | $0.00 | $0.00 | 67% | 73% | 20.6% | – |
openai, azure, openrouter | ▶gpt-4.1 (5 endpoints) | 1047k | $2.00 | $8.00 | 66.9% | 83% | 38.3% | – |
openai | gpt-4.1 | 1047k | $2.00 | $8.00 | 66.9% | 83% | 38.3% | – |
azure | azure/gpt-4.1 gpt-4.1 | 1047k | $2.00 | $8.00 | 66.9% | 83% | 38.3% | – |
openrouter | openai/gpt-4.1 gpt-4.1 | 1047k | $2.00 | $8.00 | 66.9% | 83% | 38.3% | – |
openai | gpt-4.1-2025-04-14 | 1047k | $2.00 | $8.00 | 66.9% | 83% | 38.3% | – |
azure | azure/gpt-4.1-2025-04-14 gpt-4.1-2025-04-14 | 1047k | $2.00 | $8.00 | 66.9% | 83% | 38.3% | – |
openrouter, anthropic, vertex_ai-anthropic_models, bedrock_converse, bedrock | ▶claude-3.7-sonnet (8 endpoints) | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
openrouter | anthropic/claude-3.7-sonnet claude-3.7-sonnet | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
anthropic | claude-3-7-sonnet-20250219 | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-7-sonnet@20250219 claude-3-7-sonnet@20250219 | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
bedrock_converse | anthropic.claude-3-7-sonnet-20250219-v1:0 claude-3-7-sonnet-20250219-v1.0 | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
bedrock_converse | us.anthropic.claude-3-7-sonnet-20250219-v1:0 claude-3-7-sonnet-20250219-v1.0 | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
bedrock | eu.anthropic.claude-3-7-sonnet-20250219-v1:0 claude-3-7-sonnet-20250219-v1.0 | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
anthropic | claude-3-7-sonnet-latest | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
openrouter | anthropic/claude-3.7-sonnet:thinking claude-3.7-sonnet:thinking | 200k | $3.00 | $15.00 | 66% | 68.2% | 21.9% | – |
openai, azure, openrouter | ▶gpt-4.1-mini (5 endpoints) | 1047k | $0.40 | $1.60 | 65.8% | 87.3% | 44.7% | – |
openai | gpt-4.1-mini | 1047k | $0.40 | $1.60 | 65.8% | 87.3% | 44.7% | – |
azure | azure/gpt-4.1-mini gpt-4.1-mini | 1047k | $0.40 | $1.60 | 65.8% | 87.3% | 44.7% | – |
openrouter | openai/gpt-4.1-mini gpt-4.1-mini | 1047k | $0.40 | $1.60 | 65.8% | 87.3% | 44.7% | – |
openai | gpt-4.1-mini-2025-04-14 | 1047k | $0.40 | $1.60 | 65.8% | 87.3% | 44.7% | – |
azure | azure/gpt-4.1-mini-2025-04-14 gpt-4.1-mini-2025-04-14 | 1047k | $0.40 | $1.60 | 65.8% | 87.3% | 44.7% | – |
gemini, openrouter, vertex_ai-language-models | ▶gemini-2.0-flash-001 (3 endpoints) | 1048k | $0.10–$0.15 | $0.40–$0.60 | 64.1% | 82.2% | 31.1% | – |
gemini | gemini/gemini-2.0-flash-001ℹ️ gemini-2.0-flash-001 | 1048k | $0.10 | $0.40 | 64.1% | 82.2% | 31.1% | – |
openrouter | google/gemini-2.0-flash-001 gemini-2.0-flash-001 | 1048k | $0.10 | $0.40 | 64.1% | 82.2% | 31.1% | – |
vertex_ai-language-models | gemini-2.0-flash-001ℹ️ | 1048k | $0.15 | $0.60 | 64.1% | 82.2% | 31.1% | – |
openai, openrouter, azure | ▶o1-mini (8 endpoints) | 128k | $1.10–$3.00 | $4.40–$12.00 | 62.4% | 89.2% | 46.9% | – |
openai | o1-mini | 128k | $1.10 | $4.40 | 62.4% | 89.2% | 46.9% | – |
openrouter | openai/o1-mini o1-mini | 128k | $1.10 | $4.40 | 62.4% | 89.2% | 46.9% | – |
azure | azure/o1-mini-2024-09-12 o1-mini-2024-09-12 | 128k | $1.10 | $4.40 | 62.4% | 89.2% | 46.9% | – |
openrouter | openai/o1-mini-2024-09-12 o1-mini-2024-09-12 | 128k | $1.10 | $4.40 | 62.4% | 89.2% | 46.9% | – |
azure | azure/o1-mini o1-mini | 128k | $1.21 | $4.84 | 62.4% | 89.2% | 46.9% | – |
azure | azure/us/o1-mini-2024-09-12 o1-mini-2024-09-12 | 128k | $1.21 | $4.84 | 62.4% | 89.2% | 46.9% | – |
azure | azure/eu/o1-mini-2024-09-12 o1-mini-2024-09-12 | 128k | $1.21 | $4.84 | 62.4% | 89.2% | 46.9% | – |
openai | o1-mini-2024-09-12 | 128k | $3.00 | $12.00 | 62.4% | 89.2% | 46.9% | – |
vertex_ai-language-models, gemini | ▶gemini-1.5-pro-002 (2 endpoints) | 2097k | $1.25–$3.50 >128k: $2.50–$7.00 | $5.00–$10.50 >128k: $10.00–$21.00 | 57.2% | 70.4% | 23.1% | – |
vertex_ai-language-models | gemini-1.5-pro-002ℹ️ | 2097k | $1.25 >128k: $2.50 | $5.00 >128k: $10.00 | 57.2% | 70.4% | 23.1% | – |
gemini | gemini/gemini-1.5-pro-002ℹ️ gemini-1.5-pro-002 | 2097k | $3.50 >128k: $7.00 | $10.50 >128k: $21.00 | 57.2% | 70.4% | 23.1% | – |
vertex_ai-language-models, gemini | ▶gemini-2.0-flash-thinking-exp (4 endpoints) | 1048k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | 57.1% | – | 57.8% | – |
vertex_ai-language-models | gemini-2.0-flash-thinking-expℹ️ | 1048k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | 57.1% | – | 57.8% | – |
gemini | gemini/gemini-2.0-flash-thinking-expℹ️ gemini-2.0-flash-thinking-exp | 1048k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | 57.1% | – | 57.8% | – |
vertex_ai-language-models | gemini-2.0-flash-thinking-exp-01-21ℹ️ | 1048k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | 57.1% | – | 57.8% | – |
gemini | gemini/gemini-2.0-flash-thinking-exp-01-21ℹ️ gemini-2.0-flash-thinking-exp-01-21 | 1048k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | 57.1% | – | 57.8% | – |
openrouter, azure_ai | ▶phi-4 (2 endpoints) | 16k | $0.07–$0.125 | $0.14–$0.50 | 56.1% | 64.9% | 13.8% | – |
openrouter | microsoft/phi-4 phi-4 | 16k | $0.07 | $0.14 | 56.1% | 64.9% | 13.8% | – |
azure_ai | azure_ai/Phi-4ℹ️ phi-4 | 16k | $0.125 | $0.50 | 56.1% | 64.9% | 13.8% | – |
openrouter, sambanova, groq, nscale | ▶deepseek-r1-distill-llama-70b (5 endpoints) | 8k–131k | $0.00–$0.75 | $0.00–$1.40 | 55.7% | 89.9% | 51.4% | – |
openrouter | deepseek/deepseek-r1-distill-llama-70b deepseek-r1-distill-llama-70b | 131k | $0.10 | $0.40 | 55.7% | 89.9% | 51.4% | – |
sambanova | sambanova/DeepSeek-R1-Distill-Llama-70Bℹ️ deepseek-r1-distill-llama-70b | 131k | $0.70 | $1.40 | 55.7% | 89.9% | 51.4% | – |
groq | groq/deepseek-r1-distill-llama-70b deepseek-r1-distill-llama-70b | 128k | $0.75 | $0.99 | 55.7% | 89.9% | 51.4% | – |
openrouter | deepseek/deepseek-r1-distill-llama-70b:free deepseek-r1-distill-llama-70b | 8k | $0.00 | $0.00 | 55.7% | 89.9% | 51.4% | – |
nscale | nscale/deepseek-ai/DeepSeek-R1-Distill-Llama-70Bℹ️ deepseek-r1-distill-llama-70b | – | $0.375 | $0.375 | 55.7% | 89.9% | 51.4% | – |
vertex_ai-anthropic_models, openrouter, anthropic, bedrock | ▶claude-3-5-sonnet (11 endpoints) | 200k | $3.00 | $15.00 | 55.3% | 56.9% | 8.47% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-5-sonnet claude-3-5-sonnet | 200k | $3.00 | $15.00 | 55.3% | 56.9% | 8.47% | – |
openrouter | anthropic/claude-3.5-sonnet claude-3.5-sonnet | 200k | $3.00 | $15.00 | 55.3% | 56.9% | 8.47% | – |
anthropic | claude-3-5-sonnet-20241022 | 200k | $3.00 | $15.00 | 55.3% | 56.9% | 8.47% | – |
anthropic | claude-3-5-sonnet-latest | 200k | $3.00 | $15.00 | 55.3% | 56.9% | 8.47% | – |
anthropic | claude-3-5-sonnet-20240620 | 200k | $3.00 | $15.00 | 54% | 51.7% | 6.53% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-5-sonnet@20240620 claude-3-5-sonnet@20240620 | 200k | $3.00 | $15.00 | 54% | 51.7% | 6.53% | – |
openrouter | anthropic/claude-3.5-sonnet-20240620 claude-3.5-sonnet-20240620 | 200k | $3.00 | $15.00 | 54% | 51.7% | 6.53% | – |
bedrock | bedrock/invoke/anthropic.claude-3-5-sonnet-20240620-v1:0 claude-3-5-sonnet-20240620-v1.0 | 200k | $3.00 | $15.00 | 54% | 51.7% | 6.53% | – |
bedrock | anthropic.claude-3-5-sonnet-20240620-v1:0 claude-3-5-sonnet-20240620-v1.0 | 200k | $3.00 | $15.00 | 54% | 51.7% | 6.53% | – |
bedrock | us.anthropic.claude-3-5-sonnet-20240620-v1:0 claude-3-5-sonnet-20240620-v1.0 | 200k | $3.00 | $15.00 | 54% | 51.7% | 6.53% | – |
bedrock | eu.anthropic.claude-3-5-sonnet-20240620-v1:0 claude-3-5-sonnet-20240620-v1.0 | 200k | $3.00 | $15.00 | 54% | 51.7% | 6.53% | – |
xai, openrouter | ▶grok-2 (4 endpoints) | 131k | $2.00 | $10.00 | 53.8% | 63.5% | 11.5% | – |
xai | xai/grok-2 grok-2 | 131k | $2.00 | $10.00 | 53.8% | 63.5% | 11.5% | – |
xai | xai/grok-2-1212 grok-2-1212 | 131k | $2.00 | $10.00 | 53.8% | 63.5% | 11.5% | – |
openrouter | x-ai/grok-2-1212 grok-2-1212 | 131k | $2.00 | $10.00 | 53.8% | 63.5% | 11.5% | – |
xai | xai/grok-2-latest grok-2-latest | 131k | $2.00 | $10.00 | 53.8% | 63.5% | 11.5% | – |
openrouter, lambda | ▶llama-4-scout (3 endpoints) | 256k–1048k | $0.00–$0.10 | $0.00–$0.30 | 51.8% | 62.3% | 7.78% | – |
openrouter | meta-llama/llama-4-scout llama-4-scout | 1048k | $0.08 | $0.30 | 51.8% | 62.3% | 7.78% | – |
lambda | llama-4-scout-17b-16e-instruct llama-4-scout | 1000k | $0.10 | $0.30 | 51.8% | 62.3% | 7.78% | – |
openrouter | meta-llama/llama-4-scout:free llama-4-scout | 256k | $0.00 | $0.00 | 51.8% | 62.3% | 7.78% | – |
openrouter, mistral, vertex_ai-mistral_models, azure_ai, bedrock, azure | ▶mistral-large (19 endpoints) | 32k–131k | $2.00–$10.40 | $6.00–$31.20 | 51.3% | 50.3% | 8.47% | – |
openrouter | mistralai/mistral-large-2411 mistral-large-2411 | 131k | $2.00 | $6.00 | 51.3% | 50.3% | 7.78% | – |
openrouter | mistralai/mistral-large-2407 mistral-large-2407 | 131k | $2.00 | $6.00 | 49% | 44.8% | 8.47% | – |
openrouter | mistralai/mistral-large mistral-large | 128k | $2.00 | $6.00 | 51.3% | 50.3% | 8.47% | – |
mistral | mistral/mistral-large-2411 mistral-large-2411 | 128k | $2.00 | $6.00 | 51.3% | 50.3% | 7.78% | – |
vertex_ai-mistral_models | vertex_ai/mistral-large-2411 mistral-large-2411 | 128k | $2.00 | $6.00 | 51.3% | 50.3% | 7.78% | – |
azure_ai | azure_ai/mistral-large-latestℹ️ mistral-large-latest | 128k | $2.00 | $6.00 | 51.3% | 50.3% | 8.47% | – |
mistral | mistral/mistral-large-latest mistral-large-latest | 128k | $2.00 | $6.00 | 51.3% | 50.3% | 8.47% | – |
azure_ai | azure_ai/mistral-large-2407ℹ️ mistral-large-2407 | 128k | $2.00 | $6.00 | 49% | 44.8% | 8.47% | – |
vertex_ai-mistral_models | vertex_ai/mistral-large@2407 mistral-large@2407 | 128k | $2.00 | $6.00 | 49% | 44.8% | 8.47% | – |
mistral | mistral/mistral-large-2407 mistral-large-2407 | 128k | $3.00 | $9.00 | 49% | 44.8% | 8.47% | – |
bedrock | mistral.mistral-large-2407-v1:0 mistral-large-2407-v1.0 | 128k | $3.00 | $9.00 | 49% | 44.8% | 8.47% | – |
azure_ai | azure_ai/mistral-large mistral-large | 32k | $4.00 | $12.00 | 51.3% | 50.3% | 8.47% | – |
mistral | mistral/mistral-large-2402 mistral-large-2402 | 32k | $4.00 | $12.00 | 38.8% | 24.5% | 1.94% | – |
azure | azure/mistral-large-latest mistral-large-latest | 32k | $8.00 | $24.00 | 51.3% | 50.3% | 8.47% | – |
azure | azure/mistral-large-2402 mistral-large-2402 | 32k | $8.00 | $24.00 | 38.8% | 24.5% | 1.94% | – |
bedrock | mistral.mistral-large-2402-v1:0 mistral-large-2402-v1.0 | 32k | $8.00 | $24.00 | 38.8% | 24.5% | 1.94% | – |
bedrock | bedrock/us-east-1/mistral.mistral-large-2402-v1:0 mistral-large-2402-v1.0 | 32k | $8.00 | $24.00 | 38.8% | 24.5% | 1.94% | – |
bedrock | bedrock/us-west-2/mistral.mistral-large-2402-v1:0 mistral-large-2402-v1.0 | 32k | $8.00 | $24.00 | 38.8% | 24.5% | 1.94% | – |
bedrock | bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 mistral-large-2402-v1.0 | 32k | $10.40 | $31.20 | 38.8% | 24.5% | 1.94% | – |
bedrock, openrouter | ▶llama-3.1-405b-instruct (3 endpoints) | 32k–128k | $0.80–$5.32 | $0.80–$16.00 | 50.9% | 49.8% | 9.72% | – |
bedrock | meta.llama3-1-405b-instruct-v1:0 llama3-1-405b-instruct-v1.0 | 128k | $5.32 | $16.00 | 50.9% | 49.8% | 9.72% | – |
bedrock | us.meta.llama3-1-405b-instruct-v1:0 llama3-1-405b-instruct-v1.0 | 128k | $5.32 | $16.00 | 50.9% | 49.8% | 9.72% | – |
openrouter | meta-llama/llama-3.1-405b-instruct llama-3.1-405b-instruct | 32k | $0.80 | $0.80 | 50.9% | 49.8% | 9.72% | – |
openai, azure, openrouter | ▶o1-preview (8 endpoints) | 128k | $15.00–$16.50 | $60.00–$66.00 | 50.3% | 81.6% | 31.1% | – |
openai | o1-preview | 128k | $15.00 | $60.00 | 50.3% | 81.6% | 31.1% | – |
azure | azure/o1-preview o1-preview | 128k | $15.00 | $60.00 | 50.3% | 81.6% | 31.1% | – |
openrouter | openai/o1-preview o1-preview | 128k | $15.00 | $60.00 | 50.3% | 81.6% | 31.1% | – |
openai | o1-preview-2024-09-12 | 128k | $15.00 | $60.00 | 50.3% | 81.6% | 31.1% | – |
azure | azure/o1-preview-2024-09-12 o1-preview-2024-09-12 | 128k | $15.00 | $60.00 | 50.3% | 81.6% | 31.1% | – |
openrouter | openai/o1-preview-2024-09-12 o1-preview-2024-09-12 | 128k | $15.00 | $60.00 | 50.3% | 81.6% | 31.1% | – |
azure | azure/us/o1-preview-2024-09-12 o1-preview-2024-09-12 | 128k | $16.50 | $66.00 | 50.3% | 81.6% | 31.1% | – |
azure | azure/eu/o1-preview-2024-09-12 o1-preview-2024-09-12 | 128k | $16.50 | $66.00 | 50.3% | 81.6% | 31.1% | – |
openai, azure, openrouter | ▶gpt-4o (20 endpoints) | 128k | $2.50–$5.00 | $10.00–$15.00 | 49.2% | 53.3% | 6.39% | – |
openai | gpt-4o | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
azure | azure/gpt-4o gpt-4o | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
openrouter | openai/gpt-4o gpt-4o | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
openai | gpt-4o-2024-08-06 | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
azure | azure/gpt-4o-2024-08-06 gpt-4o-2024-08-06 | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
azure | azure/global/gpt-4o-2024-08-06 gpt-4o-2024-08-06 | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
azure | azure/global-standard/gpt-4o-2024-08-06 gpt-4o-2024-08-06 | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
openrouter | openai/gpt-4o-2024-08-06 gpt-4o-2024-08-06 | 128k | $2.50 | $10.00 | 49.2% | 53.3% | 6.39% | – |
openai | gpt-4o-2024-11-20 | 128k | $2.50 | $10.00 | 47.9% | 49.8% | 6.25% | – |
azure | azure/global/gpt-4o-2024-11-20 gpt-4o-2024-11-20 | 128k | $2.50 | $10.00 | 47.9% | 49.8% | 6.25% | – |
azure | azure/global-standard/gpt-4o-2024-11-20 gpt-4o-2024-11-20 | 128k | $2.50 | $10.00 | 47.9% | 49.8% | 6.25% | – |
openrouter | openai/gpt-4o-2024-11-20 gpt-4o-2024-11-20 | 128k | $2.50 | $10.00 | 47.9% | 49.8% | 6.25% | – |
azure | azure/us/gpt-4o-2024-08-06 gpt-4o-2024-08-06 | 128k | $2.75 | $11.00 | 49.2% | 53.3% | 6.39% | – |
azure | azure/eu/gpt-4o-2024-08-06 gpt-4o-2024-08-06 | 128k | $2.75 | $11.00 | 49.2% | 53.3% | 6.39% | – |
azure | azure/gpt-4o-2024-11-20 gpt-4o-2024-11-20 | 128k | $2.75 | $11.00 | 47.9% | 49.8% | 6.25% | – |
azure | azure/us/gpt-4o-2024-11-20 gpt-4o-2024-11-20 | 128k | $2.75 | $11.00 | 47.9% | 49.8% | 6.25% | – |
azure | azure/eu/gpt-4o-2024-11-20 gpt-4o-2024-11-20 | 128k | $2.75 | $11.00 | 47.9% | 49.8% | 6.25% | – |
openai | gpt-4o-2024-05-13 | 128k | $5.00 | $15.00 | 48.9% | 51% | 6.25% | – |
azure | azure/gpt-4o-2024-05-13 gpt-4o-2024-05-13 | 128k | $5.00 | $15.00 | 48.9% | 51% | 6.25% | – |
openrouter | openai/gpt-4o-2024-05-13 gpt-4o-2024-05-13 | 128k | $5.00 | $15.00 | 48.9% | 51% | 6.25% | – |
openrouter | ▶qwen-2.5-72b-instruct (2 endpoints) | 32k | $0.00–$0.12 | $0.00–$0.39 | 49.1% | 63.2% | 8.06% | – |
openrouter | qwen/qwen-2.5-72b-instruct:free qwen-2.5-72b-instruct | 32k | $0.00 | $0.00 | 49.1% | 63.2% | 8.06% | – |
openrouter | qwen/qwen-2.5-72b-instruct qwen-2.5-72b-instruct | 32k | $0.12 | $0.39 | 49.1% | 63.2% | 8.06% | – |
openai, azure, openrouter | ▶gpt-4.1-nano (5 endpoints) | 1047k | $0.10 | $0.40 | 48.9% | 70% | 28.9% | – |
openai | gpt-4.1-nano | 1047k | $0.10 | $0.40 | 48.9% | 70% | 28.9% | – |
azure | azure/gpt-4.1-nano gpt-4.1-nano | 1047k | $0.10 | $0.40 | 48.9% | 70% | 28.9% | – |
openrouter | openai/gpt-4.1-nano gpt-4.1-nano | 1047k | $0.10 | $0.40 | 48.9% | 70% | 28.9% | – |
openai | gpt-4.1-nano-2025-04-14 | 1047k | $0.10 | $0.40 | 48.9% | 70% | 28.9% | – |
azure | azure/gpt-4.1-nano-2025-04-14 gpt-4.1-nano-2025-04-14 | 1047k | $0.10 | $0.40 | 48.9% | 70% | 28.9% | – |
gemini, openrouter | ▶gemma-3-27b-it (3 endpoints) | 96k–131k | $0.00–$0.10 >128k: $0.00 | $0.00–$0.20 >128k: $0.00 | 48.9% | 74% | 19.7% | – |
gemini | gemini/gemma-3-27b-itℹ️ gemma-3-27b-it | 131k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | 48.9% | 74% | 19.7% | – |
openrouter | google/gemma-3-27b-it gemma-3-27b-it | 131k | $0.10 | $0.20 | 48.9% | 74% | 19.7% | – |
openrouter | google/gemma-3-27b-it:free gemma-3-27b-it | 96k | $0.00 | $0.00 | 48.9% | 74% | 19.7% | – |
azure_ai, vertex_ai-mistral_models, openrouter, mistral, bedrock | ▶mistral-small (7 endpoints) | 32k–128k | $0.10–$1.00 | $0.30–$3.00 | 47.5% | 46.8% | 5.83% | – |
azure_ai | azure_ai/mistral-small-2503 mistral-small-2503 | 128k | $1.00 | $3.00 | 47.5% | 46.8% | 5.83% | – |
vertex_ai-mistral_models | vertex_ai/mistral-small-2503 mistral-small-2503 | 128k | $1.00 | $3.00 | 47.5% | 46.8% | 5.83% | – |
openrouter | mistralai/mistral-small mistral-small | 32k | $0.20 | $0.60 | 47.5% | 46.8% | 5.83% | – |
mistral | mistral/mistral-small mistral-small | 32k | $0.10 | $0.30 | 47.5% | 46.8% | 5.83% | – |
mistral | mistral/mistral-small-latest mistral-small-latest | 32k | $0.10 | $0.30 | 47.5% | 46.8% | 5.83% | – |
azure_ai | azure_ai/mistral-small mistral-small | 32k | $1.00 | $3.00 | 47.5% | 46.8% | 5.83% | – |
bedrock | mistral.mistral-small-2402-v1:0 mistral-small-2402-v1.0 | 32k | $1.00 | $3.00 | – | – | – | – |
vertex_ai-language-models, gemini | ▶gemini-1.5-flash-002 (2 endpoints) | 1048k | $0.075 >128k: $0.15–$1.00 | $0.30 >128k: $0.60 | 47.3% | 61.9% | 16.3% | – |
vertex_ai-language-models | gemini-1.5-flash-002ℹ️ | 1048k | $0.075 >128k: $1.00 | $0.30 >128k: $0.60 | 47.3% | 61.9% | 16.3% | – |
gemini | gemini/gemini-1.5-flash-002ℹ️ gemini-1.5-flash-002 | 1048k | $0.075 >128k: $0.15 | $0.30 >128k: $0.60 | 47.3% | 61.9% | 16.3% | – |
openrouter, nscale | ▶deepseek-r1-distill-qwen-14b (3 endpoints) | 64k | $0.00–$0.15 | $0.00–$0.15 | 44.7% | 87.1% | – | – |
openrouter | deepseek/deepseek-r1-distill-qwen-14b:free deepseek-r1-distill-qwen-14b | 64k | $0.00 | $0.00 | 44.7% | 87.1% | – | – |
openrouter | deepseek/deepseek-r1-distill-qwen-14b deepseek-r1-distill-qwen-14b | 64k | $0.15 | $0.15 | 44.7% | 87.1% | – | – |
nscale | nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-14Bℹ️ deepseek-r1-distill-qwen-14b | – | $0.07 | $0.07 | 44.7% | 87.1% | – | – |
openai, azure, openrouter | ▶gpt-4o-mini (9 endpoints) | 128k | $0.15–$0.165 | $0.60–$0.66 | 37.7% | 52.6% | – | – |
openai | gpt-4o-mini | 128k | $0.15 | $0.60 | 37.7% | 52.6% | – | – |
azure | azure/global-standard/gpt-4o-mini gpt-4o-mini | 128k | $0.15 | $0.60 | 37.7% | 52.6% | – | – |
openrouter | openai/gpt-4o-mini gpt-4o-mini | 128k | $0.15 | $0.60 | 37.7% | 52.6% | – | – |
openai | gpt-4o-mini-2024-07-18 | 128k | $0.15 | $0.60 | 37.7% | 52.6% | – | – |
openrouter | openai/gpt-4o-mini-2024-07-18 gpt-4o-mini-2024-07-18 | 128k | $0.15 | $0.60 | 37.7% | 52.6% | – | – |
azure | azure/gpt-4o-mini gpt-4o-mini | 128k | $0.165 | $0.66 | 37.7% | 52.6% | – | – |
azure | azure/gpt-4o-mini-2024-07-18 gpt-4o-mini-2024-07-18 | 128k | $0.165 | $0.66 | 37.7% | 52.6% | – | – |
azure | azure/us/gpt-4o-mini-2024-07-18 gpt-4o-mini-2024-07-18 | 128k | $0.165 | $0.66 | 37.7% | 52.6% | – | – |
azure | azure/eu/gpt-4o-mini-2024-07-18 gpt-4o-mini-2024-07-18 | 128k | $0.165 | $0.66 | 37.7% | 52.6% | – | – |
openai, openrouter | ▶chatgpt-4o-latest (2 endpoints) | 128k | $5.00 | $15.00 | – | – | – | – |
openai | chatgpt-4o-latest | 128k | $5.00 | $15.00 | – | – | – | – |
openrouter | openai/chatgpt-4o-latest chatgpt-4o-latest | 128k | $5.00 | $15.00 | – | – | – | – |
openrouter, vertex_ai-mistral_models, codestral, mistral | ▶codestral-latest (7 endpoints) | 32k–262k | $0.00–$1.00 | $0.00–$3.00 | – | – | – | – |
openrouter | mistralai/codestral-2501 codestral-2501 | 262k | $0.30 | $0.90 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/codestral@2405 codestral@2405 | 128k | $0.20 | $0.60 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/codestral-2501 codestral-2501 | 128k | $0.20 | $0.60 | – | – | – | – |
codestral | codestral/codestral-2405ℹ️ codestral-2405 | 32k | $0.00 | $0.00 | – | – | – | – |
codestral | codestral/codestral-latestℹ️ codestral-latest | 32k | $0.00 | $0.00 | – | – | – | – |
mistral | mistral/codestral-2405 codestral-2405 | 32k | $1.00 | $3.00 | – | – | – | – |
mistral | mistral/codestral-latest codestral-latest | 32k | $1.00 | $3.00 | – | – | – | – |
vertex_ai-language-models, gemini | ▶gemini-2.0-flash (2 endpoints) | 1048k | $0.10 | $0.40 | – | – | – | – |
vertex_ai-language-models | gemini-2.0-flashℹ️ | 1048k | $0.10 | $0.40 | – | – | – | – |
gemini | gemini/gemini-2.0-flashℹ️ gemini-2.0-flash | 1048k | $0.10 | $0.40 | – | – | – | – |
vertex_ai-language-models, gemini | ▶gemini-2.0-flash-lite (2 endpoints) | 1048k | $0.075 | $0.30 | – | – | – | – |
vertex_ai-language-models | gemini-2.0-flash-liteℹ️ | 1048k | $0.075 | $0.30 | – | – | – | – |
gemini | gemini/gemini-2.0-flash-liteℹ️ gemini-2.0-flash-lite | 1048k | $0.075 | $0.30 | – | – | – | – |
openrouter, gemini, vertex_ai-language-models | ▶gemini-2.5-flash-preview (4 endpoints) | 1048k | $0.15 | $0.60–$3.50 | – | – | 73.1% | – |
openrouter | google/gemini-2.5-flash-preview gemini-2.5-flash-preview | 1048k | $0.15 | $0.60 | – | – | 73.1% | – |
gemini | gemini/gemini-2.5-flash-preview-04-17ℹ️ gemini-2.5-flash-preview-04-17 | 1048k | $0.15 | $0.60 | – | – | 73.1% | – |
vertex_ai-language-models | gemini-2.5-flash-preview-04-17ℹ️ | 1048k | $0.15 | $0.60 | – | – | 73.1% | – |
openrouter | google/gemini-2.5-flash-preview:thinking gemini-2.5-flash-preview:thinking | 1048k | $0.15 | $3.50 | – | – | 73.1% | – |
openrouter, vertex_ai-language-models, gemini | ▶gemini-2.5-pro-preview (4 endpoints) | 1048k | $1.25 >200k: $2.50 | $10.00 >200k: $15.00 | – | 95.9% | – | – |
openrouter | google/gemini-2.5-pro-preview gemini-2.5-pro-preview | 1048k | $1.25 | $10.00 | – | 95.9% | – | – |
vertex_ai-language-models | gemini-2.5-pro-preview-03-25ℹ️ | 1048k | $1.25 >200k: $2.50 | $10.00 >200k: $15.00 | – | – | – | – |
vertex_ai-language-models | gemini-2.5-pro-preview-05-06ℹ️ | 1048k | $1.25 >200k: $2.50 | $10.00 >200k: $15.00 | – | 95.9% | – | – |
gemini | gemini/gemini-2.5-pro-preview-05-06ℹ️ gemini-2.5-pro-preview-05-06 | 1048k | $1.25 >200k: $2.50 | $10.00 >200k: $15.00 | – | 95.9% | – | – |
openrouter | openai/o1-pro o1-pro | 200k | $150.00 | $600.00 | – | – | – | – |
openrouter, azure_ai, bedrock_converse, nscale | ▶llama-3.3-70b-instruct (6 endpoints) | 128k–131k | $0.00–$0.72 | $0.00–$0.72 | 47.4% | 41.6% | 5.14% | – |
openrouter | meta-llama/llama-3.3-70b-instruct:free llama-3.3-70b-instruct | 131k | $0.00 | $0.00 | 47.4% | 41.6% | 5.14% | – |
openrouter | meta-llama/llama-3.3-70b-instruct llama-3.3-70b-instruct | 131k | $0.07 | $0.33 | 47.4% | 41.6% | 5.14% | – |
azure_ai | azure_ai/Llama-3.3-70B-Instructℹ️ llama-3.3-70b-instruct | 128k | $0.71 | $0.71 | 47.4% | 41.6% | 5.14% | – |
bedrock_converse | meta.llama3-3-70b-instruct-v1:0 llama3-3-70b-instruct-v1.0 | 128k | $0.72 | $0.72 | 47.4% | 41.6% | 5.14% | – |
bedrock_converse | us.meta.llama3-3-70b-instruct-v1:0 llama3-3-70b-instruct-v1.0 | 128k | $0.72 | $0.72 | 47.4% | 41.6% | 5.14% | – |
nscale | nscale/meta-llama/Llama-3.3-70B-Instructℹ️ llama-3.3-70b-instruct | – | $0.20 | $0.20 | 47.4% | 41.6% | 5.14% | – |
vertex_ai-anthropic_models, openrouter, anthropic, bedrock | ▶claude-3-opus (8 endpoints) | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-opus claude-3-opus | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
openrouter | anthropic/claude-3-opus claude-3-opus | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
anthropic | claude-3-opus-20240229 | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-opus@20240229 claude-3-opus@20240229 | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
bedrock | anthropic.claude-3-opus-20240229-v1:0 claude-3-opus-20240229-v1.0 | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
bedrock | us.anthropic.claude-3-opus-20240229-v1:0 claude-3-opus-20240229-v1.0 | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
bedrock | eu.anthropic.claude-3-opus-20240229-v1:0 claude-3-opus-20240229-v1.0 | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
anthropic | claude-3-opus-latest | 200k | $15.00 | $75.00 | 47.2% | 37.5% | 4.72% | – |
openai, azure, openrouter | ▶gpt-4-turbo (5 endpoints) | 128k | $10.00 | $30.00 | 46.6% | 46.7% | 6.67% | – |
openai | gpt-4-turbo | 128k | $10.00 | $30.00 | 46.6% | 46.7% | 6.67% | – |
azure | azure/gpt-4-turbo gpt-4-turbo | 128k | $10.00 | $30.00 | 46.6% | 46.7% | 6.67% | – |
openrouter | openai/gpt-4-turbo gpt-4-turbo | 128k | $10.00 | $30.00 | 46.6% | 46.7% | 6.67% | – |
openai | gpt-4-turbo-2024-04-09 | 128k | $10.00 | $30.00 | 46.6% | 46.7% | 6.67% | – |
azure | azure/gpt-4-turbo-2024-04-09 gpt-4-turbo-2024-04-09 | 128k | $10.00 | $30.00 | 46.6% | 46.7% | 6.67% | – |
gemini, vertex_ai-language-models | ▶gemini-1.5-pro-001 (2 endpoints) | 1000k–2097k | $1.25–$3.50 >128k: $2.50–$7.00 | $5.00–$10.50 >128k: $10.00–$21.00 | 45.9% | 40.7% | 6.81% | – |
gemini | gemini/gemini-1.5-pro-001ℹ️ gemini-1.5-pro-001 | 2097k | $3.50 >128k: $7.00 | $10.50 >128k: $21.00 | 45.9% | 40.7% | 6.81% | – |
vertex_ai-language-models | gemini-1.5-pro-001ℹ️ | 1000k | $1.25 >128k: $2.50 | $5.00 >128k: $10.00 | 45.9% | 40.7% | 6.81% | – |
openrouter, perplexity, bedrock | ▶llama-3.1-70b-instruct (4 endpoints) | 128k–131k | $0.10–$1.00 | $0.28–$1.00 | 44.2% | 36.7% | 3.61% | – |
openrouter | meta-llama/llama-3.1-70b-instruct llama-3.1-70b-instruct | 131k | $0.10 | $0.28 | 44.2% | 36.7% | 3.61% | – |
perplexity | perplexity/llama-3.1-70b-instruct llama-3.1-70b-instruct | 131k | $1.00 | $1.00 | 44.2% | 36.7% | 3.61% | – |
bedrock | meta.llama3-1-70b-instruct-v1:0 llama3-1-70b-instruct-v1.0 | 128k | $0.99 | $0.99 | 44.2% | 36.7% | 3.61% | – |
bedrock | us.meta.llama3-1-70b-instruct-v1:0 llama3-1-70b-instruct-v1.0 | 128k | $0.99 | $0.99 | 44.2% | 36.7% | 3.61% | – |
openrouter | microsoft/wizardlm-2-8x22b wizardlm-2-8x22b | 65k | $0.50 | $0.50 | 43.4% | 25.7% | – | – |
openai, azure, openrouter | ▶gpt-4-1106-preview (3 endpoints) | 128k | $10.00 | $30.00 | 42.4% | 40% | – | – |
openai | gpt-4-1106-preview | 128k | $10.00 | $30.00 | 42.4% | 40% | – | – |
azure | azure/gpt-4-1106-preview gpt-4-1106-preview | 128k | $10.00 | $30.00 | 42.4% | 40% | – | – |
openrouter | openai/gpt-4-1106-preview gpt-4-1106-preview | 128k | $10.00 | $30.00 | 42.4% | 40% | – | – |
openai, azure | ▶gpt-4-0125-preview (2 endpoints) | 128k | $10.00 | $30.00 | 42.3% | 35.4% | – | – |
openai | gpt-4-0125-preview | 128k | $10.00 | $30.00 | 42.3% | 35.4% | – | – |
azure | azure/gpt-4-0125-preview gpt-4-0125-preview | 128k | $10.00 | $30.00 | 42.3% | 35.4% | – | – |
openrouter, azure_ai | ▶llama-3.2-90b-vision-instruct (2 endpoints) | 128k–131k | $1.20–$2.04 | $1.20–$2.04 | 41% | 39.4% | 2.64% | – |
openrouter | meta-llama/llama-3.2-90b-vision-instruct llama-3.2-90b-vision-instruct | 131k | $1.20 | $1.20 | 41% | 39.4% | 2.64% | – |
azure_ai | azure_ai/Llama-3.2-90B-Vision-Instructℹ️ llama-3.2-90b-vision-instruct | 128k | $2.04 | $2.04 | 41% | 39.4% | 2.64% | – |
fireworks_ai, openrouter | ▶qwen2-72b-instruct (2 endpoints) | 32k | $0.90 | $0.90 | 40.8% | 39.1% | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/qwen2-72b-instructℹ️ qwen2-72b-instruct | 32k | $0.90 | $0.90 | 40.8% | 39.1% | – | – |
openrouter | qwen/qwen-2-72b-instruct qwen-2-72b-instruct | 32k | $0.90 | $0.90 | 40.8% | 39.1% | – | – |
vertex_ai-anthropic_models, openrouter, anthropic, bedrock | ▶claude-3-sonnet (7 endpoints) | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-sonnet claude-3-sonnet | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
openrouter | anthropic/claude-3-sonnet claude-3-sonnet | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
anthropic | claude-3-sonnet-20240229 | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-sonnet@20240229 claude-3-sonnet@20240229 | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
bedrock | anthropic.claude-3-sonnet-20240229-v1:0 claude-3-sonnet-20240229-v1.0 | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
bedrock | us.anthropic.claude-3-sonnet-20240229-v1:0 claude-3-sonnet-20240229-v1.0 | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
bedrock | eu.anthropic.claude-3-sonnet-20240229-v1:0 claude-3-sonnet-20240229-v1.0 | 200k | $3.00 | $15.00 | 40.6% | 18.2% | 2.5% | – |
anyscale, azure_ai, deepinfra | ▶meta-llama-3-70b-instruct (3 endpoints) | 8k–8k | $0.59–$1.10 | $0.37–$1.00 | 40.6% | 22.6% | 4.31% | – |
anyscale | anyscale/meta-llama/Meta-Llama-3-70B-Instructℹ️ meta-llama-3-70b-instruct | 8k | $1.00 | $1.00 | 40.6% | 22.6% | 4.31% | – |
azure_ai | azure_ai/Meta-Llama-3-70B-Instruct meta-llama-3-70b-instruct | 8k | $1.10 | $0.37 | 40.6% | 22.6% | 4.31% | – |
deepinfra | deepinfra/meta-llama/Meta-Llama-3-70B-Instruct meta-llama-3-70b-instruct | 8k | $0.59 | $0.79 | 40.6% | 22.6% | 4.31% | – |
gemini, vertex_ai-language-models | ▶gemini-1.5-flash-001 (2 endpoints) | 1000k–1048k | $0.075 >128k: $0.15–$1.00 | $0.30 >128k: $0.60 | 40.4% | 25.1% | 3.89% | – |
gemini | gemini/gemini-1.5-flash-001ℹ️ gemini-1.5-flash-001 | 1048k | $0.075 >128k: $0.15 | $0.30 >128k: $0.60 | 40.4% | 25.1% | 3.89% | – |
vertex_ai-language-models | gemini-1.5-flash-001ℹ️ | 1000k | $0.075 >128k: $1.00 | $0.30 >128k: $0.60 | 40.4% | 25.1% | 3.89% | – |
bedrock, openrouter, anthropic, vertex_ai-anthropic_models | ▶claude-3.5-haiku (9 endpoints) | 200k | $0.25–$1.00 | $1.25–$5.00 | 38.1% | 46.4% | 4.31% | – |
bedrock | eu.anthropic.claude-3-5-haiku-20241022-v1:0 claude-3-5-haiku-20241022-v1.0 | 200k | $0.25 | $1.25 | 38.1% | 46.4% | 4.31% | – |
openrouter | anthropic/claude-3.5-haiku claude-3.5-haiku | 200k | $0.80 | $4.00 | 38.1% | 46.4% | 4.31% | – |
anthropic | claude-3-5-haiku-20241022 | 200k | $0.80 | $4.00 | 38.1% | 46.4% | 4.31% | – |
openrouter | anthropic/claude-3.5-haiku-20241022 claude-3.5-haiku-20241022 | 200k | $0.80 | $4.00 | 38.1% | 46.4% | 4.31% | – |
bedrock | anthropic.claude-3-5-haiku-20241022-v1:0 claude-3-5-haiku-20241022-v1.0 | 200k | $0.80 | $4.00 | 38.1% | 46.4% | 4.31% | – |
bedrock | us.anthropic.claude-3-5-haiku-20241022-v1:0 claude-3-5-haiku-20241022-v1.0 | 200k | $0.80 | $4.00 | 38.1% | 46.4% | 4.31% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-5-haiku claude-3-5-haiku | 200k | $1.00 | $5.00 | 38.1% | 46.4% | 4.31% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-5-haiku@20241022 claude-3-5-haiku@20241022 | 200k | $1.00 | $5.00 | 38.1% | 46.4% | 4.31% | – |
anthropic | claude-3-5-haiku-latest | 200k | $1.00 | $5.00 | 38.1% | 46.4% | 4.31% | – |
openrouter | google/gemma-2-27b-it gemma-2-27b-it | 8k | $0.10 | $0.30 | 36.5% | 27.9% | 1.39% | – |
vertex_ai-anthropic_models, openrouter, anthropic, bedrock | ▶claude-3-haiku (7 endpoints) | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-haiku claude-3-haiku | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
openrouter | anthropic/claude-3-haiku claude-3-haiku | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
anthropic | claude-3-haiku-20240307 | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-haiku@20240307 claude-3-haiku@20240307 | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
bedrock | anthropic.claude-3-haiku-20240307-v1:0 claude-3-haiku-20240307-v1.0 | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
bedrock | us.anthropic.claude-3-haiku-20240307-v1:0 claude-3-haiku-20240307-v1.0 | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
bedrock | eu.anthropic.claude-3-haiku-20240307-v1:0 claude-3-haiku-20240307-v1.0 | 200k | $0.25 | $1.25 | 36.3% | 14.9% | 1.81% | – |
openrouter, anthropic | ▶claude-2 (3 endpoints) | 100k–200k | $8.00 | $24.00 | 34.7% | 11.7% | 2.5% | – |
openrouter | anthropic/claude-2 claude-2 | 200k | $8.00 | $24.00 | 34.7% | 11.7% | 2.5% | – |
anthropic | claude-2.0 claude-2 | 100k | $8.00 | $24.00 | 34.7% | 11.7% | 2.5% | – |
openrouter | anthropic/claude-2.0 claude-2.0 | 100k | $8.00 | $24.00 | 34.7% | 11.7% | 2.5% | – |
mistral | mistral/open-mixtral-8x22b open-mixtral-8x22b | 65k | $2.00 | $6.00 | 34.1% | 24.2% | – | – |
vertex_ai-language-models | gemini-1.0-pro-001ℹ️ | 32k | $0.50 | $1.50 | 34% | 11.2% | 1.11% | – |
anthropic, openrouter | ▶claude-2.1 (2 endpoints) | 200k | $8.00 | $24.00 | 33% | – | 1.94% | – |
anthropic | claude-2.1 | 200k | $8.00 | $24.00 | 33% | – | 1.94% | – |
openrouter | anthropic/claude-2.1 claude-2.1 | 200k | $8.00 | $24.00 | 33% | – | 1.94% | – |
openai, azure, openrouter | ▶gpt-4 (6 endpoints) | 8k–8k | $30.00 | $60.00 | 30.7% | 23% | – | – |
openai | gpt-4 | 8k | $30.00 | $60.00 | 30.7% | 23% | – | – |
azure | azure/gpt-4 gpt-4 | 8k | $30.00 | $60.00 | 30.7% | 23% | – | – |
openai | gpt-4-0613 | 8k | $30.00 | $60.00 | 30.7% | 23% | – | – |
azure | azure/gpt-4-0613 gpt-4-0613 | 8k | $30.00 | $60.00 | 30.7% | 23% | – | – |
openrouter | openai/gpt-4 gpt-4 | 8k | $30.00 | $60.00 | 30.7% | 23% | – | – |
openrouter | openai/gpt-4-0314 gpt-4-0314 | 8k | $30.00 | $60.00 | – | – | – | – |
deepinfra, bedrock, anyscale, replicate, together_ai | ▶mixtral-8x7b-instruct-v0.1 (8 endpoints) | 4k–32k | $0.15–$0.60 | $0.15–$1.00 | 30.6% | 9.29% | – | – |
deepinfra | deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 mixtral-8x7b-instruct-v0.1 | 32k | $0.27 | $0.27 | 30.6% | 9.29% | – | – |
bedrock | mistral.mixtral-8x7b-instruct-v0:1 mixtral-8x7b-instruct-v0.1 | 32k | $0.45 | $0.70 | 30.6% | 9.29% | – | – |
bedrock | bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 mixtral-8x7b-instruct-v0.1 | 32k | $0.45 | $0.70 | 30.6% | 9.29% | – | – |
bedrock | bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 mixtral-8x7b-instruct-v0.1 | 32k | $0.45 | $0.70 | 30.6% | 9.29% | – | – |
bedrock | bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 mixtral-8x7b-instruct-v0.1 | 32k | $0.59 | $0.91 | 30.6% | 9.29% | – | – |
anyscale | anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1ℹ️ mixtral-8x7b-instruct-v0.1 | 16k | $0.15 | $0.15 | 30.6% | 9.29% | – | – |
replicate | replicate/mistralai/mixtral-8x7b-instruct-v0.1 mixtral-8x7b-instruct-v0.1 | 4k | $0.30 | $1.00 | 30.6% | 9.29% | – | – |
together_ai | together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 mixtral-8x7b-instruct-v0.1 | – | $0.60 | $0.60 | 30.6% | 9.29% | – | – |
mistral | ▶open-mistral-nemo (2 endpoints) | 128k | $0.30 | $0.30 | 29.9% | 10.8% | – | – |
mistral | mistral/open-mistral-nemoℹ️ open-mistral-nemo | 128k | $0.30 | $0.30 | 29.9% | 10.8% | – | – |
mistral | mistral/open-mistral-nemo-2407ℹ️ open-mistral-nemo-2407 | 128k | $0.30 | $0.30 | 29.9% | 10.8% | – | – |
mistral | mistral/open-mixtral-8x7b open-mixtral-8x7b | 32k | $0.70 | $0.70 | 29.8% | 9.95% | – | – |
openrouter, openai, azure | ▶gpt-3.5-turbo (14 endpoints) | 4k–16k | $0.20–$1.50 | $1.50–$2.00 | 28% | 15.9% | – | – |
openrouter | openai/gpt-3.5-turbo gpt-3.5-turbo | 16k | $0.50 | $1.50 | 28% | 15.9% | – | – |
openai | gpt-3.5-turbo-0125 | 16k | $0.50 | $1.50 | 27.2% | 11.6% | – | – |
openrouter | openai/gpt-3.5-turbo-0125 gpt-3.5-turbo-0125 | 16k | $0.50 | $1.50 | 27.2% | 11.6% | – | – |
openai | gpt-3.5-turbo-1106 | 16k | $1.00 | $2.00 | 28% | 15.9% | – | – |
openrouter | openai/gpt-3.5-turbo-1106 gpt-3.5-turbo-1106 | 16k | $1.00 | $2.00 | 28% | 15.9% | – | – |
openai | gpt-3.5-turbo | 16k | $1.50 | $2.00 | 28% | 15.9% | – | – |
azure | azure/gpt-35-turbo-0125 gpt-35-turbo-0125 | 16k | $0.50 | $1.50 | 27.2% | 11.6% | – | – |
azure | azure/gpt-3.5-turbo-0125 gpt-3.5-turbo-0125 | 16k | $0.50 | $1.50 | 27.2% | 11.6% | – | – |
azure | azure/gpt-35-turbo-1106 gpt-35-turbo-1106 | 16k | $1.00 | $2.00 | 28% | 15.9% | – | – |
azure | azure/gpt-35-turbo-0301 gpt-35-turbo-0301 | 4k | $0.20 | $2.00 | – | – | – | – |
azure | azure/gpt-35-turbo gpt-35-turbo | 4k | $0.50 | $1.50 | 28% | 15.9% | – | – |
azure | azure/gpt-3.5-turbo gpt-3.5-turbo | 4k | $0.50 | $1.50 | 28% | 15.9% | – | – |
azure | azure/gpt-35-turbo-0613 gpt-35-turbo-0613 | 4k | $1.50 | $2.00 | – | – | – | – |
openrouter | openai/gpt-3.5-turbo-0613 gpt-3.5-turbo-0613 | 4k | $1.00 | $2.00 | – | – | – | – |
openrouter, azure_ai | ▶phi-3-medium-128k-instruct (2 endpoints) | 128k–131k | $0.10–$0.17 | $0.30–$0.68 | 27.6% | 17.6% | – | – |
openrouter | microsoft/phi-3-medium-128k-instruct phi-3-medium-128k-instruct | 131k | $0.10 | $0.30 | 27.6% | 17.6% | – | – |
azure_ai | azure_ai/Phi-3-medium-128k-instructℹ️ phi-3-medium-128k-instruct | 128k | $0.17 | $0.68 | 27.6% | 17.6% | – | – |
openrouter, groq | ▶gemma-2-9b-it (3 endpoints) | 8k | $0.00–$0.20 | $0.00–$0.20 | 27.5% | 21% | 0.556% | – |
openrouter | google/gemma-2-9b-it:free gemma-2-9b-it | 8k | $0.00 | $0.00 | 27.5% | 21% | 0.556% | – |
openrouter | google/gemma-2-9b-it gemma-2-9b-it | 8k | $0.02 | $0.06 | 27.5% | 21% | 0.556% | – |
groq | groq/gemma2-9b-it gemma2-9b-it | 8k | $0.20 | $0.20 | 27.5% | 21% | 0.556% | – |
replicate, deepinfra, perplexity, openrouter, anyscale | ▶llama-2-70b-chat (5 endpoints) | 4k | $0.65–$1.00 | $0.90–$2.80 | 26.3% | 3.29% | 0% | – |
replicate | replicate/meta/llama-2-70b-chat llama-2-70b-chat | 4k | $0.65 | $2.75 | – | – | – | – |
deepinfra | deepinfra/meta-llama/Llama-2-70b-chat-hf llama-2-70b-chat | 4k | $0.70 | $0.90 | 26.3% | 3.29% | 0% | – |
perplexity | perplexity/llama-2-70b-chat llama-2-70b-chat | 4k | $0.70 | $2.80 | – | – | – | – |
openrouter | meta-llama/llama-2-70b-chat llama-2-70b-chat | 4k | $0.90 | $0.90 | – | – | – | – |
anyscale | anyscale/meta-llama/Llama-2-70b-chat-hf llama-2-70b-chat | 4k | $1.00 | $1.00 | 26.3% | 3.29% | 0% | – |
anyscale, deepinfra | ▶meta-llama-3-8b-instruct (2 endpoints) | 8k–8k | $0.08–$0.15 | $0.08–$0.15 | 26.1% | 6.13% | 0.833% | – |
anyscale | anyscale/meta-llama/Meta-Llama-3-8B-Instructℹ️ meta-llama-3-8b-instruct | 8k | $0.15 | $0.15 | – | – | – | – |
deepinfra | deepinfra/meta-llama/Meta-Llama-3-8B-Instruct meta-llama-3-8b-instruct | 8k | $0.08 | $0.08 | 26.1% | 6.13% | 0.833% | – |
openrouter, perplexity, lambda, bedrock, nscale | ▶llama-3.1-8b-instruct (7 endpoints) | 16k–131k | $0.00–$0.22 | $0.00–$0.22 | 25.9% | 22.9% | 2.5% | – |
openrouter | meta-llama/llama-3.1-8b-instruct:free llama-3.1-8b-instruct | 131k | $0.00 | $0.00 | 25.9% | 22.9% | 2.5% | – |
perplexity | perplexity/llama-3.1-8b-instruct llama-3.1-8b-instruct | 131k | $0.20 | $0.20 | 25.9% | 22.9% | 2.5% | – |
lambda | llama3.1-8b-instruct | 131k | $0.025 | $0.04 | 25.9% | 22.9% | 2.5% | – |
bedrock | meta.llama3-1-8b-instruct-v1:0 llama3-1-8b-instruct-v1.0 | 128k | $0.22 | $0.22 | 25.9% | 22.9% | 2.5% | – |
bedrock | us.meta.llama3-1-8b-instruct-v1:0 llama3-1-8b-instruct-v1.0 | 128k | $0.22 | $0.22 | 25.9% | 22.9% | 2.5% | – |
openrouter | meta-llama/llama-3.1-8b-instruct llama-3.1-8b-instruct | 16k | $0.02 | $0.03 | 25.9% | 22.9% | 2.5% | – |
nscale | nscale/meta-llama/Llama-3.1-8B-Instructℹ️ llama-3.1-8b-instruct | – | $0.03 | $0.03 | 25.9% | 22.9% | 2.5% | – |
azure_ai, sambanova, friendliai | ▶meta-llama-3.1-8b-instruct (3 endpoints) | 8k–128k | $0.10–$0.30 | $0.10–$0.61 | 25.9% | 22.9% | 2.5% | – |
azure_ai | azure_ai/Meta-Llama-3.1-8B-Instructℹ️ meta-llama-3.1-8b-instruct | 128k | $0.30 | $0.61 | 25.9% | 22.9% | 2.5% | – |
sambanova | sambanova/Meta-Llama-3.1-8B-Instructℹ️ meta-llama-3.1-8b-instruct | 16k | $0.10 | $0.20 | 25.9% | 22.9% | 2.5% | – |
friendliai | friendliai/meta-llama-3.1-8b-instruct meta-llama-3.1-8b-instruct | 8k | $0.10 | $0.10 | – | – | – | – |
openrouter | mistralai/mistral-7b-instruct-v0.3 mistral-7b-instruct-v0.3 | 32k | $0.028 | $0.054 | 15.2% | 3.6% | – | – |
deepinfra | deepinfra/01-ai/Yi-34B-Chat yi-34b-chat | 4k | $0.60 | $0.60 | 14.7% | 5.15% | – | – |
mistral | mistral/open-mistral-7b open-mistral-7b | 32k | $0.25 | $0.25 | 13.2% | 3.68% | – | – |
openrouter | aion-labs/aion-1.0 aion-1.0 | 131k | $4.00 | $8.00 | – | – | – | – |
openrouter | aion-labs/aion-1.0-mini aion-1.0-mini | 131k | $0.70 | $1.40 | – | – | – | – |
openrouter | aion-labs/aion-rp-llama-3.1-8b aion-rp-llama-3.1-8b | 32k | $0.20 | $0.20 | – | – | – | – |
deepinfra | deepinfra/deepinfra/airoboros-70b airoboros-70b | 4k | $0.70 | $0.90 | – | – | – | – |
openrouter | jondurbin/airoboros-l2-70b airoboros-l2-70b | 4k | $0.50 | $0.50 | – | – | – | – |
deepinfra | deepinfra/jondurbin/airoboros-l2-70b-gpt4-1.4.1 airoboros-l2-70b-gpt4-1.4.1 | 4k | $0.70 | $0.90 | – | – | – | – |
openrouter | thedrummer/anubis-pro-105b-v1 anubis-pro-105b-v1 | 131k | $0.80 | $1.00 | – | – | – | – |
openrouter | arcee-ai/arcee-blitz arcee-blitz | 32k | $0.45 | $0.75 | – | – | – | – |
openrouter | arcee-ai/caller-large caller-large | 32k | $0.55 | $0.85 | – | – | – | – |
vertex_ai-chat-models, palm | ▶chat-bison (2 endpoints) | 8k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-chat-models | chat-bisonℹ️ | 8k | $0.125 | $0.125 | – | – | – | – |
palm | palm/chat-bisonℹ️ chat-bison | 8k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-chat-models, palm | ▶chat-bison@001 (2 endpoints) | 8k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-chat-models | chat-bison@001ℹ️ | 8k | $0.125 | $0.125 | – | – | – | – |
palm | palm/chat-bison-001ℹ️ chat-bison-001 | 8k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-chat-models | chat-bison@002ℹ️ | 8k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-chat-models | chat-bison-32kℹ️ | 32k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-chat-models | chat-bison-32k@002ℹ️ | 32k | $0.125 | $0.125 | – | – | – | – |
nlp_cloud | chatdolphin | 16k | $0.50 | $0.50 | – | – | – | – |
openrouter | anthropic/claude-2.0:beta claude-2.0:beta | 100k | $8.00 | $24.00 | – | – | – | – |
openrouter | anthropic/claude-2.1:beta claude-2.1:beta | 200k | $8.00 | $24.00 | – | – | – | – |
openrouter | anthropic/claude-2:beta claude-2:beta | 200k | $8.00 | $24.00 | – | – | – | – |
openrouter | anthropic/claude-3.5-haiku-20241022:beta claude-3.5-haiku-20241022:beta | 200k | $0.80 | $4.00 | – | – | – | – |
openrouter | anthropic/claude-3.5-haiku:beta claude-3.5-haiku:beta | 200k | $0.80 | $4.00 | – | – | – | – |
openrouter | anthropic/claude-3.5-sonnet-20240620:beta claude-3.5-sonnet-20240620:beta | 200k | $3.00 | $15.00 | – | – | – | – |
bedrock | ▶claude-3-5-sonnet-20241022-v2.0 (3 endpoints) | 200k | $3.00 | $15.00 | – | – | – | – |
bedrock | anthropic.claude-3-5-sonnet-20241022-v2:0 claude-3-5-sonnet-20241022-v2.0 | 200k | $3.00 | $15.00 | – | – | – | – |
bedrock | us.anthropic.claude-3-5-sonnet-20241022-v2:0 claude-3-5-sonnet-20241022-v2.0 | 200k | $3.00 | $15.00 | – | – | – | – |
bedrock | eu.anthropic.claude-3-5-sonnet-20241022-v2:0 claude-3-5-sonnet-20241022-v2.0 | 200k | $3.00 | $15.00 | – | – | – | – |
openrouter | anthropic/claude-3.5-sonnet:beta claude-3.5-sonnet:beta | 200k | $3.00 | $15.00 | – | – | – | – |
vertex_ai-anthropic_models | ▶claude-3-5-sonnet-v2 (2 endpoints) | 200k | $3.00 | $15.00 | – | – | – | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-5-sonnet-v2 claude-3-5-sonnet-v2 | 200k | $3.00 | $15.00 | – | – | – | – |
vertex_ai-anthropic_models | vertex_ai/claude-3-5-sonnet-v2@20241022 claude-3-5-sonnet-v2@20241022 | 200k | $3.00 | $15.00 | – | – | – | – |
openrouter | anthropic/claude-3.7-sonnet:beta claude-3.7-sonnet:beta | 200k | $3.00 | $15.00 | – | – | – | – |
openrouter | anthropic/claude-3-haiku:beta claude-3-haiku:beta | 200k | $0.25 | $1.25 | – | – | – | – |
openrouter | anthropic/claude-3-opus:beta claude-3-opus:beta | 200k | $15.00 | $75.00 | – | – | – | – |
openrouter | anthropic/claude-3-sonnet:beta claude-3-sonnet:beta | 200k | $3.00 | $15.00 | – | – | – | – |
bedrock | ▶claude-instant-v1 (5 endpoints) | 100k | $0.80–$2.48 | $2.40–$8.38 | – | – | – | – |
bedrock | anthropic.claude-instant-v1 claude-instant-v1 | 100k | $0.80 | $2.40 | – | – | – | – |
bedrock | bedrock/us-east-1/anthropic.claude-instant-v1 claude-instant-v1 | 100k | $0.80 | $2.40 | – | – | – | – |
bedrock | bedrock/us-west-2/anthropic.claude-instant-v1 claude-instant-v1 | 100k | $0.80 | $2.40 | – | – | – | – |
bedrock | bedrock/ap-northeast-1/anthropic.claude-instant-v1 claude-instant-v1 | 100k | $2.23 | $7.55 | – | – | – | – |
bedrock | bedrock/eu-central-1/anthropic.claude-instant-v1 claude-instant-v1 | 100k | $2.48 | $8.38 | – | – | – | – |
bedrock | ▶claude-v1 (5 endpoints) | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | anthropic.claude-v1 claude-v1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/us-east-1/anthropic.claude-v1 claude-v1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/us-west-2/anthropic.claude-v1 claude-v1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/ap-northeast-1/anthropic.claude-v1 claude-v1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/eu-central-1/anthropic.claude-v1 claude-v1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | ▶claude-v2 (5 endpoints) | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | anthropic.claude-v2 claude-v2 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/us-east-1/anthropic.claude-v2 claude-v2 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/us-west-2/anthropic.claude-v2 claude-v2 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/ap-northeast-1/anthropic.claude-v2 claude-v2 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/eu-central-1/anthropic.claude-v2 claude-v2 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | ▶claude-v2.1 (5 endpoints) | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | anthropic.claude-v2:1 claude-v2.1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/us-east-1/anthropic.claude-v2:1 claude-v2.1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/us-west-2/anthropic.claude-v2:1 claude-v2.1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/ap-northeast-1/anthropic.claude-v2:1 claude-v2.1 | 100k | $8.00 | $24.00 | – | – | – | – |
bedrock | bedrock/eu-central-1/anthropic.claude-v2:1 claude-v2.1 | 100k | $8.00 | $24.00 | – | – | – | – |
vertex_ai-code-text-models | code-bisonℹ️ | 6k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-code-chat-models | codechat-bisonℹ️ | 6k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-code-chat-models | codechat-bison@001ℹ️ | 6k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-code-chat-models | codechat-bison@002ℹ️ | 6k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-code-chat-models | codechat-bison-32kℹ️ | 32k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-code-chat-models | codechat-bison-32k@002ℹ️ | 32k | $0.125 | $0.125 | – | – | – | – |
vertex_ai-code-chat-models | codechat-bison@latestℹ️ | 6k | $0.125 | $0.125 | – | – | – | – |
perplexity, deepinfra, anyscale | ▶codellama-34b-instruct (3 endpoints) | 4k–16k | $0.35–$1.00 | $0.60–$1.40 | – | – | – | – |
perplexity | perplexity/codellama-34b-instruct codellama-34b-instruct | 16k | $0.35 | $1.40 | – | – | – | – |
deepinfra | deepinfra/codellama/CodeLlama-34b-Instruct-hf codellama-34b-instruct | 4k | $0.60 | $0.60 | – | – | – | – |
anyscale | anyscale/codellama/CodeLlama-34b-Instruct-hf codellama-34b-instruct | 4k | $1.00 | $1.00 | – | – | – | – |
perplexity, anyscale | ▶codellama-70b-instruct (2 endpoints) | 4k–16k | $0.70–$1.00 | $1.00–$2.80 | – | – | – | – |
perplexity | perplexity/codellama-70b-instruct codellama-70b-instruct | 16k | $0.70 | $2.80 | – | – | – | – |
anyscale | anyscale/codellama/CodeLlama-70b-Instruct-hfℹ️ codellama-70b-instruct | 4k | $1.00 | $1.00 | – | – | – | – |
cloudflare | cloudflare/@hf/thebloke/codellama-7b-instruct-awq codellama-7b-instruct-awq | 4k | $1.923 | $1.923 | – | – | – | – |
openrouter | alfredpros/codellama-7b-instruct-solidity codellama-7b-instruct-solidity | 4k | $0.80 | $1.20 | – | – | – | – |
openrouter | arcee-ai/coder-large coder-large | 32k | $0.50 | $0.80 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/codestral@latest codestral@latest | 128k | $0.20 | $0.60 | – | – | – | – |
openrouter, mistral | ▶codestral-mamba (2 endpoints) | 256k–262k | $0.25 | $0.25 | – | – | – | – |
openrouter | mistralai/codestral-mamba codestral-mamba | 262k | $0.25 | $0.25 | – | – | – | – |
mistral | mistral/codestral-mamba-latestℹ️ codestral-mamba-latest | 256k | $0.25 | $0.25 | – | – | – | – |
openrouter | openai/codex-mini codex-mini | 200k | $1.50 | $6.00 | – | – | – | – |
openrouter | cohere/command command | 4k | $1.00 | $2.00 | – | – | – | – |
openrouter, cohere_chat | ▶command-a (2 endpoints) | 256k | $2.50 | $10.00 | – | – | – | – |
openrouter | cohere/command-a command-a | 256k | $2.50 | $10.00 | – | – | – | – |
cohere_chat | command-a-03-2025 | 256k | $2.50 | $10.00 | – | – | – | – |
cohere_chat | command-light | 4k | $0.30 | $0.60 | – | – | – | – |
bedrock | cohere.command-light-text-v14 command-light-text-v14 | 4k | $0.30 | $0.60 | – | – | – | – |
cohere_chat, openrouter, bedrock | ▶command-r (6 endpoints) | 128k | $0.15–$0.50 | $0.60–$1.50 | – | – | – | – |
cohere_chat | command-r | 128k | $0.15 | $0.60 | – | – | – | – |
cohere_chat | command-r-08-2024 | 128k | $0.15 | $0.60 | – | – | – | – |
openrouter | cohere/command-r-08-2024 command-r-08-2024 | 128k | $0.15 | $0.60 | – | – | – | – |
openrouter | cohere/command-r command-r | 128k | $0.50 | $1.50 | – | – | – | – |
openrouter | cohere/command-r-03-2024 command-r-03-2024 | 128k | $0.50 | $1.50 | – | – | – | – |
bedrock | cohere.command-r-v1:0 command-r-v1.0 | 128k | $0.50 | $1.50 | – | – | – | – |
openrouter, cohere_chat | ▶command-r7b-12-2024 (2 endpoints) | 128k | $0.0375–$0.15 | $0.0375–$0.15 | – | – | – | – |
openrouter | cohere/command-r7b-12-2024 command-r7b-12-2024 | 128k | $0.0375 | $0.15 | – | – | – | – |
cohere_chat | command-r7b-12-2024ℹ️ | 128k | $0.15 | $0.0375 | – | – | – | – |
cohere_chat, openrouter, azure, bedrock | ▶command-r-plus (7 endpoints) | 128k | $2.50–$3.00 | $10.00–$15.00 | – | – | – | – |
cohere_chat | command-r-plus | 128k | $2.50 | $10.00 | – | – | – | – |
cohere_chat | command-r-plus-08-2024 | 128k | $2.50 | $10.00 | – | – | – | – |
openrouter | cohere/command-r-plus-08-2024 command-r-plus-08-2024 | 128k | $2.50 | $10.00 | – | – | – | – |
azure | azure/command-r-plus command-r-plus | 128k | $3.00 | $15.00 | – | – | – | – |
openrouter | cohere/command-r-plus command-r-plus | 128k | $3.00 | $15.00 | – | – | – | – |
openrouter | cohere/command-r-plus-04-2024 command-r-plus-04-2024 | 128k | $3.00 | $15.00 | – | – | – | – |
bedrock | cohere.command-r-plus-v1:0 command-r-plus-v1.0 | 128k | $3.00 | $15.00 | – | – | – | – |
bedrock | cohere.command-text-v14 command-text-v14 | 4k | $1.50 | $2.00 | – | – | – | – |
azure | ▶computer-use-preview (2 endpoints) | 8k | $3.00 | $12.00 | – | – | – | – |
azure | computer-use-preview | 8k | $3.00 | $12.00 | – | – | – | – |
azure | azure/computer-use-preview computer-use-preview | 8k | $3.00 | $12.00 | – | – | – | – |
databricks | databricks/databricks-claude-3-7-sonnetℹ️ databricks-claude-3-7-sonnet | 200k | $2.50 | $178.57 | – | – | – | – |
databricks | databricks/databricks-dbrx-instructℹ️ databricks-dbrx-instruct | 32k | $0.75 | $2.249 | – | – | – | – |
databricks | databricks/databricks-llama-2-70b-chatℹ️ databricks-llama-2-70b-chat | 4k | $0.50 | $1.50 | – | – | – | – |
databricks | databricks/databricks-meta-llama-3-1-405b-instructℹ️ databricks-meta-llama-3-1-405b-instruct | 128k | $5.00 | $15.00 | – | – | – | – |
databricks | databricks/databricks-meta-llama-3-1-70b-instructℹ️ databricks-meta-llama-3-1-70b-instruct | 128k | $1.00 | $3.00 | – | – | – | – |
databricks | databricks/databricks-meta-llama-3-3-70b-instructℹ️ databricks-meta-llama-3-3-70b-instruct | 128k | $1.00 | $3.00 | – | – | – | – |
databricks | databricks/databricks-meta-llama-3-70b-instructℹ️ databricks-meta-llama-3-70b-instruct | 128k | $1.00 | $3.00 | – | – | – | – |
databricks | databricks/databricks-mixtral-8x7b-instructℹ️ databricks-mixtral-8x7b-instruct | 4k | $0.50 | $0.999 | – | – | – | – |
databricks | databricks/databricks-mpt-30b-instructℹ️ databricks-mpt-30b-instruct | 8k | $0.999 | $0.999 | – | – | – | – |
databricks | databricks/databricks-mpt-7b-instructℹ️ databricks-mpt-7b-instruct | 8k | $0.50 | $0.00 | – | – | – | – |
openrouter | agentica-org/deepcoder-14b-preview:free deepcoder-14b-preview | 96k | $0.00 | $0.00 | – | – | – | – |
openrouter | nousresearch/deephermes-3-llama-3-8b-preview:free deephermes-3-llama-3-8b-preview | 131k | $0.00 | $0.00 | – | – | – | – |
openrouter | nousresearch/deephermes-3-mistral-24b-preview:free deephermes-3-mistral-24b-preview | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | deepseek/deepseek-chat:free deepseek-chat | 163k | $0.00 | $0.00 | – | – | – | – |
openrouter, deepseek | ▶deepseek-coder (2 endpoints) | 128k | $0.04–$0.14 | $0.12–$0.28 | – | – | – | – |
openrouter | deepseek/deepseek-coder deepseek-coder | 128k | $0.04 | $0.12 | – | – | – | – |
deepseek | deepseek/deepseek-coder deepseek-coder | 128k | $0.14 | $0.28 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/deepseek-coder-v2-instructℹ️ deepseek-coder-v2-instruct | 65k | $1.20 | $1.20 | – | – | – | – |
lambda | deepseek-llama3.3-70b | 131k | $0.20 | $0.60 | – | – | – | – |
openrouter | ▶deepseek-prover-v2 (2 endpoints) | 131k–163k | $0.00–$0.50 | $0.00–$2.18 | – | – | – | – |
openrouter | deepseek/deepseek-prover-v2:free deepseek-prover-v2 | 163k | $0.00 | $0.00 | – | – | – | – |
openrouter | deepseek/deepseek-prover-v2 deepseek-prover-v2 | 131k | $0.50 | $2.18 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/deepseek-r1-basicℹ️ deepseek-r1-basic | 128k | $0.55 | $2.19 | – | – | – | – |
openrouter, nscale | ▶deepseek-r1-distill-llama-8b (2 endpoints) | 32k | $0.025–$0.04 | $0.025–$0.04 | – | – | – | – |
openrouter | deepseek/deepseek-r1-distill-llama-8b deepseek-r1-distill-llama-8b | 32k | $0.04 | $0.04 | – | – | – | – |
nscale | nscale/deepseek-ai/DeepSeek-R1-Distill-Llama-8Bℹ️ deepseek-r1-distill-llama-8b | – | $0.025 | $0.025 | – | – | – | – |
openrouter, nscale | ▶deepseek-r1-distill-qwen-1.5b (2 endpoints) | 131k | $0.09–$0.18 | $0.09–$0.18 | – | – | – | – |
openrouter | deepseek/deepseek-r1-distill-qwen-1.5b deepseek-r1-distill-qwen-1.5b | 131k | $0.18 | $0.18 | – | – | – | – |
nscale | nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5Bℹ️ deepseek-r1-distill-qwen-1.5b | – | $0.09 | $0.09 | – | – | – | – |
openrouter, nscale | ▶deepseek-r1-distill-qwen-32b (3 endpoints) | 16k–131k | $0.00–$0.15 | $0.00–$0.18 | – | – | – | – |
openrouter | deepseek/deepseek-r1-distill-qwen-32b deepseek-r1-distill-qwen-32b | 131k | $0.12 | $0.18 | – | – | – | – |
openrouter | deepseek/deepseek-r1-distill-qwen-32b:free deepseek-r1-distill-qwen-32b | 16k | $0.00 | $0.00 | – | – | – | – |
nscale | nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-32Bℹ️ deepseek-r1-distill-qwen-32b | – | $0.15 | $0.15 | – | – | – | – |
nscale | nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-7Bℹ️ deepseek-r1-distill-qwen-7b | – | $0.20 | $0.20 | – | – | – | – |
openrouter | tngtech/deepseek-r1t-chimera:free deepseek-r1t-chimera | 163k | $0.00 | $0.00 | – | – | – | – |
openrouter | deepseek/deepseek-r1-zero:free deepseek-r1-zero | 128k | $0.00 | $0.00 | – | – | – | – |
openrouter | deepseek/deepseek-v3-base:free deepseek-v3-base | 163k | $0.00 | $0.00 | – | – | – | – |
deepinfra | deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b dolphin-2.6-mixtral-8x7b | 32k | $0.27 | $0.27 | – | – | – | – |
openrouter | cognitivecomputations/dolphin3.0-mistral-24b:free dolphin3.0-mistral-24b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | cognitivecomputations/dolphin3.0-r1-mistral-24b:free dolphin3.0-r1-mistral-24b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | cognitivecomputations/dolphin-mixtral-8x22b dolphin-mixtral-8x22b | 16k | $0.90 | $0.90 | – | – | – | – |
openrouter | eva-unit-01/eva-llama-3.33-70b eva-llama-3.33-70b | 16k | $4.00 | $6.00 | – | – | – | – |
openrouter | eva-unit-01/eva-qwen-2.5-32b eva-qwen-2.5-32b | 16k | $2.60 | $3.40 | – | – | – | – |
openrouter | eva-unit-01/eva-qwen-2.5-72b eva-qwen-2.5-72b | 16k | $4.00 | $6.00 | – | – | – | – |
openrouter | sao10k/fimbulvetr-11b-v2 fimbulvetr-11b-v2 | 4k | $0.80 | $1.20 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/firefunction-v2ℹ️ firefunction-v2 | 8k | $0.90 | $0.90 | – | – | – | – |
vertex_ai-language-models | gemini-1.0-proℹ️ | 32k | $0.50 | $1.50 | – | – | – | – |
vertex_ai-language-models | gemini-1.0-pro-002ℹ️ | 32k | $0.50 | $1.50 | – | – | – | – |
vertex_ai-vision-models | gemini-1.0-pro-visionℹ️ | 16k | $0.50 | $1.50 | – | – | – | – |
vertex_ai-vision-models | gemini-1.0-pro-vision-001ℹ️ | 16k | $0.50 | $1.50 | – | – | – | – |
vertex_ai-language-models | gemini-1.0-ultraℹ️ | 8k | $0.50 | $1.50 | – | – | – | – |
vertex_ai-language-models | gemini-1.0-ultra-001ℹ️ | 8k | $0.50 | $1.50 | – | – | – | – |
gemini, vertex_ai-language-models | ▶gemini-1.5-flash (3 endpoints) | 1000k–1048k | $0.075 >128k: $0.15–$1.00 | $0.30 >128k: $0.60 | – | – | – | – |
gemini | gemini/gemini-1.5-flashℹ️ gemini-1.5-flash | 1048k | $0.075 >128k: $0.15 | $0.30 >128k: $0.60 | – | – | – | – |
gemini | gemini/gemini-1.5-flash-latestℹ️ gemini-1.5-flash-latest | 1048k | $0.075 >128k: $0.15 | $0.30 >128k: $0.60 | – | – | – | – |
vertex_ai-language-models | gemini-1.5-flashℹ️ | 1000k | $0.075 >128k: $1.00 | $0.30 >128k: $0.60 | – | – | – | – |
gemini | gemini/gemini-1.5-flash-8bℹ️ gemini-1.5-flash-8b | 1048k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | – | – | – | – |
gemini, vertex_ai-language-models | ▶gemini-1.5-flash-exp-0827 (2 endpoints) | 1000k–1048k | $0.00–$0.0047 >128k: $0.00–$1.00 | $0.00–$0.0047 >128k: $0.00–$0.0094 | – | – | – | – |
gemini | gemini/gemini-1.5-flash-exp-0827ℹ️ gemini-1.5-flash-exp-0827 | 1048k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | – | – | – | – |
vertex_ai-language-models | gemini-1.5-flash-exp-0827ℹ️ | 1000k | $0.0047 >128k: $1.00 | $0.0047 >128k: $0.0094 | – | – | – | – |
vertex_ai-language-models | gemini-1.5-flash-preview-0514ℹ️ | 1000k | $0.075 >128k: $1.00 | $0.0047 >128k: $0.0094 | – | – | – | – |
vertex_ai-language-models, gemini | ▶gemini-1.5-pro (3 endpoints) | 1048k–2097k | $1.25–$3.50 >128k: $2.50–$7.00 | $1.05–$10.50 >128k: $10.00–$21.00 | – | – | – | – |
vertex_ai-language-models | gemini-1.5-proℹ️ | 2097k | $1.25 >128k: $2.50 | $5.00 >128k: $10.00 | – | – | – | – |
gemini | gemini/gemini-1.5-proℹ️ gemini-1.5-pro | 2097k | $3.50 >128k: $7.00 | $10.50 >128k: $21.00 | – | – | – | – |
gemini | gemini/gemini-1.5-pro-latestℹ️ gemini-1.5-pro-latest | 1048k | $3.50 >128k: $7.00 | $1.05 >128k: $21.00 | – | – | – | – |
vertex_ai-language-models | ▶gemini-1.5-pro-preview-0215 (3 endpoints) | 1000k | $0.0781 >128k: $0.1563 | $0.3125 >128k: $0.625 | – | – | – | – |
vertex_ai-language-models | gemini-1.5-pro-preview-0215ℹ️ | 1000k | $0.0781 >128k: $0.1563 | $0.3125 >128k: $0.625 | – | – | – | – |
vertex_ai-language-models | gemini-1.5-pro-preview-0409ℹ️ | 1000k | $0.0781 >128k: $0.1563 | $0.3125 >128k: $0.625 | – | – | – | – |
vertex_ai-language-models | gemini-1.5-pro-preview-0514ℹ️ | 1000k | $0.0781 >128k: $0.1563 | $0.3125 >128k: $0.625 | – | – | – | – |
openrouter | google/gemini-2.0-flash-exp:free gemini-2.0-flash-exp | 1048k | $0.00 | $0.00 | – | – | – | – |
vertex_ai-language-models, openrouter | ▶gemini-2.0-flash-lite-001 (2 endpoints) | 1048k | $0.075 | $0.30 | – | – | – | – |
vertex_ai-language-models | gemini-2.0-flash-lite-001ℹ️ | 1048k | $0.075 | $0.30 | – | – | – | – |
openrouter | google/gemini-2.0-flash-lite-001 gemini-2.0-flash-lite-001 | 1048k | $0.075 | $0.30 | – | – | – | – |
gemini | gemini/gemini-2.0-flash-lite-preview-02-05ℹ️ gemini-2.0-flash-lite-preview-02-05 | 1048k | $0.075 | $0.30 | – | – | – | – |
openrouter | google/gemini-flash-1.5 gemini-flash-1.5 | 1000k | $0.075 | $0.30 | – | – | – | – |
openrouter | google/gemini-flash-1.5-8b gemini-flash-1.5-8b | 1000k | $0.0375 | $0.15 | – | – | – | – |
vertex_ai-language-models | gemini-flash-experimentalℹ️ | 1000k | $0.00 | $0.00 | – | – | – | – |
gemini | gemini/gemini-gemma-2-27b-itℹ️ gemini-gemma-2-27b-it | – | $0.35 | $1.05 | – | – | – | – |
gemini | gemini/gemini-gemma-2-9b-itℹ️ gemini-gemma-2-9b-it | – | $0.35 | $1.05 | – | – | – | – |
gemini, vertex_ai-language-models | ▶gemini-pro (2 endpoints) | 32k | $0.35–$0.50 >128k: $0.70 | $1.05–$1.50 >128k: $2.10 | – | – | – | – |
gemini | gemini/gemini-proℹ️ gemini-pro | 32k | $0.35 >128k: $0.70 | $1.05 >128k: $2.10 | – | – | – | – |
vertex_ai-language-models | gemini-proℹ️ | 32k | $0.50 | $1.50 | – | – | – | – |
openrouter | google/gemini-pro-1.5 gemini-pro-1.5 | 2000k | $1.25 | $5.00 | – | – | – | – |
vertex_ai-language-models | gemini-pro-experimentalℹ️ | 1000k | $0.00 | $0.00 | – | – | – | – |
gemini, vertex_ai-vision-models | ▶gemini-pro-vision (2 endpoints) | 16k–30k | $0.35–$0.50 >128k: $0.70 | $1.05–$1.50 >128k: $2.10 | – | – | – | – |
gemini | gemini/gemini-pro-visionℹ️ gemini-pro-vision | 30k | $0.35 >128k: $0.70 | $1.05 >128k: $2.10 | – | – | – | – |
vertex_ai-vision-models | gemini-pro-visionℹ️ | 16k | $0.50 | $1.50 | – | – | – | – |
openrouter | ▶gemma-3-12b-it (2 endpoints) | 131k | $0.00–$0.05 | $0.00–$0.10 | – | – | – | – |
openrouter | google/gemma-3-12b-it:free gemma-3-12b-it | 131k | $0.00 | $0.00 | – | – | – | – |
openrouter | google/gemma-3-12b-it gemma-3-12b-it | 131k | $0.05 | $0.10 | – | – | – | – |
openrouter | google/gemma-3-1b-it:free gemma-3-1b-it | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶gemma-3-4b-it (2 endpoints) | 96k–131k | $0.00–$0.02 | $0.00–$0.04 | – | – | – | – |
openrouter | google/gemma-3-4b-it gemma-3-4b-it | 131k | $0.02 | $0.04 | – | – | – | – |
openrouter | google/gemma-3-4b-it:free gemma-3-4b-it | 96k | $0.00 | $0.00 | – | – | – | – |
groq, anyscale | ▶gemma-7b-it (2 endpoints) | 8k | $0.07–$0.15 | $0.07–$0.15 | – | – | – | – |
groq | groq/gemma-7b-it gemma-7b-it | 8k | $0.07 | $0.07 | – | – | – | – |
anyscale | anyscale/google/gemma-7b-itℹ️ gemma-7b-it | 8k | $0.15 | $0.15 | – | – | – | – |
openrouter | ▶glm-4-32b (2 endpoints) | 32k–32k | $0.00–$0.24 | $0.00–$0.24 | – | – | – | – |
openrouter | thudm/glm-4-32b:free glm-4-32b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | thudm/glm-4-32b glm-4-32b | 32k | $0.24 | $0.24 | – | – | – | – |
openrouter | thudm/glm-4-9b:free glm-4-9b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶glm-z1-32b (2 endpoints) | 32k–32k | $0.00–$0.24 | $0.00–$0.24 | – | – | – | – |
openrouter | thudm/glm-z1-32b:free glm-z1-32b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | thudm/glm-z1-32b glm-z1-32b | 32k | $0.24 | $0.24 | – | – | – | – |
openrouter | thudm/glm-z1-9b:free glm-z1-9b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | thudm/glm-z1-rumination-32b glm-z1-rumination-32b | 32k | $0.24 | $0.24 | – | – | – | – |
openrouter | alpindale/goliath-120b goliath-120b | 6k | $10.00 | $12.50 | – | – | – | – |
openai, azure, openrouter | ▶gpt-3.5-turbo-16k (4 endpoints) | 16k | $3.00 | $4.00 | – | – | – | – |
openai | gpt-3.5-turbo-16k | 16k | $3.00 | $4.00 | – | – | – | – |
azure | azure/gpt-35-turbo-16k gpt-35-turbo-16k | 16k | $3.00 | $4.00 | – | – | – | – |
openrouter | openai/gpt-3.5-turbo-16k gpt-3.5-turbo-16k | 16k | $3.00 | $4.00 | – | – | – | – |
azure | azure/gpt-35-turbo-16k-0613 gpt-35-turbo-16k-0613 | 16k | $3.00 | $4.00 | – | – | – | – |
openrouter | openai/gpt-3.5-turbo-instruct gpt-3.5-turbo-instruct | 4k | $1.50 | $2.00 | – | – | – | – |
azure, openrouter | ▶gpt-4-32k (4 endpoints) | 32k–32k | $60.00 | $120.00 | – | – | – | – |
azure | azure/gpt-4-32k gpt-4-32k | 32k | $60.00 | $120.00 | – | – | – | – |
azure | azure/gpt-4-32k-0613 gpt-4-32k-0613 | 32k | $60.00 | $120.00 | – | – | – | – |
openrouter | openai/gpt-4-32k gpt-4-32k | 32k | $60.00 | $120.00 | – | – | – | – |
openrouter | openai/gpt-4-32k-0314 gpt-4-32k-0314 | 32k | $60.00 | $120.00 | – | – | – | – |
openai, azure | ▶gpt-4o-audio-preview (4 endpoints) | 128k | $2.50 | $10.00 | – | – | – | – |
openai | gpt-4o-audio-preview | 128k | $2.50 | $10.00 | – | – | – | – |
openai | gpt-4o-audio-preview-2024-10-01 | 128k | $2.50 | $10.00 | – | – | – | – |
openai | gpt-4o-audio-preview-2024-12-17 | 128k | $2.50 | $10.00 | – | – | – | – |
azure | azure/gpt-4o-audio-preview-2024-12-17 gpt-4o-audio-preview-2024-12-17 | 128k | $2.50 | $10.00 | – | – | – | – |
openrouter | openai/gpt-4o:extended gpt-4o:extended | 128k | $6.00 | $18.00 | – | – | – | – |
openai, azure | ▶gpt-4o-mini-audio-preview-2024-12-17 (2 endpoints) | 128k | $0.15–$2.50 | $0.60–$10.00 | – | – | – | – |
openai | gpt-4o-mini-audio-preview-2024-12-17 | 128k | $0.15 | $0.60 | – | – | – | – |
azure | azure/gpt-4o-mini-audio-preview-2024-12-17 gpt-4o-mini-audio-preview-2024-12-17 | 128k | $2.50 | $10.00 | – | – | – | – |
openai, azure | ▶gpt-4o-mini-realtime-preview (5 endpoints) | 128k | $0.60–$0.66 | $2.40–$2.64 | – | – | – | – |
openai | gpt-4o-mini-realtime-preview | 128k | $0.60 | $2.40 | – | – | – | – |
openai | gpt-4o-mini-realtime-preview-2024-12-17 | 128k | $0.60 | $2.40 | – | – | – | – |
azure | azure/gpt-4o-mini-realtime-preview-2024-12-17 gpt-4o-mini-realtime-preview-2024-12-17 | 128k | $0.60 | $2.40 | – | – | – | – |
azure | azure/eu/gpt-4o-mini-realtime-preview-2024-12-17 gpt-4o-mini-realtime-preview-2024-12-17 | 128k | $0.66 | $2.64 | – | – | – | – |
azure | azure/us/gpt-4o-mini-realtime-preview-2024-12-17 gpt-4o-mini-realtime-preview-2024-12-17 | 128k | $0.66 | $2.64 | – | – | – | – |
openai, openrouter | ▶gpt-4o-mini-search-preview (3 endpoints) | 128k | $0.15 | $0.60 | – | – | – | – |
openai | gpt-4o-mini-search-preview | 128k | $0.15 | $0.60 | – | – | – | – |
openrouter | openai/gpt-4o-mini-search-preview gpt-4o-mini-search-preview | 128k | $0.15 | $0.60 | – | – | – | – |
openai | gpt-4o-mini-search-preview-2025-03-11 | 128k | $0.15 | $0.60 | – | – | – | – |
openai, azure | ▶gpt-4o-realtime-preview (9 endpoints) | 128k | $5.00–$5.50 | $20.00–$22.00 | – | – | – | – |
openai | gpt-4o-realtime-preview | 128k | $5.00 | $20.00 | – | – | – | – |
openai | gpt-4o-realtime-preview-2024-10-01 | 128k | $5.00 | $20.00 | – | – | – | – |
azure | azure/gpt-4o-realtime-preview-2024-10-01 gpt-4o-realtime-preview-2024-10-01 | 128k | $5.00 | $20.00 | – | – | – | – |
openai | gpt-4o-realtime-preview-2024-12-17 | 128k | $5.00 | $20.00 | – | – | – | – |
azure | azure/gpt-4o-realtime-preview-2024-12-17 gpt-4o-realtime-preview-2024-12-17 | 128k | $5.00 | $20.00 | – | – | – | – |
azure | azure/us/gpt-4o-realtime-preview-2024-10-01 gpt-4o-realtime-preview-2024-10-01 | 128k | $5.50 | $22.00 | – | – | – | – |
azure | azure/eu/gpt-4o-realtime-preview-2024-10-01 gpt-4o-realtime-preview-2024-10-01 | 128k | $5.50 | $22.00 | – | – | – | – |
azure | azure/us/gpt-4o-realtime-preview-2024-12-17 gpt-4o-realtime-preview-2024-12-17 | 128k | $5.50 | $22.00 | – | – | – | – |
azure | azure/eu/gpt-4o-realtime-preview-2024-12-17 gpt-4o-realtime-preview-2024-12-17 | 128k | $5.50 | $22.00 | – | – | – | – |
openai, openrouter | ▶gpt-4o-search-preview (3 endpoints) | 128k | $2.50 | $10.00 | – | – | – | – |
openai | gpt-4o-search-preview | 128k | $2.50 | $10.00 | – | – | – | – |
openrouter | openai/gpt-4o-search-preview gpt-4o-search-preview | 128k | $2.50 | $10.00 | – | – | – | – |
openai | gpt-4o-search-preview-2025-03-11 | 128k | $2.50 | $10.00 | – | – | – | – |
openai, openrouter | ▶gpt-4-turbo-preview (2 endpoints) | 128k | $10.00 | $30.00 | – | – | – | – |
openai | gpt-4-turbo-preview | 128k | $10.00 | $30.00 | – | – | – | – |
openrouter | openai/gpt-4-turbo-preview gpt-4-turbo-preview | 128k | $10.00 | $30.00 | – | – | – | – |
azure | azure/gpt-4-turbo-vision-preview gpt-4-turbo-vision-preview | 128k | $10.00 | $30.00 | – | – | – | – |
watsonx | watsonx/ibm/granite-3-8b-instruct granite-3-8b-instruct | 8k | $200.00 | $200.00 | – | – | – | – |
xai, openrouter | ▶grok-2-vision (4 endpoints) | 32k | $2.00 | $10.00 | – | – | – | – |
xai | xai/grok-2-vision grok-2-vision | 32k | $2.00 | $10.00 | – | – | – | – |
xai | xai/grok-2-vision-1212 grok-2-vision-1212 | 32k | $2.00 | $10.00 | – | – | – | – |
openrouter | x-ai/grok-2-vision-1212 grok-2-vision-1212 | 32k | $2.00 | $10.00 | – | – | – | – |
xai | xai/grok-2-vision-latest grok-2-vision-latest | 32k | $2.00 | $10.00 | – | – | – | – |
xai | xai/grok-3-fast-betaℹ️ grok-3-fast-beta | 131k | $5.00 | $25.00 | – | – | – | – |
xai | xai/grok-3-fast-latestℹ️ grok-3-fast-latest | 131k | $5.00 | $25.00 | – | – | – | – |
xai | xai/grok-3-mini-fast-betaℹ️ grok-3-mini-fast-beta | 131k | $0.60 | $4.00 | – | – | – | – |
xai | xai/grok-3-mini-fast-latestℹ️ grok-3-mini-fast-latest | 131k | $0.60 | $4.00 | – | – | – | – |
xai, openrouter | ▶grok-beta (2 endpoints) | 131k | $5.00 | $15.00 | – | – | – | – |
xai | xai/grok-beta grok-beta | 131k | $5.00 | $15.00 | – | – | – | – |
openrouter | x-ai/grok-beta grok-beta | 131k | $5.00 | $15.00 | – | – | – | – |
xai, openrouter | ▶grok-vision-beta (2 endpoints) | 8k | $5.00 | $15.00 | – | – | – | – |
xai | xai/grok-vision-beta grok-vision-beta | 8k | $5.00 | $15.00 | – | – | – | – |
openrouter | x-ai/grok-vision-beta grok-vision-beta | 8k | $5.00 | $15.00 | – | – | – | – |
openrouter | nousresearch/hermes-2-pro-llama-3-8b hermes-2-pro-llama-3-8b | 131k | $0.025 | $0.04 | – | – | – | – |
lambda | hermes3-405b | 131k | $0.80 | $0.80 | – | – | – | – |
lambda | hermes3-70b | 131k | $0.12 | $0.30 | – | – | – | – |
lambda | hermes3-8b | 131k | $0.025 | $0.04 | – | – | – | – |
openrouter | nousresearch/hermes-3-llama-3.1-405b hermes-3-llama-3.1-405b | 131k | $0.80 | $0.80 | – | – | – | – |
openrouter | nousresearch/hermes-3-llama-3.1-70b hermes-3-llama-3.1-70b | 131k | $0.12 | $0.30 | – | – | – | – |
openrouter | inflection/inflection-3-pi inflection-3-pi | 8k | $2.50 | $10.00 | – | – | – | – |
openrouter | inflection/inflection-3-productivity inflection-3-productivity | 8k | $2.50 | $10.00 | – | – | – | – |
openrouter | opengvlab/internvl3-14b:free internvl3-14b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | opengvlab/internvl3-2b:free internvl3-2b | 32k | $0.00 | $0.00 | – | – | – | – |
bedrock | ai21.j2-mid-v1 j2-mid-v1 | 8k | $12.50 | $12.50 | – | – | – | – |
bedrock | ai21.j2-ultra-v1 j2-ultra-v1 | 8k | $18.80 | $18.80 | – | – | – | – |
vertex_ai-ai21_models, ai21 | ▶jamba-1.5 (2 endpoints) | 256k | $0.20 | $0.40 | – | – | – | – |
vertex_ai-ai21_models | vertex_ai/jamba-1.5 jamba-1.5 | 256k | $0.20 | $0.40 | – | – | – | – |
ai21 | jamba-1.5 | 256k | $0.20 | $0.40 | – | – | – | – |
vertex_ai-ai21_models, ai21, bedrock | ▶jamba-1.5-large (3 endpoints) | 256k | $2.00 | $8.00 | – | – | – | – |
vertex_ai-ai21_models | vertex_ai/jamba-1.5-large jamba-1.5-large | 256k | $2.00 | $8.00 | – | – | – | – |
ai21 | jamba-1.5-large | 256k | $2.00 | $8.00 | – | – | – | – |
bedrock | ai21.jamba-1-5-large-v1:0 jamba-1-5-large-v1.0 | 256k | $2.00 | $8.00 | – | – | – | – |
vertex_ai-ai21_models, ai21 | ▶jamba-1.5-large@001 (2 endpoints) | 256k | $2.00 | $8.00 | – | – | – | – |
vertex_ai-ai21_models | vertex_ai/jamba-1.5-large@001 jamba-1.5-large@001 | 256k | $2.00 | $8.00 | – | – | – | – |
ai21 | jamba-1.5-large@001 | 256k | $2.00 | $8.00 | – | – | – | – |
vertex_ai-ai21_models, ai21, bedrock | ▶jamba-1.5-mini (3 endpoints) | 256k | $0.20 | $0.40 | – | – | – | – |
vertex_ai-ai21_models | vertex_ai/jamba-1.5-mini jamba-1.5-mini | 256k | $0.20 | $0.40 | – | – | – | – |
ai21 | jamba-1.5-mini | 256k | $0.20 | $0.40 | – | – | – | – |
bedrock | ai21.jamba-1-5-mini-v1:0 jamba-1-5-mini-v1.0 | 256k | $0.20 | $0.40 | – | – | – | – |
vertex_ai-ai21_models, ai21 | ▶jamba-1.5-mini@001 (2 endpoints) | 256k | $0.20 | $0.40 | – | – | – | – |
vertex_ai-ai21_models | vertex_ai/jamba-1.5-mini@001 jamba-1.5-mini@001 | 256k | $0.20 | $0.40 | – | – | – | – |
ai21 | jamba-1.5-mini@001 | 256k | $0.20 | $0.40 | – | – | – | – |
openrouter | ai21/jamba-1.6-large jamba-1.6-large | 256k | $2.00 | $8.00 | – | – | – | – |
openrouter | ai21/jamba-1.6-mini jamba-1.6-mini | 256k | $0.20 | $0.40 | – | – | – | – |
openrouter, azure_ai, bedrock | ▶jamba-instruct (3 endpoints) | 70k–256k | $0.50 | $0.70 | – | – | – | – |
openrouter | ai21/jamba-instruct jamba-instruct | 256k | $0.50 | $0.70 | – | – | – | – |
azure_ai | azure_ai/jamba-instruct jamba-instruct | 70k | $0.50 | $0.70 | – | – | – | – |
bedrock | ai21.jamba-instruct-v1:0 jamba-instruct-v1.0 | 70k | $0.50 | $0.70 | – | – | – | – |
ai21 | jamba-large-1.6 | 256k | $2.00 | $8.00 | – | – | – | – |
ai21 | jamba-mini-1.6 | 256k | $0.20 | $0.40 | – | – | – | – |
openrouter | moonshotai/kimi-vl-a3b-thinking:free kimi-vl-a3b-thinking | 131k | $0.00 | $0.00 | – | – | – | – |
openrouter | sao10k/l3.1-euryale-70b l3.1-euryale-70b | 131k | $0.70 | $0.80 | – | – | – | – |
openrouter | sao10k/l3.3-euryale-70b l3.3-euryale-70b | 131k | $0.70 | $0.80 | – | – | – | – |
openrouter | sao10k/l3-euryale-70b l3-euryale-70b | 8k | $1.48 | $1.48 | – | – | – | – |
openrouter | sao10k/l3-lunaris-8b l3-lunaris-8b | 8k | $0.02 | $0.05 | – | – | – | – |
gemini | gemini/learnlm-1.5-pro-experimentalℹ️ learnlm-1.5-pro-experimental | 32k | $0.00 >128k: $0.00 | $0.00 >128k: $0.00 | – | – | – | – |
openrouter | liquid/lfm-3b lfm-3b | 32k | $0.02 | $0.02 | – | – | – | – |
lambda, openrouter | ▶lfm-40b (2 endpoints) | 32k–66k | $0.15 | $0.15 | – | – | – | – |
lambda | lfm-40b | 66k | $0.15 | $0.15 | – | – | – | – |
openrouter | liquid/lfm-40b lfm-40b | 32k | $0.15 | $0.15 | – | – | – | – |
openrouter | liquid/lfm-7b lfm-7b | 32k | $0.01 | $0.01 | – | – | – | – |
replicate | replicate/meta/llama-2-13b llama-2-13b | 4k | $0.10 | $0.50 | – | – | – | – |
replicate, deepinfra, anyscale | ▶llama-2-13b-chat (3 endpoints) | 4k | $0.10–$0.25 | $0.22–$0.50 | – | – | – | – |
replicate | replicate/meta/llama-2-13b-chat llama-2-13b-chat | 4k | $0.10 | $0.50 | – | – | – | – |
deepinfra | deepinfra/meta-llama/Llama-2-13b-chat-hf llama-2-13b-chat | 4k | $0.22 | $0.22 | – | – | – | – |
anyscale | anyscale/meta-llama/Llama-2-13b-chat-hf llama-2-13b-chat | 4k | $0.25 | $0.25 | – | – | – | – |
bedrock | meta.llama2-13b-chat-v1 llama2-13b-chat-v1 | 4k | $0.75 | $1.00 | – | – | – | – |
replicate, groq | ▶llama-2-70b (2 endpoints) | 4k | $0.65–$0.70 | $0.80–$2.75 | – | – | – | – |
replicate | replicate/meta/llama-2-70b llama-2-70b | 4k | $0.65 | $2.75 | – | – | – | – |
groq | groq/llama2-70b-4096 llama2-70b-4096 | 4k | $0.70 | $0.80 | – | – | – | – |
bedrock | meta.llama2-70b-chat-v1 llama2-70b-chat-v1 | 4k | $1.95 | $2.56 | – | – | – | – |
replicate | replicate/meta/llama-2-7b llama-2-7b | 4k | $0.05 | $0.25 | – | – | – | – |
replicate, deepinfra, anyscale | ▶llama-2-7b-chat (3 endpoints) | 4k | $0.05–$0.15 | $0.13–$0.25 | – | – | – | – |
replicate | replicate/meta/llama-2-7b-chat llama-2-7b-chat | 4k | $0.05 | $0.25 | – | – | – | – |
deepinfra | deepinfra/meta-llama/Llama-2-7b-chat-hf llama-2-7b-chat | 4k | $0.13 | $0.13 | – | – | – | – |
anyscale | anyscale/meta-llama/Llama-2-7b-chat-hf llama-2-7b-chat | 4k | $0.15 | $0.15 | – | – | – | – |
cloudflare | cloudflare/@cf/meta/llama-2-7b-chat-fp16 llama-2-7b-chat-fp16 | 3k | $1.923 | $1.923 | – | – | – | – |
cloudflare | cloudflare/@cf/meta/llama-2-7b-chat-int8 llama-2-7b-chat-int8 | 2k | $1.923 | $1.923 | – | – | – | – |
openrouter | ▶llama-3.1-405b (2 endpoints) | 32k–64k | $0.00–$2.00 | $0.00–$2.00 | – | – | – | – |
openrouter | meta-llama/llama-3.1-405b:free llama-3.1-405b | 64k | $0.00 | $0.00 | – | – | – | – |
openrouter | meta-llama/llama-3.1-405b llama-3.1-405b | 32k | $2.00 | $2.00 | – | – | – | – |
lambda | llama3.1-405b-instruct-fp8 | 131k | $0.80 | $0.80 | – | – | – | – |
groq | groq/llama-3.1-405b-reasoning llama-3.1-405b-reasoning | 8k | $0.59 | $0.79 | – | – | – | – |
cerebras | cerebras/llama3.1-70b llama3.1-70b | 128k | $0.60 | $0.60 | – | – | – | – |
lambda | llama3.1-70b-instruct-fp8 | 131k | $0.12 | $0.30 | – | – | – | – |
groq | groq/llama-3.1-70b-versatile llama-3.1-70b-versatile | 8k | $0.59 | $0.79 | – | – | – | – |
cerebras | cerebras/llama3.1-8b llama3.1-8b | 128k | $0.10 | $0.10 | – | – | – | – |
groq | groq/llama-3.1-8b-instant llama-3.1-8b-instant | 128k | $0.05 | $0.08 | – | – | – | – |
openrouter | neversleep/llama-3.1-lumimaid-70b llama-3.1-lumimaid-70b | 16k | $2.50 | $3.00 | – | – | – | – |
openrouter | neversleep/llama-3.1-lumimaid-8b llama-3.1-lumimaid-8b | 32k | $0.20 | $1.25 | – | – | – | – |
openrouter | nvidia/llama-3.1-nemotron-70b-instruct llama-3.1-nemotron-70b-instruct | 131k | $0.12 | $0.30 | – | – | – | – |
lambda | llama3.1-nemotron-70b-instruct-fp8 | 131k | $0.12 | $0.30 | – | – | – | – |
openrouter | nvidia/llama-3.1-nemotron-ultra-253b-v1:free llama-3.1-nemotron-ultra-253b-v1 | 131k | $0.00 | $0.00 | – | – | – | – |
perplexity | perplexity/llama-3.1-sonar-huge-128k-online llama-3.1-sonar-huge-128k-online | 127k | $5.00 | $5.00 | – | – | – | – |
perplexity | perplexity/llama-3.1-sonar-large-128k-chat llama-3.1-sonar-large-128k-chat | 131k | $1.00 | $1.00 | – | – | – | – |
perplexity, openrouter | ▶llama-3.1-sonar-large-128k-online (2 endpoints) | 127k | $1.00 | $1.00 | – | – | – | – |
perplexity | perplexity/llama-3.1-sonar-large-128k-online llama-3.1-sonar-large-128k-online | 127k | $1.00 | $1.00 | – | – | – | – |
openrouter | perplexity/llama-3.1-sonar-large-128k-online llama-3.1-sonar-large-128k-online | 127k | $1.00 | $1.00 | – | – | – | – |
perplexity | perplexity/llama-3.1-sonar-small-128k-chat llama-3.1-sonar-small-128k-chat | 131k | $0.20 | $0.20 | – | – | – | – |
perplexity, openrouter | ▶llama-3.1-sonar-small-128k-online (2 endpoints) | 127k | $0.20 | $0.20 | – | – | – | – |
perplexity | perplexity/llama-3.1-sonar-small-128k-online llama-3.1-sonar-small-128k-online | 127k | $0.20 | $0.20 | – | – | – | – |
openrouter | perplexity/llama-3.1-sonar-small-128k-online llama-3.1-sonar-small-128k-online | 127k | $0.20 | $0.20 | – | – | – | – |
openrouter | scb10x/llama3.1-typhoon2-70b-instruct llama3.1-typhoon2-70b-instruct | 8k | $0.88 | $0.88 | – | – | – | – |
openrouter | scb10x/llama3.1-typhoon2-8b-instruct llama3.1-typhoon2-8b-instruct | 8k | $0.18 | $0.18 | – | – | – | – |
bedrock | ▶llama3-2-11b-instruct-v1.0 (2 endpoints) | 128k | $0.35 | $0.35 | – | – | – | – |
bedrock | meta.llama3-2-11b-instruct-v1:0 llama3-2-11b-instruct-v1.0 | 128k | $0.35 | $0.35 | – | – | – | – |
bedrock | us.meta.llama3-2-11b-instruct-v1:0 llama3-2-11b-instruct-v1.0 | 128k | $0.35 | $0.35 | – | – | – | – |
groq | groq/llama-3.2-11b-text-preview llama-3.2-11b-text-preview | 8k | $0.18 | $0.18 | – | – | – | – |
openrouter, azure_ai | ▶llama-3.2-11b-vision-instruct (3 endpoints) | 128k–131k | $0.00–$0.37 | $0.00–$0.37 | – | – | – | – |
openrouter | meta-llama/llama-3.2-11b-vision-instruct:free llama-3.2-11b-vision-instruct | 131k | $0.00 | $0.00 | – | – | – | – |
openrouter | meta-llama/llama-3.2-11b-vision-instruct llama-3.2-11b-vision-instruct | 131k | $0.049 | $0.049 | – | – | – | – |
azure_ai | azure_ai/Llama-3.2-11B-Vision-Instructℹ️ llama-3.2-11b-vision-instruct | 128k | $0.37 | $0.37 | – | – | – | – |
groq | groq/llama-3.2-11b-vision-preview llama-3.2-11b-vision-preview | 8k | $0.18 | $0.18 | – | – | – | – |
openrouter, bedrock | ▶llama-3.2-1b-instruct (5 endpoints) | 128k–131k | $0.00–$0.13 | $0.00–$0.13 | – | – | – | – |
openrouter | meta-llama/llama-3.2-1b-instruct llama-3.2-1b-instruct | 131k | $0.005 | $0.01 | – | – | – | – |
openrouter | meta-llama/llama-3.2-1b-instruct:free llama-3.2-1b-instruct | 131k | $0.00 | $0.00 | – | – | – | – |
bedrock | meta.llama3-2-1b-instruct-v1:0 llama3-2-1b-instruct-v1.0 | 128k | $0.10 | $0.10 | – | – | – | – |
bedrock | us.meta.llama3-2-1b-instruct-v1:0 llama3-2-1b-instruct-v1.0 | 128k | $0.10 | $0.10 | – | – | – | – |
bedrock | eu.meta.llama3-2-1b-instruct-v1:0 llama3-2-1b-instruct-v1.0 | 128k | $0.13 | $0.13 | – | – | – | – |
groq | groq/llama-3.2-1b-preview llama-3.2-1b-preview | 8k | $0.04 | $0.04 | – | – | – | – |
openrouter, lambda, bedrock | ▶llama-3.2-3b-instruct (6 endpoints) | 20k–131k | $0.00–$0.19 | $0.00–$0.19 | – | – | – | – |
openrouter | meta-llama/llama-3.2-3b-instruct llama-3.2-3b-instruct | 131k | $0.01 | $0.02 | – | – | – | – |
lambda | llama3.2-3b-instruct | 131k | $0.015 | $0.025 | – | – | – | – |
bedrock | meta.llama3-2-3b-instruct-v1:0 llama3-2-3b-instruct-v1.0 | 128k | $0.15 | $0.15 | – | – | – | – |
bedrock | us.meta.llama3-2-3b-instruct-v1:0 llama3-2-3b-instruct-v1.0 | 128k | $0.15 | $0.15 | – | – | – | – |
bedrock | eu.meta.llama3-2-3b-instruct-v1:0 llama3-2-3b-instruct-v1.0 | 128k | $0.19 | $0.19 | – | – | – | – |
openrouter | meta-llama/llama-3.2-3b-instruct:free llama-3.2-3b-instruct | 20k | $0.00 | $0.00 | – | – | – | – |
groq | groq/llama-3.2-3b-preview llama-3.2-3b-preview | 8k | $0.06 | $0.06 | – | – | – | – |
bedrock | ▶llama3-2-90b-instruct-v1.0 (2 endpoints) | 128k | $2.00 | $2.00 | – | – | – | – |
bedrock | meta.llama3-2-90b-instruct-v1:0 llama3-2-90b-instruct-v1.0 | 128k | $2.00 | $2.00 | – | – | – | – |
bedrock | us.meta.llama3-2-90b-instruct-v1:0 llama3-2-90b-instruct-v1.0 | 128k | $2.00 | $2.00 | – | – | – | – |
groq | groq/llama-3.2-90b-text-preview llama-3.2-90b-text-preview | 8k | $0.90 | $0.90 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama-3.2-90b-vision-instruct-maasℹ️ llama-3.2-90b-vision-instruct-maas | 128k | $0.00 | $0.00 | – | – | – | – |
groq | groq/llama-3.2-90b-vision-preview llama-3.2-90b-vision-preview | 8k | $0.90 | $0.90 | – | – | – | – |
cerebras | cerebras/llama-3.3-70b llama-3.3-70b | 128k | $0.85 | $1.20 | – | – | – | – |
lambda | llama3.3-70b-instruct-fp8 | 131k | $0.12 | $0.30 | – | – | – | – |
together_ai | together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo llama-3.3-70b-instruct-turbo | – | $0.88 | $0.88 | – | – | – | – |
together_ai | together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo-Free llama-3.3-70b-instruct-turbo-free | – | $0.00 | $0.00 | – | – | – | – |
groq | groq/llama-3.3-70b-specdec llama-3.3-70b-specdec | 8k | $0.59 | $0.99 | – | – | – | – |
groq | groq/llama-3.3-70b-versatile llama-3.3-70b-versatile | 128k | $0.59 | $0.79 | – | – | – | – |
openrouter | meta-llama/llama-3.3-8b-instruct:free llama-3.3-8b-instruct | 128k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶llama-3.3-nemotron-super-49b-v1 (2 endpoints) | 131k | $0.00–$0.13 | $0.00–$0.40 | – | – | – | – |
openrouter | nvidia/llama-3.3-nemotron-super-49b-v1:free llama-3.3-nemotron-super-49b-v1 | 131k | $0.00 | $0.00 | – | – | – | – |
openrouter | nvidia/llama-3.3-nemotron-super-49b-v1 llama-3.3-nemotron-super-49b-v1 | 131k | $0.13 | $0.40 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama3-405b-instruct-maasℹ️ llama3-405b-instruct-maas | 32k | $0.00 | $0.00 | – | – | – | – |
groq, replicate | ▶llama-3-70b (2 endpoints) | 8k | $0.59–$0.65 | $0.79–$2.75 | – | – | – | – |
groq | groq/llama3-70b-8192 llama3-70b-8192 | 8k | $0.59 | $0.79 | – | – | – | – |
replicate | replicate/meta/llama-3-70b llama-3-70b | 8k | $0.65 | $2.75 | – | – | – | – |
openrouter, replicate, bedrock | ▶llama-3-70b-instruct (10 endpoints) | 8k | $0.30–$4.45 | $0.40–$5.88 | – | – | – | – |
openrouter | meta-llama/llama-3-70b-instruct llama-3-70b-instruct | 8k | $0.30 | $0.40 | – | – | – | – |
replicate | replicate/meta/llama-3-70b-instruct llama-3-70b-instruct | 8k | $0.65 | $2.75 | – | – | – | – |
bedrock | meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $2.65 | $3.50 | – | – | – | – |
bedrock | bedrock/us-east-1/meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $2.65 | $3.50 | – | – | – | – |
bedrock | bedrock/us-west-1/meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $2.65 | $3.50 | – | – | – | – |
bedrock | bedrock/eu-west-1/meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $2.86 | $3.78 | – | – | – | – |
bedrock | bedrock/ca-central-1/meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $3.05 | $4.03 | – | – | – | – |
bedrock | bedrock/ap-south-1/meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $3.18 | $4.20 | – | – | – | – |
bedrock | bedrock/eu-west-2/meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $3.45 | $4.55 | – | – | – | – |
bedrock | bedrock/sa-east-1/meta.llama3-70b-instruct-v1:0 llama3-70b-instruct-v1.0 | 8k | $4.45 | $5.88 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama3-70b-instruct-maasℹ️ llama3-70b-instruct-maas | 32k | $0.00 | $0.00 | – | – | – | – |
groq, replicate | ▶llama-3-8b (2 endpoints) | 8k–8k | $0.05 | $0.08–$0.25 | – | – | – | – |
groq | groq/llama3-8b-8192 llama3-8b-8192 | 8k | $0.05 | $0.08 | – | – | – | – |
replicate | replicate/meta/llama-3-8b llama-3-8b | 8k | $0.05 | $0.25 | – | – | – | – |
openrouter, bedrock, replicate | ▶llama-3-8b-instruct (10 endpoints) | 8k–8k | $0.03–$0.50 | $0.06–$1.01 | – | – | – | – |
openrouter | meta-llama/llama-3-8b-instruct llama-3-8b-instruct | 8k | $0.03 | $0.06 | – | – | – | – |
bedrock | meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.30 | $0.60 | – | – | – | – |
bedrock | bedrock/us-east-1/meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.30 | $0.60 | – | – | – | – |
bedrock | bedrock/us-west-1/meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.30 | $0.60 | – | – | – | – |
bedrock | bedrock/eu-west-1/meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.32 | $0.65 | – | – | – | – |
bedrock | bedrock/ca-central-1/meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.35 | $0.69 | – | – | – | – |
bedrock | bedrock/ap-south-1/meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.36 | $0.72 | – | – | – | – |
bedrock | bedrock/eu-west-2/meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.39 | $0.78 | – | – | – | – |
bedrock | bedrock/sa-east-1/meta.llama3-8b-instruct-v1:0 llama3-8b-instruct-v1.0 | 8k | $0.50 | $1.01 | – | – | – | – |
replicate | replicate/meta/llama-3-8b-instruct llama-3-8b-instruct | 8k | $0.05 | $0.25 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama3-8b-instruct-maasℹ️ llama3-8b-instruct-maas | 32k | $0.00 | $0.00 | – | – | – | – |
groq | groq/llama3-groq-70b-8192-tool-use-preview llama3-groq-70b-8192-tool-use-preview | 8k | $0.89 | $0.89 | – | – | – | – |
groq | groq/llama3-groq-8b-8192-tool-use-preview llama3-groq-8b-8192-tool-use-preview | 8k | $0.19 | $0.19 | – | – | – | – |
openrouter | neversleep/llama-3-lumimaid-70b llama-3-lumimaid-70b | 8k | $4.00 | $6.00 | – | – | – | – |
openrouter | neversleep/llama-3-lumimaid-8b llama-3-lumimaid-8b | 24k | $0.20 | $1.25 | – | – | – | – |
openrouter | neversleep/llama-3-lumimaid-8b:extended llama-3-lumimaid-8b:extended | 24k | $0.20 | $1.25 | – | – | – | – |
groq, sambanova | ▶llama-4-maverick-17b-128e-instruct (2 endpoints) | 131k | $0.20–$0.63 | $0.60–$1.80 | – | – | – | – |
groq | groq/meta-llama/llama-4-maverick-17b-128e-instruct llama-4-maverick-17b-128e-instruct | 131k | $0.20 | $0.60 | – | – | – | – |
sambanova | sambanova/Llama-4-Maverick-17B-128E-Instructℹ️ llama-4-maverick-17b-128e-instruct | 131k | $0.63 | $1.80 | – | – | – | – |
azure_ai | azure_ai/Llama-4-Maverick-17B-128E-Instruct-FP8ℹ️ llama-4-maverick-17b-128e-instruct-fp8 | 1000k | $1.41 | $0.35 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama-4-maverick-17b-128e-instruct-maasℹ️ llama-4-maverick-17b-128e-instruct-maas | 1000k | $0.35 | $1.15 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama-4-maverick-17b-16e-instruct-maasℹ️ llama-4-maverick-17b-16e-instruct-maas | 1000k | $0.35 | $1.15 | – | – | – | – |
bedrock_converse | ▶llama4-maverick-17b-instruct-v1.0 (2 endpoints) | 128k | $0.24 | $0.97 | – | – | – | – |
bedrock_converse | meta.llama4-maverick-17b-instruct-v1:0 llama4-maverick-17b-instruct-v1.0 | 128k | $0.24 | $0.97 | – | – | – | – |
bedrock_converse | us.meta.llama4-maverick-17b-instruct-v1:0 llama4-maverick-17b-instruct-v1.0 | 128k | $0.24 | $0.97 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/llama4-maverick-instruct-basicℹ️ llama4-maverick-instruct-basic | 131k | $0.22 | $0.88 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama-4-scout-17b-128e-instruct-maasℹ️ llama-4-scout-17b-128e-instruct-maas | 10000k | $0.25 | $0.70 | – | – | – | – |
azure_ai, groq, sambanova, nscale | ▶llama-4-scout-17b-16e-instruct (4 endpoints) | 8k–10000k | $0.09–$0.40 | $0.29–$0.78 | – | – | – | – |
azure_ai | azure_ai/Llama-4-Scout-17B-16E-Instructℹ️ llama-4-scout-17b-16e-instruct | 10000k | $0.20 | $0.78 | – | – | – | – |
groq | groq/meta-llama/llama-4-scout-17b-16e-instruct llama-4-scout-17b-16e-instruct | 131k | $0.11 | $0.34 | – | – | – | – |
sambanova | sambanova/Llama-4-Scout-17B-16E-Instructℹ️ llama-4-scout-17b-16e-instruct | 8k | $0.40 | $0.70 | – | – | – | – |
nscale | nscale/meta-llama/Llama-4-Scout-17B-16E-Instructℹ️ llama-4-scout-17b-16e-instruct | – | $0.09 | $0.29 | – | – | – | – |
vertex_ai-llama_models | vertex_ai/meta/llama-4-scout-17b-16e-instruct-maasℹ️ llama-4-scout-17b-16e-instruct-maas | 10000k | $0.25 | $0.70 | – | – | – | – |
bedrock_converse | ▶llama4-scout-17b-instruct-v1.0 (2 endpoints) | 128k | $0.17 | $0.66 | – | – | – | – |
bedrock_converse | meta.llama4-scout-17b-instruct-v1:0 llama4-scout-17b-instruct-v1.0 | 128k | $0.17 | $0.66 | – | – | – | – |
bedrock_converse | us.meta.llama4-scout-17b-instruct-v1:0 llama4-scout-17b-instruct-v1.0 | 128k | $0.17 | $0.66 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/llama4-scout-instruct-basicℹ️ llama4-scout-instruct-basic | 131k | $0.15 | $0.60 | – | – | – | – |
openrouter | meta-llama/llama-guard-2-8b llama-guard-2-8b | 8k | $0.20 | $0.20 | – | – | – | – |
openrouter, groq | ▶llama-guard-3-8b (2 endpoints) | 8k–131k | $0.02–$0.20 | $0.06–$0.20 | – | – | – | – |
openrouter | meta-llama/llama-guard-3-8b llama-guard-3-8b | 131k | $0.02 | $0.06 | – | – | – | – |
groq | groq/llama-guard-3-8b llama-guard-3-8b | 8k | $0.20 | $0.20 | – | – | – | – |
openrouter | meta-llama/llama-guard-4-12b llama-guard-4-12b | 163k | $0.05 | $0.05 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/llama-v3p1-405b-instructℹ️ llama-v3p1-405b-instruct | 128k | $3.00 | $3.00 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/llama-v3p1-8b-instructℹ️ llama-v3p1-8b-instruct | 16k | $0.10 | $0.10 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instructℹ️ llama-v3p2-11b-vision-instruct | 16k | $0.20 | $0.20 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instructℹ️ llama-v3p2-1b-instruct | 16k | $0.10 | $0.10 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instructℹ️ llama-v3p2-3b-instruct | 16k | $0.10 | $0.10 | – | – | – | – |
fireworks_ai | accounts/fireworks/models/llama-v3p2-90b-vision-instructℹ️ llama-v3p2-90b-vision-instruct | 16k | $0.90 | $0.90 | – | – | – | – |
openrouter | eleutherai/llemma_7b llemma_7b | 4k | $0.80 | $1.20 | – | – | – | – |
aleph_alpha | luminous-base-control | – | $37.50 | $41.25 | – | – | – | – |
aleph_alpha | luminous-extended-control | – | $56.25 | $61.875 | – | – | – | – |
aleph_alpha | luminous-supreme-control | – | $218.75 | $240.625 | – | – | – | – |
deepinfra | deepinfra/lizpreciatior/lzlv_70b_fp16_hf lzlv_70b_fp16_hf | 4k | $0.70 | $0.90 | – | – | – | – |
openrouter | arcee-ai/maestro-reasoning maestro-reasoning | 131k | $0.90 | $3.30 | – | – | – | – |
openrouter | alpindale/magnum-72b magnum-72b | 16k | $4.00 | $6.00 | – | – | – | – |
openrouter | anthracite-org/magnum-v2-72b magnum-v2-72b | 32k | $3.00 | $3.00 | – | – | – | – |
openrouter | anthracite-org/magnum-v4-72b magnum-v4-72b | 16k | $2.50 | $3.00 | – | – | – | – |
openrouter | microsoft/mai-ds-r1:free mai-ds-r1 | 163k | $0.00 | $0.00 | – | – | – | – |
openrouter | inception/mercury-coder-small-beta mercury-coder-small-beta | 32k | $0.25 | $1.00 | – | – | – | – |
azure_ai, deepinfra, sambanova | ▶meta-llama-3.1-405b-instruct (3 endpoints) | 16k–128k | $0.90–$5.33 | $0.90–$16.00 | – | – | – | – |
azure_ai | azure_ai/Meta-Llama-3.1-405B-Instructℹ️ meta-llama-3.1-405b-instruct | 128k | $5.33 | $16.00 | – | – | – | – |
deepinfra | deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct meta-llama-3.1-405b-instruct | 32k | $0.90 | $0.90 | – | – | – | – |
sambanova | sambanova/Meta-Llama-3.1-405B-Instructℹ️ meta-llama-3.1-405b-instruct | 16k | $5.00 | $10.00 | – | – | – | – |
together_ai | together_ai/meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo meta-llama-3.1-405b-instruct-turbo | – | $3.50 | $3.50 | – | – | – | – |
azure_ai, friendliai | ▶meta-llama-3.1-70b-instruct (2 endpoints) | 8k–128k | $0.60–$2.68 | $0.60–$3.54 | – | – | – | – |
azure_ai | azure_ai/Meta-Llama-3.1-70B-Instructℹ️ meta-llama-3.1-70b-instruct | 128k | $2.68 | $3.54 | – | – | – | – |
friendliai | friendliai/meta-llama-3.1-70b-instruct meta-llama-3.1-70b-instruct | 8k | $0.60 | $0.60 | – | – | – | – |
together_ai | together_ai/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo meta-llama-3.1-70b-instruct-turbo | – | $0.88 | $0.88 | – | – | – | – |
together_ai | together_ai/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo meta-llama-3.1-8b-instruct-turbo | – | $0.18 | $0.18 | – | – | – | – |
sambanova | sambanova/Meta-Llama-3.2-1B-Instructℹ️ meta-llama-3.2-1b-instruct | 16k | $0.04 | $0.08 | – | – | – | – |
sambanova | sambanova/Meta-Llama-3.2-3B-Instructℹ️ meta-llama-3.2-3b-instruct | 4k | $0.08 | $0.16 | – | – | – | – |
sambanova | sambanova/Meta-Llama-3.3-70B-Instructℹ️ meta-llama-3.3-70b-instruct | 131k | $0.60 | $1.20 | – | – | – | – |
sambanova | sambanova/Meta-Llama-Guard-3-8Bℹ️ meta-llama-guard-3-8b | 16k | $0.30 | $0.30 | – | – | – | – |
sagemaker | sagemaker/meta-textgeneration-llama-2-13b-f meta-textgeneration-llama-2-13b-f | 4k | $0.00 | $0.00 | – | – | – | – |
sagemaker | sagemaker/meta-textgeneration-llama-2-70b-b-f meta-textgeneration-llama-2-70b-b-f | 4k | $0.00 | $0.00 | – | – | – | – |
sagemaker | sagemaker/meta-textgeneration-llama-2-7b-f meta-textgeneration-llama-2-7b-f | 4k | $0.00 | $0.00 | – | – | – | – |
openrouter | sophosympatheia/midnight-rose-70b midnight-rose-70b | 4k | $0.80 | $0.80 | – | – | – | – |
openrouter | minimax/minimax-01 minimax-01 | 1000k | $0.20 | $1.10 | – | – | – | – |
openrouter, azure_ai | ▶ministral-3b (2 endpoints) | 128k–131k | $0.04 | $0.04 | – | – | – | – |
openrouter | mistralai/ministral-3b ministral-3b | 131k | $0.04 | $0.04 | – | – | – | – |
azure_ai | azure_ai/ministral-3bℹ️ ministral-3b | 128k | $0.04 | $0.04 | – | – | – | – |
openrouter | mistralai/ministral-8b ministral-8b | 128k | $0.10 | $0.10 | – | – | – | – |
openrouter, perplexity | ▶mistral-7b-instruct (3 endpoints) | 4k–32k | $0.00–$0.07 | $0.00–$0.28 | – | – | – | – |
openrouter | mistralai/mistral-7b-instruct:free mistral-7b-instruct | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | mistralai/mistral-7b-instruct mistral-7b-instruct | 32k | $0.028 | $0.054 | – | – | – | – |
perplexity | perplexity/mistral-7b-instruct mistral-7b-instruct | 4k | $0.07 | $0.28 | – | – | – | – |
deepinfra, anyscale, cloudflare, openrouter | ▶mistral-7b-instruct-v0.1 (4 endpoints) | 2k–32k | $0.11–$1.923 | $0.13–$1.923 | – | – | – | – |
deepinfra | deepinfra/mistralai/Mistral-7B-Instruct-v0.1 mistral-7b-instruct-v0.1 | 32k | $0.13 | $0.13 | – | – | – | – |
anyscale | anyscale/mistralai/Mistral-7B-Instruct-v0.1ℹ️ mistral-7b-instruct-v0.1 | 16k | $0.15 | $0.15 | – | – | – | – |
cloudflare | cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 mistral-7b-instruct-v0.1 | 8k | $1.923 | $1.923 | – | – | – | – |
openrouter | mistralai/mistral-7b-instruct-v0.1 mistral-7b-instruct-v0.1 | 2k | $0.11 | $0.19 | – | – | – | – |
openrouter, bedrock, replicate | ▶mistral-7b-instruct-v0.2 (6 endpoints) | 4k–32k | $0.05–$0.20 | $0.20–$0.26 | – | – | – | – |
openrouter | mistralai/mistral-7b-instruct-v0.2 mistral-7b-instruct-v0.2 | 32k | $0.20 | $0.20 | – | – | – | – |
bedrock | mistral.mistral-7b-instruct-v0:2 mistral-7b-instruct-v0.2 | 32k | $0.15 | $0.20 | – | – | – | – |
bedrock | bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 mistral-7b-instruct-v0.2 | 32k | $0.15 | $0.20 | – | – | – | – |
bedrock | bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 mistral-7b-instruct-v0.2 | 32k | $0.15 | $0.20 | – | – | – | – |
bedrock | bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 mistral-7b-instruct-v0.2 | 32k | $0.20 | $0.26 | – | – | – | – |
replicate | replicate/mistralai/mistral-7b-instruct-v0.2 mistral-7b-instruct-v0.2 | 4k | $0.05 | $0.25 | – | – | – | – |
replicate | replicate/mistralai/mistral-7b-v0.1 mistral-7b-v0.1 | 4k | $0.05 | $0.25 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/mistral-large@2411-001 mistral-large@2411-001 | 128k | $2.00 | $6.00 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/mistral-large@latest mistral-large@latest | 128k | $2.00 | $6.00 | – | – | – | – |
deepinfra | deepinfra/amazon/MistralLite mistrallite | 32k | $0.20 | $0.20 | – | – | – | – |
openrouter, mistral | ▶mistral-medium (4 endpoints) | 32k–32k | $2.70–$2.75 | $8.10 | – | – | – | – |
openrouter | mistralai/mistral-medium mistral-medium | 32k | $2.75 | $8.10 | – | – | – | – |
mistral | mistral/mistral-medium mistral-medium | 32k | $2.70 | $8.10 | – | – | – | – |
mistral | mistral/mistral-medium-2312 mistral-medium-2312 | 32k | $2.70 | $8.10 | – | – | – | – |
mistral | mistral/mistral-medium-latest mistral-medium-latest | 32k | $2.70 | $8.10 | – | – | – | – |
openrouter | mistralai/mistral-medium-3 mistral-medium-3 | 131k | $0.40 | $2.00 | – | – | – | – |
openrouter, azure_ai, vertex_ai-mistral_models | ▶mistral-nemo (4 endpoints) | 128k–131k | $0.00–$3.00 | $0.00–$3.00 | – | – | – | – |
openrouter | mistralai/mistral-nemo mistral-nemo | 131k | $0.025 | $0.07 | – | – | – | – |
azure_ai | azure_ai/mistral-nemoℹ️ mistral-nemo | 131k | $0.15 | $0.15 | – | – | – | – |
openrouter | mistralai/mistral-nemo:free mistral-nemo | 128k | $0.00 | $0.00 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/mistral-nemo@2407 mistral-nemo@2407 | 128k | $3.00 | $3.00 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/mistral-nemo@latest mistral-nemo@latest | 128k | $0.15 | $0.15 | – | – | – | – |
openrouter | mistralai/mistral-saba mistral-saba | 32k | $0.20 | $0.60 | – | – | – | – |
groq | groq/mistral-saba-24b mistral-saba-24b | 32k | $0.79 | $0.79 | – | – | – | – |
openrouter | ▶mistral-small-24b-instruct-2501 (2 endpoints) | 28k–32k | $0.00–$0.06 | $0.00–$0.12 | – | – | – | – |
openrouter | mistralai/mistral-small-24b-instruct-2501:free mistral-small-24b-instruct-2501 | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | mistralai/mistral-small-24b-instruct-2501 mistral-small-24b-instruct-2501 | 28k | $0.06 | $0.12 | – | – | – | – |
vertex_ai-mistral_models | vertex_ai/mistral-small-2503@001 mistral-small-2503@001 | 32k | $1.00 | $3.00 | – | – | – | – |
openrouter | ▶mistral-small-3.1-24b-instruct (2 endpoints) | 96k–131k | $0.00–$0.05 | $0.00–$0.15 | – | – | – | – |
openrouter | mistralai/mistral-small-3.1-24b-instruct mistral-small-3.1-24b-instruct | 131k | $0.05 | $0.15 | – | – | – | – |
openrouter | mistralai/mistral-small-3.1-24b-instruct:free mistral-small-3.1-24b-instruct | 96k | $0.00 | $0.00 | – | – | – | – |
openrouter, mistral | ▶mistral-tiny (2 endpoints) | 32k–32k | $0.25 | $0.25 | – | – | – | – |
openrouter | mistralai/mistral-tiny mistral-tiny | 32k | $0.25 | $0.25 | – | – | – | – |
mistral | mistral/mistral-tiny mistral-tiny | 32k | $0.25 | $0.25 | – | – | – | – |
openrouter, fireworks_ai | ▶mixtral-8x22b-instruct (2 endpoints) | 65k | $0.40–$1.20 | $1.20 | – | – | – | – |
openrouter | mistralai/mixtral-8x22b-instruct mixtral-8x22b-instruct | 65k | $0.40 | $1.20 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/mixtral-8x22b-instruct-hfℹ️ mixtral-8x22b-instruct | 65k | $1.20 | $1.20 | – | – | – | – |
anyscale, nscale | ▶mixtral-8x22b-instruct-v0.1 (2 endpoints) | 65k | $0.60–$0.90 | $0.60–$0.90 | – | – | – | – |
anyscale | anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1ℹ️ mixtral-8x22b-instruct-v0.1 | 65k | $0.90 | $0.90 | – | – | – | – |
nscale | nscale/mistralai/mixtral-8x22b-instruct-v0.1ℹ️ mixtral-8x22b-instruct-v0.1 | – | $0.60 | $0.60 | – | – | – | – |
groq | groq/mixtral-8x7b-32768 mixtral-8x7b-32768 | 32k | $0.24 | $0.24 | – | – | – | – |
openrouter, perplexity | ▶mixtral-8x7b-instruct (2 endpoints) | 4k–32k | $0.07–$0.08 | $0.24–$0.28 | – | – | – | – |
openrouter | mistralai/mixtral-8x7b-instruct mixtral-8x7b-instruct | 32k | $0.08 | $0.24 | – | – | – | – |
perplexity | perplexity/mixtral-8x7b-instruct mixtral-8x7b-instruct | 4k | $0.07 | $0.28 | – | – | – | – |
openrouter | nothingiisreal/mn-celeste-12b mn-celeste-12b | 16k | $0.80 | $1.20 | – | – | – | – |
openrouter | infermatic/mn-inferor-12b mn-inferor-12b | 16k | $0.80 | $1.20 | – | – | – | – |
openrouter | aetherwiing/mn-starcannon-12b mn-starcannon-12b | 16k | $0.80 | $1.20 | – | – | – | – |
openrouter | moonshotai/moonlight-16b-a3b-instruct:free moonlight-16b-a3b-instruct | 8k | $0.00 | $0.00 | – | – | – | – |
openrouter | pygmalionai/mythalion-13b mythalion-13b | 4k | $0.80 | $1.20 | – | – | – | – |
openrouter, deepinfra | ▶mythomax-l2-13b (2 endpoints) | 4k | $0.065–$0.22 | $0.065–$0.22 | – | – | – | – |
openrouter | gryphe/mythomax-l2-13b mythomax-l2-13b | 4k | $0.065 | $0.065 | – | – | – | – |
deepinfra | deepinfra/Gryphe/MythoMax-L2-13b mythomax-l2-13b | 4k | $0.22 | $0.22 | – | – | – | – |
openrouter | neversleep/noromaid-20b noromaid-20b | 8k | $1.25 | $2.00 | – | – | – | – |
openrouter | nousresearch/nous-hermes-2-mixtral-8x7b-dpo nous-hermes-2-mixtral-8x7b-dpo | 32k | $0.60 | $0.60 | – | – | – | – |
openrouter | amazon/nova-lite-v1 nova-lite-v1 | 300k | $0.06 | $0.24 | – | – | – | – |
bedrock_converse | ▶nova-lite-v1.0 (3 endpoints) | 128k | $0.06–$0.078 | $0.24–$0.312 | – | – | – | – |
bedrock_converse | amazon.nova-lite-v1:0 nova-lite-v1.0 | 128k | $0.06 | $0.24 | – | – | – | – |
bedrock_converse | us.amazon.nova-lite-v1:0 nova-lite-v1.0 | 128k | $0.06 | $0.24 | – | – | – | – |
bedrock_converse | eu.amazon.nova-lite-v1:0 nova-lite-v1.0 | 128k | $0.078 | $0.312 | – | – | – | – |
openrouter | amazon/nova-micro-v1 nova-micro-v1 | 128k | $0.035 | $0.14 | – | – | – | – |
bedrock_converse | ▶nova-micro-v1.0 (3 endpoints) | 300k | $0.035–$0.046 | $0.14–$0.184 | – | – | – | – |
bedrock_converse | amazon.nova-micro-v1:0 nova-micro-v1.0 | 300k | $0.035 | $0.14 | – | – | – | – |
bedrock_converse | us.amazon.nova-micro-v1:0 nova-micro-v1.0 | 300k | $0.035 | $0.14 | – | – | – | – |
bedrock_converse | eu.amazon.nova-micro-v1:0 nova-micro-v1.0 | 300k | $0.046 | $0.184 | – | – | – | – |
bedrock_converse | us.amazon.nova-premier-v1:0 nova-premier-v1.0 | 1000k | $2.50 | $12.50 | – | – | – | – |
openrouter | amazon/nova-pro-v1 nova-pro-v1 | 300k | $0.80 | $3.20 | – | – | – | – |
bedrock_converse | ▶nova-pro-v1.0 (3 endpoints) | 300k | $0.80–$1.05 | $3.20–$4.20 | – | – | – | – |
bedrock_converse | amazon.nova-pro-v1:0 nova-pro-v1.0 | 300k | $0.80 | $3.20 | – | – | – | – |
bedrock_converse | us.amazon.nova-pro-v1:0 nova-pro-v1.0 | 300k | $0.80 | $3.20 | – | – | – | – |
bedrock_converse | eu.amazon.nova-pro-v1:0ℹ️ nova-pro-v1.0 | 300k | $1.05 | $4.20 | – | – | – | – |
openrouter | allenai/olmo-7b-instruct olmo-7b-instruct | 2k | $0.08 | $0.24 | – | – | – | – |
openrouter | open-r1/olympiccoder-32b:free olympiccoder-32b | 32k | $0.00 | $0.00 | – | – | – | – |
deepinfra | deepinfra/openchat/openchat_3.5 openchat_3.5 | 4k | $0.13 | $0.13 | – | – | – | – |
mistral | mistral/open-codestral-mambaℹ️ open-codestral-mamba | 256k | $0.25 | $0.25 | – | – | – | – |
openrouter | all-hands/openhands-lm-32b-v0.1 openhands-lm-32b-v0.1 | 16k | $2.60 | $3.40 | – | – | – | – |
openrouter | microsoft/phi-3.5-mini-128k-instruct phi-3.5-mini-128k-instruct | 131k | $0.03 | $0.09 | – | – | – | – |
azure_ai | azure_ai/Phi-3.5-mini-instructℹ️ phi-3.5-mini-instruct | 128k | $0.13 | $0.52 | – | – | – | – |
azure_ai | azure_ai/Phi-3.5-MoE-instructℹ️ phi-3.5-moe-instruct | 128k | $0.16 | $0.64 | – | – | – | – |
azure_ai | azure_ai/Phi-3.5-vision-instructℹ️ phi-3.5-vision-instruct | 128k | $0.13 | $0.52 | – | – | – | – |
azure_ai | azure_ai/Phi-3-medium-4k-instructℹ️ phi-3-medium-4k-instruct | 4k | $0.17 | $0.68 | – | – | – | – |
openrouter, azure_ai | ▶phi-3-mini-128k-instruct (2 endpoints) | 128k | $0.10–$0.13 | $0.10–$0.52 | – | – | – | – |
openrouter | microsoft/phi-3-mini-128k-instruct phi-3-mini-128k-instruct | 128k | $0.10 | $0.10 | – | – | – | – |
azure_ai | azure_ai/Phi-3-mini-128k-instructℹ️ phi-3-mini-128k-instruct | 128k | $0.13 | $0.52 | – | – | – | – |
azure_ai | azure_ai/Phi-3-mini-4k-instructℹ️ phi-3-mini-4k-instruct | 4k | $0.13 | $0.52 | – | – | – | – |
azure_ai | azure_ai/Phi-3-small-128k-instructℹ️ phi-3-small-128k-instruct | 128k | $0.15 | $0.60 | – | – | – | – |
azure_ai | azure_ai/Phi-3-small-8k-instructℹ️ phi-3-small-8k-instruct | 8k | $0.15 | $0.60 | – | – | – | – |
azure_ai | azure_ai/Phi-4-mini-instructℹ️ phi-4-mini-instruct | 131k | $0.075 | $0.30 | – | – | – | – |
openrouter, azure_ai | ▶phi-4-multimodal-instruct (2 endpoints) | 131k | $0.05–$0.08 | $0.10–$0.32 | – | – | – | – |
openrouter | microsoft/phi-4-multimodal-instruct phi-4-multimodal-instruct | 131k | $0.05 | $0.10 | – | – | – | – |
azure_ai | azure_ai/Phi-4-multimodal-instructℹ️ phi-4-multimodal-instruct | 131k | $0.08 | $0.32 | – | – | – | – |
openrouter | microsoft/phi-4-reasoning:free phi-4-reasoning | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶phi-4-reasoning-plus (2 endpoints) | 32k | $0.00–$0.07 | $0.00–$0.35 | – | – | – | – |
openrouter | microsoft/phi-4-reasoning-plus:free phi-4-reasoning-plus | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | microsoft/phi-4-reasoning-plus phi-4-reasoning-plus | 32k | $0.07 | $0.35 | – | – | – | – |
deepinfra | deepinfra/Phind/Phind-CodeLlama-34B-v2 phind-codellama-34b-v2 | 16k | $0.60 | $0.60 | – | – | – | – |
mistral, openrouter | ▶pixtral-12b (2 endpoints) | 32k–128k | $0.10–$0.15 | $0.10–$0.15 | – | – | – | – |
mistral | mistral/pixtral-12b-2409 pixtral-12b-2409 | 128k | $0.15 | $0.15 | – | – | – | – |
openrouter | mistralai/pixtral-12b pixtral-12b | 32k | $0.10 | $0.10 | – | – | – | – |
openrouter, mistral | ▶pixtral-large-latest (3 endpoints) | 128k–131k | $2.00 | $6.00 | – | – | – | – |
openrouter | mistralai/pixtral-large-2411 pixtral-large-2411 | 131k | $2.00 | $6.00 | – | – | – | – |
mistral | mistral/pixtral-large-2411 pixtral-large-2411 | 128k | $2.00 | $6.00 | – | – | – | – |
mistral | mistral/pixtral-large-latest pixtral-large-latest | 128k | $2.00 | $6.00 | – | – | – | – |
perplexity | perplexity/pplx-70b-chat pplx-70b-chat | 4k | $0.70 | $2.80 | – | – | – | – |
perplexity | perplexity/pplx-70b-online pplx-70b-online | 4k | $0.00 | $2.80 | – | – | – | – |
perplexity | perplexity/pplx-7b-chat pplx-7b-chat | 8k | $0.07 | $0.28 | – | – | – | – |
perplexity | perplexity/pplx-7b-online pplx-7b-online | 4k | $0.00 | $0.28 | – | – | – | – |
openrouter | ▶qwen-2.5-7b-instruct (2 endpoints) | 32k | $0.00–$0.04 | $0.00–$0.10 | – | – | – | – |
openrouter | qwen/qwen-2.5-7b-instruct:free qwen-2.5-7b-instruct | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen-2.5-7b-instruct qwen-2.5-7b-instruct | 32k | $0.04 | $0.10 | – | – | – | – |
lambda, openrouter, nscale | ▶qwen25-coder-32b-instruct (4 endpoints) | 32k–33k | $0.00–$0.07 | $0.00–$0.20 | – | – | – | – |
lambda | qwen25-coder-32b-instruct | 33k | $0.07 | $0.16 | – | – | – | – |
openrouter | qwen/qwen-2.5-coder-32b-instruct:free qwen-2.5-coder-32b-instruct | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen-2.5-coder-32b-instruct qwen-2.5-coder-32b-instruct | 32k | $0.06 | $0.15 | – | – | – | – |
nscale | nscale/Qwen/Qwen2.5-Coder-32B-Instructℹ️ qwen2.5-coder-32b-instruct | – | $0.06 | $0.20 | – | – | – | – |
nscale | nscale/Qwen/Qwen2.5-Coder-3B-Instructℹ️ qwen2.5-coder-3b-instruct | – | $0.01 | $0.03 | – | – | – | – |
openrouter, nscale | ▶qwen2.5-coder-7b-instruct (2 endpoints) | 32k | $0.01 | $0.03 | – | – | – | – |
openrouter | qwen/qwen2.5-coder-7b-instruct qwen2.5-coder-7b-instruct | 32k | $0.01 | $0.03 | – | – | – | – |
nscale | nscale/Qwen/Qwen2.5-Coder-7B-Instructℹ️ qwen2.5-coder-7b-instruct | – | $0.01 | $0.03 | – | – | – | – |
openrouter | ▶qwen2.5-vl-32b-instruct (2 endpoints) | 8k–128k | $0.00–$0.90 | $0.00–$0.90 | – | – | – | – |
openrouter | qwen/qwen2.5-vl-32b-instruct qwen2.5-vl-32b-instruct | 128k | $0.90 | $0.90 | – | – | – | – |
openrouter | qwen/qwen2.5-vl-32b-instruct:free qwen2.5-vl-32b-instruct | 8k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen2.5-vl-3b-instruct:free qwen2.5-vl-3b-instruct | 64k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶qwen2.5-vl-72b-instruct (2 endpoints) | 32k–131k | $0.00–$0.25 | $0.00–$0.75 | – | – | – | – |
openrouter | qwen/qwen2.5-vl-72b-instruct:free qwen2.5-vl-72b-instruct | 131k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen2.5-vl-72b-instruct qwen2.5-vl-72b-instruct | 32k | $0.25 | $0.75 | – | – | – | – |
openrouter | ▶qwen-2.5-vl-7b-instruct (2 endpoints) | 32k–64k | $0.00–$0.20 | $0.00–$0.20 | – | – | – | – |
openrouter | qwen/qwen-2.5-vl-7b-instruct:free qwen-2.5-vl-7b-instruct | 64k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen-2.5-vl-7b-instruct qwen-2.5-vl-7b-instruct | 32k | $0.20 | $0.20 | – | – | – | – |
sambanova | sambanova/Qwen2-Audio-7B-Instructℹ️ qwen2-audio-7b-instruct | 4k | $0.50 | $100.00 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/qwen2p5-coder-32b-instructℹ️ qwen2p5-coder-32b-instruct | 4k | $0.90 | $0.90 | – | – | – | – |
openrouter | qwen/qwen3-0.6b-04-28:free qwen3-0.6b-04-28 | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶qwen3-14b (2 endpoints) | 40k | $0.00–$0.07 | $0.00–$0.24 | – | – | – | – |
openrouter | qwen/qwen3-14b:free qwen3-14b | 40k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen3-14b qwen3-14b | 40k | $0.07 | $0.24 | – | – | – | – |
openrouter | qwen/qwen3-1.7b:free qwen3-1.7b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶qwen3-235b-a22b (2 endpoints) | 40k | $0.00–$0.14 | $0.00–$0.60 | – | – | – | – |
openrouter | qwen/qwen3-235b-a22b:free qwen3-235b-a22b | 40k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen3-235b-a22b qwen3-235b-a22b | 40k | $0.14 | $0.60 | – | – | – | – |
openrouter | ▶qwen3-30b-a3b (2 endpoints) | 32k–40k | $0.00–$0.08 | $0.00–$0.29 | – | – | – | – |
openrouter | qwen/qwen3-30b-a3b:free qwen3-30b-a3b | 40k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen3-30b-a3b qwen3-30b-a3b | 32k | $0.08 | $0.29 | – | – | – | – |
openrouter, sambanova | ▶qwen3-32b (3 endpoints) | 8k–40k | $0.00–$0.40 | $0.00–$0.80 | – | – | – | – |
openrouter | qwen/qwen3-32b:free qwen3-32b | 40k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen3-32b qwen3-32b | 40k | $0.10 | $0.30 | – | – | – | – |
sambanova | sambanova/Qwen3-32Bℹ️ qwen3-32b | 8k | $0.40 | $0.80 | – | – | – | – |
openrouter | qwen/qwen3-4b:free qwen3-4b | 128k | $0.00 | $0.00 | – | – | – | – |
openrouter | ▶qwen3-8b (2 endpoints) | 40k–128k | $0.00–$0.035 | $0.00–$0.138 | – | – | – | – |
openrouter | qwen/qwen3-8b qwen3-8b | 128k | $0.035 | $0.138 | – | – | – | – |
openrouter | qwen/qwen3-8b:free qwen3-8b | 40k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwen-max qwen-max | 32k | $1.60 | $6.40 | – | – | – | – |
openrouter | qwen/qwen-plus qwen-plus | 131k | $0.40 | $1.20 | – | – | – | – |
groq | groq/qwen-qwq-32b qwen-qwq-32b | 128k | $0.29 | $0.39 | – | – | – | – |
openrouter | qwen/qwen-turbo qwen-turbo | 1000k | $0.05 | $0.20 | – | – | – | – |
openrouter | qwen/qwen-vl-max qwen-vl-max | 7k | $0.80 | $3.20 | – | – | – | – |
openrouter | qwen/qwen-vl-plus qwen-vl-plus | 7k | $0.21 | $0.63 | – | – | – | – |
openrouter | featherless/qwerky-72b:free qwerky-72b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter, sambanova, nscale | ▶qwq-32b (4 endpoints) | 16k–131k | $0.00–$0.50 | $0.00–$1.00 | – | – | – | – |
openrouter | qwen/qwq-32b qwq-32b | 131k | $0.15 | $0.20 | – | – | – | – |
openrouter | qwen/qwq-32b:free qwq-32b | 40k | $0.00 | $0.00 | – | – | – | – |
sambanova | sambanova/QwQ-32Bℹ️ qwq-32b | 16k | $0.50 | $1.00 | – | – | – | – |
nscale | nscale/Qwen/QwQ-32Bℹ️ qwq-32b | – | $0.18 | $0.20 | – | – | – | – |
openrouter | arliai/qwq-32b-arliai-rpr-v1:free qwq-32b-arliai-rpr-v1 | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | qwen/qwq-32b-preview qwq-32b-preview | 32k | $0.09 | $0.27 | – | – | – | – |
openrouter | perplexity/r1-1776 r1-1776 | 128k | $2.00 | $8.00 | – | – | – | – |
openrouter | rekaai/reka-flash-3:free reka-flash-3 | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | undi95/remm-slerp-l2-13b remm-slerp-l2-13b | 4k | $0.80 | $1.20 | – | – | – | – |
openrouter | thedrummer/rocinante-12b rocinante-12b | 32k | $0.25 | $0.50 | – | – | – | – |
openrouter | shisa-ai/shisa-v2-llama3.3-70b:free shisa-v2-llama3.3-70b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | thedrummer/skyfall-36b-v2 skyfall-36b-v2 | 32k | $0.50 | $0.80 | – | – | – | – |
perplexity, openrouter | ▶sonar (2 endpoints) | 127k–128k | $1.00 | $1.00 | – | – | – | – |
perplexity | perplexity/sonar sonar | 128k | $1.00 | $1.00 | – | – | – | – |
openrouter | perplexity/sonar sonar | 127k | $1.00 | $1.00 | – | – | – | – |
perplexity, openrouter | ▶sonar-deep-research (2 endpoints) | 128k | $2.00 | $8.00 | – | – | – | – |
perplexity | perplexity/sonar-deep-research sonar-deep-research | 128k | $2.00 | $8.00 | – | – | – | – |
openrouter | perplexity/sonar-deep-research sonar-deep-research | 128k | $2.00 | $8.00 | – | – | – | – |
perplexity | perplexity/sonar-medium-chat sonar-medium-chat | 16k | $0.60 | $1.80 | – | – | – | – |
perplexity | perplexity/sonar-medium-online sonar-medium-online | 12k | $0.00 | $1.80 | – | – | – | – |
perplexity, openrouter | ▶sonar-pro (2 endpoints) | 200k | $3.00 | $15.00 | – | – | – | – |
perplexity | perplexity/sonar-pro sonar-pro | 200k | $3.00 | $15.00 | – | – | – | – |
openrouter | perplexity/sonar-pro sonar-pro | 200k | $3.00 | $15.00 | – | – | – | – |
perplexity, openrouter | ▶sonar-reasoning (2 endpoints) | 127k–128k | $1.00 | $5.00 | – | – | – | – |
perplexity | perplexity/sonar-reasoning sonar-reasoning | 128k | $1.00 | $5.00 | – | – | – | – |
openrouter | perplexity/sonar-reasoning sonar-reasoning | 127k | $1.00 | $5.00 | – | – | – | – |
perplexity, openrouter | ▶sonar-reasoning-pro (2 endpoints) | 128k | $2.00 | $8.00 | – | – | – | – |
perplexity | perplexity/sonar-reasoning-pro sonar-reasoning-pro | 128k | $2.00 | $8.00 | – | – | – | – |
openrouter | perplexity/sonar-reasoning-pro sonar-reasoning-pro | 128k | $2.00 | $8.00 | – | – | – | – |
perplexity | perplexity/sonar-small-chat sonar-small-chat | 16k | $0.07 | $0.28 | – | – | – | – |
perplexity | perplexity/sonar-small-online sonar-small-online | 12k | $0.00 | $0.28 | – | – | – | – |
openrouter | raifle/sorcererlm-8x22b sorcererlm-8x22b | 16k | $4.50 | $4.50 | – | – | – | – |
openrouter | arcee-ai/spotlight spotlight | 131k | $0.18 | $0.18 | – | – | – | – |
bedrock | amazon.titan-text-express-v1 titan-text-express-v1 | 42k | $1.30 | $1.70 | – | – | – | – |
bedrock | amazon.titan-text-lite-v1 titan-text-lite-v1 | 42k | $0.30 | $0.40 | – | – | – | – |
bedrock | amazon.titan-text-premier-v1:0 titan-text-premier-v1.0 | 42k | $0.50 | $1.50 | – | – | – | – |
together_ai | together-ai-21.1b-41b | – | $0.80 | $0.80 | – | – | – | – |
together_ai | together-ai-41.1b-80b | – | $0.90 | $0.90 | – | – | – | – |
together_ai | together-ai-4.1b-8b | – | $0.20 | $0.20 | – | – | – | – |
together_ai | together-ai-81.1b-110b | – | $1.80 | $1.80 | – | – | – | – |
together_ai | together-ai-8.1b-21b | – | $0.30 | $0.30 | – | – | – | – |
together_ai | together-ai-up-to-4b | – | $0.10 | $0.10 | – | – | – | – |
openrouter | undi95/toppy-m-7b toppy-m-7b | 4k | $0.80 | $1.20 | – | – | – | – |
openrouter | bytedance-research/ui-tars-72b:free ui-tars-72b | 32k | $0.00 | $0.00 | – | – | – | – |
openrouter | thedrummer/unslopnemo-12b unslopnemo-12b | 32k | $0.45 | $0.45 | – | – | – | – |
openrouter | arcee-ai/virtuoso-large virtuoso-large | 131k | $0.75 | $1.20 | – | – | – | – |
openrouter | arcee-ai/virtuoso-medium-v2 virtuoso-medium-v2 | 131k | $0.50 | $0.80 | – | – | – | – |
openrouter | mancer/weaver weaver | 8k | $1.50 | $1.50 | – | – | – | – |
fireworks_ai, openrouter | ▶yi-large (2 endpoints) | 32k | $3.00 | $3.00 | – | – | – | – |
fireworks_ai | fireworks_ai/accounts/fireworks/models/yi-largeℹ️ yi-large | 32k | $3.00 | $3.00 | – | – | – | – |
openrouter | 01-ai/yi-large yi-large | 32k | $3.00 | $3.00 | – | – | – | – |
anyscale | anyscale/HuggingFaceH4/zephyr-7b-beta zephyr-7b-beta | 16k | $0.15 | $0.15 | – | – | – | – |