id: llmgateway
npm: @ai-sdk/openai-compatible
env: LLMGATEWAY_API_KEY
api: https://api.llmgateway.io/v1
Models
Auto Route
auto
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude 3 Opus
claude-3-opus
in $15.00/M
out $75.00/M
cache read $1.50/M
cache write $18.75/M
ctx: 200,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude 3.7 Sonnet
claude-3-7-sonnet
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 200,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Haiku 4.5
claude-haiku-4-5-20251001
in $1.00/M
out $5.00/M
cache read $0.10/M
cache write $1.25/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Haiku 4.5 (latest)
claude-haiku-4-5
in $1.00/M
out $5.00/M
cache read $0.10/M
cache write $1.25/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.1
claude-opus-4-1-20250805
in $15.00/M
out $75.00/M
cache read $1.50/M
cache write $18.75/M
ctx: 200,000
max out: 32,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.5
claude-opus-4-5-20251101
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.6
claude-opus-4-6
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 1,000,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.7
claude-opus-4-7
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 1,000,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.8
claude-opus-4-8
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 1,000,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 3.7
claude-3-7-sonnet-20250219
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4.5
claude-sonnet-4-5-20250929
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4.5 (latest)
claude-sonnet-4-5
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4.6
claude-sonnet-4-6
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 1,000,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Codestral
codestral-2508
in $0.30/M
out $0.90/M
ctx: 256,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Custom Model
custom
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V3.1
deepseek-v3.1
in $0.56/M
out $1.68/M
cache read $0.11/M
ctx: 128,000
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V3.2
deepseek-v3.2
in $0.28/M
out $0.42/M
cache read $0.03/M
ctx: 163,840
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V4 Flash
deepseek-v4-flash
in $0.14/M
out $0.28/M
cache read $0.00/M
ctx: 1,050,000
max out: 384,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V4 Pro
deepseek-v4-pro
in $0.43/M
out $0.87/M
cache read $0.00/M
ctx: 1,050,000
max out: 384,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Devstral 2
devstral-2512
in $0.40/M
out $2.00/M
ctx: 262,144
max out: 262,144
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
deprecated
Devstral Small
devstral-small-2507
in $0.10/M
out $0.30/M
ctx: 131,072
max out: 128,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
deprecated
Fugu Ultra
fugu-ultra
in $5.00/M
out $30.00/M
cache read $0.50/M
ctx: 1,000,000
max out: 1,000,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 2.5 Flash
gemini-2.5-flash
in $0.30/M
out $2.50/M
cache read $0.03/M
ctx: 1,048,576
max out: 65,536
in: text, image, audio, video, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 2.5 Flash Lite Preview (09-2025)
gemini-2.5-flash-lite-preview-09-2025
in $0.10/M
out $0.40/M
cache read $0.01/M
ctx: 1,048,576
max out: 1,048,576
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 2.5 Flash-Lite
gemini-2.5-flash-lite
in $0.10/M
out $0.40/M
cache read $0.01/M
ctx: 1,048,576
max out: 65,536
in: text, image, audio, video, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 2.5 Pro
gemini-2.5-pro
in $1.25/M
out $10.00/M
cache read $0.13/M
ctx: 1,048,576
max out: 65,536
in: text, image, audio, video, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 3 Flash Preview
gemini-3-flash-preview
in $0.50/M
out $3.00/M
cache read $0.05/M
ctx: 1,048,576
max out: 65,536
in: text, image, video, audio, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 3.1 Flash Lite
gemini-3.1-flash-lite
in $0.25/M
out $1.50/M
cache read $0.03/M
cache write $0.08/M
ctx: 1,048,576
max out: 65,536
in: text, image, video, audio, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 3.1 Pro Preview
gemini-3.1-pro-preview
in $2.00/M
out $12.00/M
cache read $0.20/M
ctx: 1,048,576
max out: 65,536
in: text, image, video, audio, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 3.5 Flash
gemini-3.5-flash
in $1.50/M
out $9.00/M
cache read $0.15/M
cache write $0.08/M
ctx: 1,048,576
max out: 65,536
in: text, image, video, audio, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini Pro Latest
gemini-pro-latest
in $2.00/M
out $12.00/M
cache read $0.20/M
ctx: 1,048,576
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma 4 26B A4B IT
gemma-4-26b-a4b-it
in $0.07/M
out $0.34/M
ctx: 262,144
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma 4 31B IT
gemma-4-31b-it
in $0.13/M
out $0.38/M
ctx: 262,144
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4 32B (0414-128k)
glm-4-32b-0414-128k
in $0.10/M
out $0.10/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.5
glm-4.5
in $0.60/M
out $2.20/M
cache read $0.11/M
cache write $0.00/M
ctx: 131,000
max out: 98,304
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.5 AirX
glm-4.5-airx
in $1.10/M
out $4.50/M
cache read $0.22/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.5 X
glm-4.5-x
in $2.20/M
out $8.90/M
cache read $0.45/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
beta
GLM-4.5-Air
glm-4.5-air
in $0.20/M
out $1.10/M
cache read $0.03/M
cache write $0.00/M
ctx: 131,000
max out: 98,304
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.5-Flash
glm-4.5-flash
in $0.00/M
out $0.00/M
cache read $0.00/M
cache write $0.00/M
ctx: 128,000
max out: 98,304
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.5V
glm-4.5v
in $0.60/M
out $1.80/M
cache read $0.11/M
ctx: 128,000
max out: 16,384
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.6
glm-4.6
in $0.60/M
out $2.20/M
cache read $0.11/M
cache write $0.00/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.6V
glm-4.6v
in $0.30/M
out $0.90/M
cache read $0.05/M
ctx: 131,072
max out: 32,768
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.6V Flash
glm-4.6v-flash
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
beta
GLM-4.6V FlashX
glm-4.6v-flashx
in $0.04/M
out $0.40/M
cache read $0.00/M
ctx: 128,000
max out: 16,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.7
glm-4.7
in $0.60/M
out $2.20/M
cache read $0.11/M
cache write $0.00/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.7 Flash (Free)
glm-4.7-flash-free
in $0.00/M
out $0.00/M
ctx: 200,000
max out: 200,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.7-Flash
glm-4.7-flash
in $0.06/M
out $0.40/M
cache read $0.01/M
cache write $0.00/M
ctx: 200,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.7-FlashX
glm-4.7-flashx
in $0.07/M
out $0.40/M
cache read $0.01/M
cache write $0.00/M
ctx: 200,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-5
glm-5
in $1.00/M
out $3.20/M
cache read $0.20/M
cache write $0.00/M
ctx: 203,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-5.1
glm-5.1
in $1.40/M
out $4.40/M
cache read $0.26/M
cache write $0.00/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-5.2
glm-5.2
in $1.40/M
out $4.40/M
cache read $0.26/M
cache write $0.00/M
ctx: 1,000,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT OSS 120B
gpt-oss-120b
in $0.15/M
out $0.75/M
ctx: 131,072
max out: 32,766
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT OSS 20B
gpt-oss-20b
in $0.10/M
out $0.50/M
ctx: 131,072
max out: 32,766
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-3.5-turbo
gpt-3.5-turbo
in $0.50/M
out $1.50/M
cache read $0.00/M
ctx: 16,385
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4
gpt-4
in $30.00/M
out $60.00/M
ctx: 8,192
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4 Turbo
gpt-4-turbo
in $10.00/M
out $30.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4.1
gpt-4.1
in $2.00/M
out $8.00/M
cache read $0.50/M
ctx: 1,000,000
max out: 32,768
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4.1 mini
gpt-4.1-mini
in $0.40/M
out $1.60/M
cache read $0.10/M
ctx: 1,000,000
max out: 32,768
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4.1 nano
gpt-4.1-nano
in $0.10/M
out $0.40/M
cache read $0.03/M
ctx: 1,000,000
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o
gpt-4o
in $2.50/M
out $10.00/M
cache read $1.25/M
ctx: 128,000
max out: 16,384
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o mini
gpt-4o-mini
in $0.15/M
out $0.60/M
cache read $0.07/M
ctx: 128,000
max out: 16,384
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o Mini Search Preview
gpt-4o-mini-search-preview
in $0.15/M
out $0.60/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o Search Preview
gpt-4o-search-preview
in $2.50/M
out $10.00/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5
gpt-5
in $1.25/M
out $10.00/M
cache read $0.13/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5 Chat (latest)
gpt-5-chat-latest
in $1.25/M
out $10.00/M
cache read $0.13/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5 Mini
gpt-5-mini
in $0.25/M
out $2.00/M
cache read $0.03/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5 Nano
gpt-5-nano
in $0.05/M
out $0.40/M
cache read $0.01/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5 Pro
gpt-5-pro
in $15.00/M
out $120.00/M
ctx: 400,000
max out: 272,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.1
gpt-5.1
in $1.25/M
out $10.00/M
cache read $0.13/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.1 Codex
gpt-5.1-codex
in $1.25/M
out $10.00/M
cache read $0.13/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.1 Codex mini
gpt-5.1-codex-mini
in $0.25/M
out $2.00/M
cache read $0.03/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2
gpt-5.2
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2 Chat
gpt-5.2-chat-latest
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2 Codex
gpt-5.2-codex
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 400,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2 Pro
gpt-5.2-pro
in $21.00/M
out $168.00/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.3 Chat (latest)
gpt-5.3-chat-latest
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.3 Codex
gpt-5.3-codex
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 400,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4
gpt-5.4
in $2.50/M
out $15.00/M
cache read $0.25/M
ctx: 1,050,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4 mini
gpt-5.4-mini
in $0.75/M
out $4.50/M
cache read $0.07/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4 nano
gpt-5.4-nano
in $0.20/M
out $1.25/M
cache read $0.02/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4 Pro
gpt-5.4-pro
in $30.00/M
out $180.00/M
ctx: 1,050,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.5
gpt-5.5
in $5.00/M
out $30.00/M
cache read $0.50/M
ctx: 1,050,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.5 Pro
gpt-5.5-pro
in $30.00/M
out $180.00/M
ctx: 1,050,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4
grok-4
in $3.00/M
out $15.00/M
cache read $0.75/M
ctx: 256,000
max out: 256,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.1 Fast Non-Reasoning
grok-4-1-fast-non-reasoning
in $0.20/M
out $0.50/M
cache read $0.05/M
ctx: 2,000,000
max out: 2,000,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.1 Fast Reasoning
grok-4-1-fast-reasoning
in $0.20/M
out $0.50/M
cache read $0.05/M
ctx: 2,000,000
max out: 30,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.20 (Non-Reasoning)
grok-4-20-beta-0309-non-reasoning
in $2.00/M
out $6.00/M
cache read $0.20/M
ctx: 2,000,000
max out: 30,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.20 (Non-Reasoning)
grok-4-20-non-reasoning
in $2.00/M
out $6.00/M
cache read $0.20/M
ctx: 2,000,000
max out: 30,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.20 (Reasoning)
grok-4-20-beta-0309-reasoning
in $2.00/M
out $6.00/M
cache read $0.20/M
ctx: 2,000,000
max out: 30,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.20 (Reasoning)
grok-4-20-reasoning
in $2.00/M
out $6.00/M
cache read $0.20/M
ctx: 2,000,000
max out: 30,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.3
grok-4-3
in $1.25/M
out $2.50/M
cache read $0.31/M
ctx: 1,000,000
max out: 30,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Grok Build 0.1
grok-build-0-1
in $1.00/M
out $2.00/M
cache read $0.20/M
ctx: 256,000
max out: 256,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2
kimi-k2
in $1.00/M
out $3.00/M
cache read $0.50/M
ctx: 256,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2 Thinking
kimi-k2-thinking
in $0.60/M
out $2.50/M
cache read $0.15/M
ctx: 262,144
max out: 262,144
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2 Thinking Turbo
kimi-k2-thinking-turbo
in $1.15/M
out $8.00/M
cache read $0.15/M
ctx: 262,144
max out: 262,144
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.5
kimi-k2.5
in $0.60/M
out $3.00/M
cache read $0.10/M
ctx: 262,144
max out: 262,144
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.6
kimi-k2.6
in $0.95/M
out $4.00/M
cache read $0.16/M
ctx: 262,144
max out: 262,144
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.7 Code
kimi-k2.7-code
in $0.95/M
out $4.00/M
cache read $0.19/M
ctx: 262,144
max out: 262,144
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.7 Code Highspeed
kimi-k2.7-code-highspeed
in $1.90/M
out $8.00/M
cache read $0.38/M
ctx: 262,144
max out: 262,144
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3 70B Instruct
llama-3-70b-instruct
in $0.51/M
out $0.74/M
ctx: 8,192
max out: 8,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3 8B Instruct
llama-3-8b-instruct
in $0.04/M
out $0.04/M
ctx: 8,192
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.1 70B Instruct
llama-3.1-70b-instruct
in $0.72/M
out $0.72/M
ctx: 128,000
max out: 2,048
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
beta
Llama 3.1 Nemotron Ultra 253B
llama-3.1-nemotron-ultra-253b
in $0.60/M
out $1.80/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 11B Instruct
llama-3.2-11b-instruct
in $0.07/M
out $0.33/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 3B Instruct
llama-3.2-3b-instruct
in $0.03/M
out $0.05/M
ctx: 32,768
max out: 32,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 4 Maverick 17B Instruct
llama-4-maverick-17b-instruct
in $0.24/M
out $0.97/M
ctx: 1,048,576
max out: 2,048
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 4 Scout 17B Instruct
llama-4-scout-17b-instruct
in $0.17/M
out $0.66/M
ctx: 131,072
max out: 2,048
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Llama-3.3-70B-Instruct
llama-3.3-70b-instruct
in $0.13/M
out $0.40/M
ctx: 131,072
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiMo-V2-Omni
mimo-v2-omni
in $0.40/M
out $2.00/M
cache read $0.08/M
ctx: 256,000
max out: 131,072
in: text, image, audio, video, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
MiMo-V2-Pro
mimo-v2-pro
in $1.00/M
out $3.00/M
cache read $0.20/M
ctx: 1,000,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiMo-V2.5
mimo-v2.5
in $0.14/M
out $0.28/M
cache read $0.00/M
ctx: 1,000,000
max out: 131,072
in: text, image, audio, video
out: text
reasoning
tools
vision
structured
temp
open weights
MiMo-V2.5-Pro
mimo-v2.5-pro
in $0.43/M
out $0.87/M
cache read $0.00/M
ctx: 1,000,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax M2.1 Lightning
minimax-m2.1-lightning
in $0.12/M
out $0.48/M
ctx: 196,608
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax Text 01
minimax-text-01
in $0.20/M
out $1.10/M
ctx: 1,000,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2
minimax-m2
in $0.20/M
out $1.00/M
cache read $0.03/M
ctx: 196,608
max out: 128,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.1
minimax-m2.1
in $0.27/M
out $1.10/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.5
minimax-m2.5
in $0.30/M
out $1.20/M
cache read $0.03/M
cache write $0.38/M
ctx: 228,700
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.5-highspeed
minimax-m2.5-highspeed
in $0.60/M
out $2.40/M
cache read $0.03/M
cache write $0.38/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.7
minimax-m2.7
in $0.30/M
out $1.20/M
cache read $0.06/M
cache write $0.38/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.7-highspeed
minimax-m2.7-highspeed
in $0.60/M
out $2.40/M
cache read $0.06/M
cache write $0.38/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M3
minimax-m3
in $0.60/M
out $2.40/M
cache read $0.12/M
ctx: 512,000
max out: 128,000
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Ministral 14B
ministral-14b-2512
in $0.20/M
out $0.20/M
ctx: 262,144
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Ministral 3B
ministral-3b-2512
in $0.10/M
out $0.10/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Ministral 8B
ministral-8b-2512
in $0.15/M
out $0.15/M
ctx: 262,144
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Large (latest)
mistral-large-latest
in $4.00/M
out $12.00/M
ctx: 128,000
max out: 262,144
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Large 3
mistral-large-2512
in $0.50/M
out $1.50/M
ctx: 262,144
max out: 262,144
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Small 3.2
mistral-small-2506
in $0.10/M
out $0.30/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Nemotron 3 Ultra 550B A55B
nemotron-3-ultra-550b
in $0.50/M
out $2.50/M
cache read $0.15/M
ctx: 262,144
max out: 128,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
o1
o1
in $15.00/M
out $60.00/M
cache read $7.50/M
ctx: 200,000
max out: 100,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
o3
o3
in $2.00/M
out $8.00/M
cache read $0.50/M
ctx: 200,000
max out: 100,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
o3-mini
o3-mini
in $1.10/M
out $4.40/M
cache read $0.55/M
ctx: 200,000
max out: 100,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
o4-mini
o4-mini
in $1.10/M
out $4.40/M
cache read $0.28/M
ctx: 200,000
max out: 100,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Pixtral Large (latest)
pixtral-large-latest
in $4.00/M
out $12.00/M
ctx: 128,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Coder Plus
qwen-coder-plus
in $0.50/M
out $1.00/M
ctx: 131,072
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Flash
qwen-flash
in $0.05/M
out $0.40/M
cache read $0.01/M
cache write $0.06/M
ctx: 1,000,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Max
qwen-max
in $1.60/M
out $6.40/M
ctx: 32,768
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Max Latest
qwen-max-latest
in $1.60/M
out $6.40/M
ctx: 32,768
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Plus
qwen-plus
in $0.40/M
out $1.20/M
reason $4.00/M
cache read $0.08/M
cache write $0.50/M
ctx: 131,072
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Plus Latest
qwen-plus-latest
in $0.40/M
out $1.20/M
cache read $0.08/M
cache write $0.50/M
ctx: 1,000,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Turbo
qwen-turbo
in $0.05/M
out $0.20/M
reason $0.50/M
ctx: 1,000,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen-Omni Turbo
qwen-omni-turbo
in $0.20/M
out $0.80/M
ctx: 32,768
max out: 2,048
in: text, image, audio, video
out: text, audio
reasoning
tools
vision
structured
temp
open weights
Qwen-VL Max
qwen-vl-max
in $0.80/M
out $3.20/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen-VL Plus
qwen-vl-plus
in $0.21/M
out $0.64/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen2.5 VL 32B Instruct
qwen2-5-vl-32b-instruct
in $1.40/M
out $4.20/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen2.5-VL 72B Instruct
qwen2-5-vl-72b-instruct
in $0.13/M
out $0.40/M
ctx: 32,768
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 235B A22B FP8
qwen3-235b-a22b-fp8
in $0.20/M
out $0.80/M
ctx: 40,960
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 235B A22B Instruct (2507)
qwen3-235b-a22b-instruct-2507
in $0.20/M
out $0.60/M
ctx: 262,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 235B A22B Thinking (2507)
qwen3-235b-a22b-thinking-2507
in $0.20/M
out $0.60/M
ctx: 262,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 30B A3B Instruct (2507)
qwen3-30b-a3b-instruct-2507
in $0.10/M
out $0.30/M
ctx: 262,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 32B
qwen3-32b
in $0.10/M
out $0.30/M
reason $8.40/M
ctx: 32,768
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 4B FP8
qwen3-4b-fp8
in $0.03/M
out $0.03/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Coder Flash
qwen3-coder-flash
in $0.30/M
out $1.50/M
cache read $0.06/M
cache write $0.38/M
ctx: 1,000,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Coder Next
qwen3-coder-next
in $0.11/M
out $0.68/M
cache read $0.06/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Coder Plus
qwen3-coder-plus
in $6.00/M
out $60.00/M
cache read $1.20/M
cache write $7.50/M
ctx: 1,000,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Max
qwen3-max
in $3.00/M
out $15.00/M
cache read $0.60/M
cache write $3.75/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Max (2026-01-23)
qwen3-max-2026-01-23
in $1.20/M
out $6.00/M
cache read $0.24/M
cache write $1.50/M
ctx: 262,144
max out: 32,800
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 VL 235B A22B Instruct
qwen3-vl-235b-a22b-instruct
in $0.50/M
out $2.00/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 VL 235B A22B Thinking
qwen3-vl-235b-a22b-thinking
in $0.50/M
out $2.00/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 VL 30B A3B Instruct
qwen3-vl-30b-a3b-instruct
in $0.20/M
out $0.70/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 VL 30B A3B Thinking
qwen3-vl-30b-a3b-thinking
in $0.20/M
out $1.00/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 VL 8B Instruct
qwen3-vl-8b-instruct
in $0.08/M
out $0.50/M
ctx: 131,072
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 VL Flash
qwen3-vl-flash
in $0.05/M
out $0.40/M
cache read $0.01/M
ctx: 262,144
max out: 32,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3-Coder 30B-A3B Instruct
qwen3-coder-30b-a3b-instruct
in $0.10/M
out $0.30/M
ctx: 262,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3-Coder 480B-A35B Instruct
qwen3-coder-480b-a35b-instruct
in $0.40/M
out $1.80/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3-Next 80B-A3B (Thinking)
qwen3-next-80b-a3b-thinking
in $0.50/M
out $6.00/M
ctx: 131,072
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3-Next 80B-A3B Instruct
qwen3-next-80b-a3b-instruct
in $0.50/M
out $2.00/M
ctx: 131,072
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3-VL Plus
qwen3-vl-plus
in $0.20/M
out $1.60/M
reason $4.80/M
cache read $0.04/M
cache write $0.25/M
ctx: 262,144
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.5 397B-A17B
qwen35-397b-a17b
in $0.60/M
out $3.60/M
ctx: 262,144
max out: 65,536
in: text, image, video, audio
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.5 9B
qwen3.5-9b
in $0.10/M
out $0.15/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.6 35B-A3B
qwen3.6-35b-a3b
in $0.25/M
out $1.49/M
ctx: 262,144
max out: 65,536
in: text, image, video, audio
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.6 Max Preview
qwen3.6-max-preview
in $1.30/M
out $7.80/M
cache read $0.13/M
cache write $1.63/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.6 Plus
qwen3.6-plus
in $0.50/M
out $3.00/M
cache read $0.05/M
cache write $0.63/M
ctx: 262,144
max out: 65,536
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.7 Max
qwen3.7-max
in $2.50/M
out $7.50/M
cache read $0.50/M
cache write $3.13/M
ctx: 1,000,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.7 Plus
qwen3.7-plus
in $0.40/M
out $1.60/M
cache read $0.08/M
cache write $0.50/M
ctx: 1,000,000
max out: 64,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
QwQ Plus
qwq-plus
in $0.80/M
out $2.40/M
ctx: 131,072
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Seed 1.6 (250615)
seed-1-6-250615
in $0.25/M
out $2.00/M
cache read $0.05/M
ctx: 256,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Seed 1.6 (250915)
seed-1-6-250915
in $0.25/M
out $2.00/M
cache read $0.05/M
ctx: 256,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Seed 1.6 Flash (250715)
seed-1-6-flash-250715
in $0.07/M
out $0.30/M
cache read $0.01/M
ctx: 256,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Seed 1.8 (251228)
seed-1-8-251228
in $0.25/M
out $2.00/M
cache read $0.05/M
ctx: 256,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Sonar
sonar
in $1.00/M
out $1.00/M
ctx: 130,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Sonar Pro
sonar-pro
in $3.00/M
out $15.00/M
ctx: 200,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Sonar Reasoning Pro
sonar-reasoning-pro
in $2.00/M
out $8.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights