Models
Aion 2.0
aion-labs-aion-2-0
in $1.00/M
out $2.00/M
cache read $0.25/M
ctx: 128,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Fable 5
claude-fable-5
in $12.00/M
out $60.00/M
cache read $1.20/M
cache write $15.00/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.5
claude-opus-4-5
in $6.00/M
out $30.00/M
cache read $0.60/M
cache write $7.50/M
ctx: 198,000
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.6
claude-opus-4-6
in $6.00/M
out $30.00/M
cache read $0.60/M
cache write $7.50/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.6 Fast
claude-opus-4-6-fast
in $36.00/M
out $180.00/M
cache read $3.60/M
cache write $45.00/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.7
claude-opus-4-7
in $6.00/M
out $30.00/M
cache read $0.60/M
cache write $7.50/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.7 Fast
claude-opus-4-7-fast
in $36.00/M
out $180.00/M
cache read $3.60/M
cache write $45.00/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.8
claude-opus-4-8
in $6.00/M
out $30.00/M
cache read $0.60/M
cache write $7.50/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.8 Fast
claude-opus-4-8-fast
in $12.00/M
out $60.00/M
cache read $1.20/M
cache write $15.00/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4.5
claude-sonnet-4-5
in $3.75/M
out $18.75/M
cache read $0.38/M
cache write $4.69/M
ctx: 198,000
max out: 64,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4.6
claude-sonnet-4-6
in $3.60/M
out $18.00/M
cache read $0.36/M
cache write $4.50/M
ctx: 1,000,000
max out: 64,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V3.2
deepseek-v3.2
in $0.33/M
out $0.48/M
cache read $0.16/M
ctx: 160,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V4 Flash
deepseek-v4-flash
in $0.17/M
out $0.35/M
cache read $0.03/M
ctx: 1,000,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V4 Pro
deepseek-v4-pro
in $1.73/M
out $3.80/M
cache read $0.33/M
ctx: 1,000,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 3 Flash Preview
gemini-3-flash-preview
in $0.70/M
out $3.75/M
cache read $0.07/M
ctx: 256,000
max out: 65,536
in: text, image, video, audio, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 3.1 Pro Preview
gemini-3-1-pro-preview
in $2.50/M
out $15.00/M
cache read $0.50/M
cache write $0.50/M
ctx: 1,000,000
max out: 32,768
in: text, image, audio, video
out: text
reasoning
tools
vision
structured
temp
open weights
Gemini 3.5 Flash
gemini-3-5-flash
in $1.55/M
out $9.45/M
cache read $0.15/M
cache write $0.09/M
ctx: 1,000,000
max out: 65,536
in: text, image, audio, video
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma 4 Uncensored
gemma-4-uncensored
in $0.16/M
out $0.50/M
ctx: 256,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.6
zai-org-glm-4.6
in $0.43/M
out $1.75/M
cache read $0.08/M
ctx: 198,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.7
zai-org-glm-4.7
in $0.55/M
out $2.65/M
cache read $0.11/M
ctx: 198,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.7 Flash
zai-org-glm-4.7-flash
in $0.13/M
out $0.50/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.7 Flash Heretic
olafangensan-glm-4.7-flash-heretic
in $0.14/M
out $0.80/M
ctx: 200,000
max out: 24,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5
zai-org-glm-5
in $1.00/M
out $3.20/M
cache read $0.20/M
ctx: 198,000
max out: 32,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5 Turbo
z-ai-glm-5-turbo
in $1.20/M
out $4.00/M
cache read $0.24/M
ctx: 200,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5.1
zai-org-glm-5-1
in $1.75/M
out $5.50/M
cache read $0.33/M
ctx: 200,000
max out: 24,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5.2
zai-org-glm-5-2
in $1.40/M
out $4.40/M
cache read $0.26/M
ctx: 1,000,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5V Turbo
z-ai-glm-5v-turbo
in $1.50/M
out $5.00/M
cache read $0.30/M
ctx: 200,000
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Google Gemma 3 27B Instruct
google-gemma-3-27b-it
in $0.12/M
out $0.20/M
ctx: 198,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Google Gemma 4 26B A4B Instruct
google-gemma-4-26b-a4b-it
in $0.16/M
out $0.50/M
ctx: 256,000
max out: 8,192
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Google Gemma 4 31B Instruct
google-gemma-4-31b-it
in $0.12/M
out $0.36/M
cache read $0.09/M
ctx: 256,000
max out: 8,192
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o
openai-gpt-4o-2024-11-20
in $3.13/M
out $12.50/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o Mini
openai-gpt-4o-mini-2024-07-18
in $0.19/M
out $0.75/M
cache read $0.09/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2
openai-gpt-52
in $2.19/M
out $17.50/M
cache read $0.22/M
ctx: 256,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2 Codex
openai-gpt-52-codex
in $2.19/M
out $17.50/M
cache read $0.22/M
ctx: 256,000
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.3 Codex
openai-gpt-53-codex
in $2.19/M
out $17.50/M
cache read $0.22/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4
openai-gpt-54
in $3.13/M
out $18.80/M
cache read $0.31/M
ctx: 1,000,000
max out: 131,072
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4 Mini
openai-gpt-54-mini
in $0.94/M
out $5.63/M
cache read $0.09/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4 Pro
openai-gpt-54-pro
in $37.50/M
out $225.00/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.5
openai-gpt-55
in $6.25/M
out $37.50/M
cache read $0.63/M
ctx: 1,000,000
max out: 131,072
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.5 Pro
openai-gpt-55-pro
in $37.50/M
out $225.00/M
ctx: 1,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.20
grok-4-20
in $1.42/M
out $2.83/M
cache read $0.23/M
ctx: 2,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.20 Multi-Agent
grok-4-20-multi-agent
in $1.42/M
out $2.83/M
cache read $0.23/M
ctx: 2,000,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Grok 4.3
grok-4-3
in $1.42/M
out $2.83/M
cache read $0.23/M
ctx: 1,000,000
max out: 32,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Grok Build 0.1
grok-build-0-1
in $1.00/M
out $2.00/M
cache read $0.20/M
ctx: 256,000
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Hermes 3 Llama 3.1 405b
hermes-3-llama-3.1-405b
in $1.10/M
out $3.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.5
kimi-k2-5
in $0.56/M
out $3.50/M
cache read $0.22/M
ctx: 256,000
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.6
kimi-k2-6
in $0.85/M
out $4.66/M
cache read $0.22/M
ctx: 256,000
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.7 Code
kimi-k2-7-code
in $0.90/M
out $4.30/M
cache read $0.20/M
ctx: 256,000
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 3B
llama-3.2-3b
in $0.15/M
out $0.60/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.3 70B
llama-3.3-70b
in $0.70/M
out $2.80/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mercury 2
mercury-2
in $0.31/M
out $0.94/M
cache read $0.03/M
ctx: 128,000
max out: 50,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiMo-V2.5
xiaomi-mimo-v2-5
in $0.17/M
out $0.35/M
cache read $0.06/M
ctx: 1,000,000
max out: 65,536
in: text, image, audio, video
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax M2.5
minimax-m25
in $0.34/M
out $1.19/M
cache read $0.04/M
ctx: 198,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax M2.7
minimax-m27
in $0.38/M
out $1.50/M
cache read $0.07/M
ctx: 198,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax M3 Preview
minimax-m3-preview
in $0.30/M
out $1.20/M
cache read $0.06/M
ctx: 524,288
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Small 3.2 24B Instruct
mistral-small-3-2-24b-instruct
in $0.09/M
out $0.25/M
ctx: 256,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Small 4
mistral-small-2603
in $0.19/M
out $0.75/M
ctx: 256,000
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Nemotron Cascade 2 30B A3B
nvidia-nemotron-cascade-2-30b-a3b
in $0.14/M
out $0.80/M
ctx: 256,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
NVIDIA Nemotron 3 Nano 30B
nvidia-nemotron-3-nano-30b-a3b
in $0.07/M
out $0.30/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
NVIDIA Nemotron 3 Ultra
nvidia-nemotron-3-ultra-550b-a55b
in $0.63/M
out $3.13/M
cache read $0.19/M
ctx: 256,000
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
OpenAI GPT OSS 120B
openai-gpt-oss-120b
in $0.07/M
out $0.30/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3 235B A22B Instruct 2507
qwen3-235b-a22b-instruct-2507
in $0.15/M
out $0.75/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3 235B A22B Thinking 2507
qwen3-235b-a22b-thinking-2507
in $0.45/M
out $3.50/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3 Coder 480B Turbo
qwen3-coder-480b-a35b-instruct-turbo
in $0.35/M
out $1.50/M
cache read $0.04/M
ctx: 256,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3 Next 80b
qwen3-next-80b
in $0.35/M
out $1.90/M
ctx: 256,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3.5 35B A3B
qwen3-5-35b-a3b
in $0.31/M
out $1.25/M
cache read $0.16/M
ctx: 256,000
max out: 16,384
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3.5 397B
qwen3-5-397b-a17b
in $0.75/M
out $4.50/M
ctx: 128,000
max out: 32,768
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3.5 9B
qwen3-5-9b
in $0.10/M
out $0.15/M
ctx: 256,000
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3.6 27B
qwen3-6-27b
in $0.33/M
out $3.25/M
ctx: 256,000
max out: 65,536
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3.6 Plus Uncensored
qwen-3-6-plus
in $0.63/M
out $3.75/M
cache read $0.06/M
cache write $0.78/M
ctx: 1,000,000
max out: 65,536
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3.7 Max
qwen-3-7-max
in $2.70/M
out $8.05/M
cache read $0.27/M
cache write $3.35/M
ctx: 1,000,000
max out: 65,536
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 3.7 Plus
qwen-3-7-plus
in $0.50/M
out $2.00/M
cache read $0.05/M
cache write $0.63/M
ctx: 1,000,000
max out: 65,536
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 VL 235B
qwen3-vl-235b-a22b
in $0.25/M
out $1.50/M
ctx: 256,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Trinity Large Thinking
arcee-trinity-large-thinking
in $0.31/M
out $1.13/M
cache read $0.07/M
ctx: 256,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Venice Role Play Uncensored
venice-uncensored-role-play
in $0.50/M
out $2.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Venice Uncensored 1.2
venice-uncensored-1-2
in $0.20/M
out $0.90/M
ctx: 128,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights