id: chutes
npm: @ai-sdk/openai-compatible
env: CHUTES_API_KEY
api: https://llm.chutes.ai/v1
Models
DeepHermes 3 Mistral 24B Preview
NousResearch/DeepHermes-3-Mistral-24B-Preview
in $0.02/M
out $0.10/M
cache read $0.01/M
ctx: 32,768
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek R1 0528 TEE
deepseek-ai/DeepSeek-R1-0528-TEE
in $0.45/M
out $2.15/M
cache read $0.23/M
ctx: 163,840
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek R1 Distill Llama 70B
deepseek-ai/DeepSeek-R1-Distill-Llama-70B
in $0.03/M
out $0.11/M
cache read $0.01/M
ctx: 131,072
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek TNG R1T2 Chimera TEE
tngtech/DeepSeek-TNG-R1T2-Chimera-TEE
in $0.30/M
out $1.10/M
cache read $0.15/M
ctx: 163,840
max out: 163,840
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V3 0324 TEE
deepseek-ai/DeepSeek-V3-0324-TEE
in $0.25/M
out $1.00/M
cache read $0.13/M
ctx: 163,840
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V3.1 TEE
deepseek-ai/DeepSeek-V3.1-TEE
in $0.27/M
out $1.00/M
cache read $0.14/M
ctx: 163,840
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V3.2 TEE
deepseek-ai/DeepSeek-V3.2-TEE
in $0.28/M
out $0.42/M
cache read $0.14/M
ctx: 131,072
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
dots.ocr
rednote-hilab/dots.ocr
in $0.01/M
out $0.01/M
cache read $0.01/M
ctx: 131,072
max out: 131,072
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
gemma 3 12b it
unsloth/gemma-3-12b-it
in $0.03/M
out $0.10/M
cache read $0.01/M
ctx: 131,072
max out: 131,072
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
gemma 3 27b it
unsloth/gemma-3-27b-it
in $0.03/M
out $0.11/M
cache read $0.01/M
ctx: 128,000
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
gemma 3 4b it
unsloth/gemma-3-4b-it
in $0.01/M
out $0.03/M
cache read $0.01/M
ctx: 96,000
max out: 96,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
gemma 4 31B turbo TEE
google/gemma-4-31B-turbo-TEE
in $0.13/M
out $0.38/M
cache read $0.07/M
ctx: 131,072
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.6V
zai-org/GLM-4.6V
in $0.30/M
out $0.90/M
cache read $0.15/M
ctx: 131,072
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.7 FP8
zai-org/GLM-4.7-FP8
in $0.30/M
out $1.20/M
cache read $0.15/M
ctx: 202,752
max out: 65,535
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.7 TEE
zai-org/GLM-4.7-TEE
in $0.39/M
out $1.75/M
cache read $0.20/M
ctx: 202,752
max out: 65,535
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5 TEE
zai-org/GLM-5-TEE
in $0.95/M
out $2.55/M
cache read $0.47/M
ctx: 202,752
max out: 65,535
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5 Turbo
zai-org/GLM-5-Turbo
in $0.49/M
out $1.96/M
cache read $0.24/M
ctx: 202,752
max out: 65,535
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5.1 TEE
zai-org/GLM-5.1-TEE
in $1.05/M
out $3.50/M
cache read $0.53/M
ctx: 202,752
max out: 65,535
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
gpt oss 120b TEE
openai/gpt-oss-120b-TEE
in $0.09/M
out $0.36/M
cache read $0.04/M
ctx: 131,072
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Hermes 4 14B
NousResearch/Hermes-4-14B
in $0.01/M
out $0.05/M
cache read $0.01/M
ctx: 40,960
max out: 40,960
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.5 TEE
moonshotai/Kimi-K2.5-TEE
in $0.44/M
out $2.00/M
cache read $0.22/M
ctx: 262,144
max out: 65,535
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.6 TEE
moonshotai/Kimi-K2.6-TEE
in $0.95/M
out $4.00/M
cache read $0.47/M
ctx: 262,144
max out: 65,535
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 1B Instruct
unsloth/Llama-3.2-1B-Instruct
in $0.01/M
out $0.01/M
cache read $0.01/M
ctx: 16,384
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 3B Instruct
unsloth/Llama-3.2-3B-Instruct
in $0.01/M
out $0.01/M
cache read $0.01/M
ctx: 16,384
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiMo V2 Flash TEE
XiaomiMiMo/MiMo-V2-Flash-TEE
in $0.09/M
out $0.29/M
cache read $0.04/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax M2.5 TEE
MiniMaxAI/MiniMax-M2.5-TEE
in $0.15/M
out $1.20/M
cache read $0.07/M
ctx: 196,608
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Nemo Instruct 2407
unsloth/Mistral-Nemo-Instruct-2407
in $0.02/M
out $0.04/M
cache read $0.01/M
ctx: 131,072
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen2.5 72B Instruct
Qwen/Qwen2.5-72B-Instruct
in $0.30/M
out $1.20/M
cache read $0.15/M
ctx: 32,768
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen2.5 Coder 32B Instruct
Qwen/Qwen2.5-Coder-32B-Instruct
in $0.03/M
out $0.11/M
cache read $0.01/M
ctx: 32,768
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen2.5 VL 32B Instruct
Qwen/Qwen2.5-VL-32B-Instruct
in $0.05/M
out $0.22/M
cache read $0.03/M
ctx: 16,384
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 235B A22B Instruct 2507 TEE
Qwen/Qwen3-235B-A22B-Instruct-2507-TEE
in $0.10/M
out $0.60/M
cache read $0.05/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 235B A22B Thinking 2507
Qwen/Qwen3-235B-A22B-Thinking-2507
in $0.11/M
out $0.60/M
cache read $0.06/M
ctx: 262,144
max out: 262,144
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 30B A3B
Qwen/Qwen3-30B-A3B
in $0.06/M
out $0.22/M
cache read $0.03/M
ctx: 40,960
max out: 40,960
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 32B TEE
Qwen/Qwen3-32B-TEE
in $0.08/M
out $0.24/M
cache read $0.04/M
ctx: 40,960
max out: 40,960
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Coder Next TEE
Qwen/Qwen3-Coder-Next-TEE
in $0.12/M
out $0.75/M
cache read $0.06/M
ctx: 262,144
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Next 80B A3B Instruct
Qwen/Qwen3-Next-80B-A3B-Instruct
in $0.10/M
out $0.80/M
cache read $0.05/M
ctx: 262,144
max out: 262,144
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.5 397B A17B TEE
Qwen/Qwen3.5-397B-A17B-TEE
in $0.39/M
out $2.34/M
cache read $0.20/M
ctx: 262,144
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.6 27B TEE
Qwen/Qwen3.6-27B-TEE
in $0.20/M
out $1.56/M
cache read $0.10/M
ctx: 262,144
max out: 65,536
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3Guard Gen 0.6B
Qwen/Qwen3Guard-Gen-0.6B
in $0.01/M
out $0.01/M
cache read $0.01/M
ctx: 32,768
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights