id: baseten
npm: @ai-sdk/openai-compatible
env: BASETEN_API_KEY
api: https://inference.baseten.co/v1
Models
DeepSeek V3.1
deepseek-ai/DeepSeek-V3.1
in $0.50/M
out $1.50/M
ctx: 164,000
max out: 131,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
deprecated
DeepSeek V4 Pro
deepseek-ai/DeepSeek-V4-Pro
in $1.74/M
out $3.48/M
cache read $0.14/M
ctx: 131,000
max out: 131,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 4.7
zai-org/GLM-4.7
in $0.60/M
out $2.20/M
cache read $0.12/M
ctx: 200,000
max out: 200,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5
zai-org/GLM-5
in $0.95/M
out $3.15/M
cache read $0.20/M
ctx: 202,800
max out: 202,800
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5.1
zai-org/GLM-5.1
in $1.30/M
out $4.30/M
cache read $0.26/M
ctx: 202,800
max out: 202,800
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM 5.2
zai-org/GLM-5.2
in $1.40/M
out $4.40/M
cache read $0.30/M
ctx: 202,720
max out: 202,720
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.5
moonshotai/Kimi-K2.5
in $0.60/M
out $3.00/M
cache read $0.12/M
ctx: 262,000
max out: 262,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.6
moonshotai/Kimi-K2.6
in $0.95/M
out $4.00/M
cache read $0.16/M
ctx: 262,000
max out: 262,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.7 Code
moonshotai/Kimi-K2.7-Code
in $0.95/M
out $4.00/M
cache read $0.16/M
ctx: 262,000
max out: 262,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.5
MiniMaxAI/MiniMax-M2.5
in $0.30/M
out $1.20/M
ctx: 204,000
max out: 204,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
deprecated
Nemotron Super
nvidia/Nemotron-120B-A12B
in $0.30/M
out $0.75/M
cache read $0.06/M
ctx: 202,800
max out: 202,800
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Nemotron Ultra
nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B
in $0.60/M
out $2.40/M
cache read $0.12/M
ctx: 202,800
max out: 202,800
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
OpenAI GPT 120B
openai/gpt-oss-120b
in $0.10/M
out $0.50/M
ctx: 128,072
max out: 128,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights