id: vultr
npm: @ai-sdk/openai-compatible
env: VULTR_API_KEY
api: https://api.vultrinference.com/v1
Models
DeepSeek V3.2
nvidia/DeepSeek-V3.2-NVFP4
in $0.55/M
out $1.65/M
ctx: 131,072
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-5.1
zai-org/GLM-5.1-FP8
in $0.85/M
out $3.10/M
ctx: 200,000
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.6
moonshotai/Kimi-K2.6
in $0.15/M
out $0.60/M
ctx: 262,144
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.1 Nemotron Safety Guard
nvidia/Llama-3.1-Nemotron-Safety-Guard-8B-v3
in $0.01/M
out $0.01/M
ctx: 8,192
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.7
MiniMaxAI/MiniMax-M2.7
in $0.30/M
out $1.20/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
NVIDIA Nemotron 3 Nano Omni
nvidia/Nemotron-3-Nano-Omni-30B-A3B-Reasoning-BF16
in $0.13/M
out $0.38/M
ctx: 262,144
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
NVIDIA Nemotron Cascade 2
nvidia/Nemotron-Cascade-2-30B-A3B
in $0.15/M
out $0.60/M
ctx: 262,144
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights