id: nvidia
npm: @ai-sdk/openai-compatible
env: NVIDIA_API_KEY
api: https://integrate.api.nvidia.com/v1
Models
Active Speaker Detection
nvidia/active-speaker-detection
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: video
out: text
reasoning
tools
vision
structured
temp
open weights
bevformer
nvidia/bevformer
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: video
out: text
reasoning
tools
vision
structured
temp
open weights
BGE M3
baai/bge-m3
in $0.00/M
out $0.00/M
ctx: 8,192
max out: 1,024
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
ByteDance-Seed/Seed-OSS-36B-Instruct
bytedance/seed-oss-36b-instruct
in $0.00/M
out $0.00/M
ctx: 262,000
max out: 262,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
cosmos-predict1-5b
nvidia/cosmos-predict1-5b
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: text, image, video
out: video
reasoning
tools
vision
structured
temp
open weights
cosmos-transfer1-7b
nvidia/cosmos-transfer1-7b
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: text, image, video
out: video
reasoning
tools
vision
structured
temp
open weights
cosmos-transfer2.5-2b
nvidia/cosmos-transfer2_5-2b
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: text, image, video
out: video
reasoning
tools
vision
structured
temp
open weights
DeepSeek V4 Flash
deepseek-ai/deepseek-v4-flash
in $0.14/M
out $0.28/M
cache read $0.00/M
ctx: 1,048,576
max out: 393,216
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek V4 Pro
deepseek-ai/deepseek-v4-pro
in $0.43/M
out $0.87/M
cache read $0.00/M
ctx: 1,048,576
max out: 393,216
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
dracarys-llama-3.1-70b-instruct
abacusai/dracarys-llama-3_1-70b-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
esm2-650m
meta/esm2-650m
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
esmfold
meta/esmfold
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
FLUX.1-dev
black-forest-labs/flux.1-dev
in $0.00/M
out $0.00/M
ctx: 4,096
max out: 0
in: text
out: image
reasoning
tools
vision
structured
temp
open weights
FLUX.1-Kontext-dev
black-forest-labs/flux_1-kontext-dev
in $0.00/M
out $0.00/M
ctx: 40,960
max out: 40,960
in: text, image
out: image
reasoning
tools
vision
structured
temp
open weights
FLUX.1-schnell
black-forest-labs/flux_1-schnell
in $0.00/M
out $0.00/M
ctx: 77
max out: 0
in: text
out: image
reasoning
tools
vision
structured
temp
open weights
FLUX.2 Klein 4B
black-forest-labs/flux_2-klein-4b
in $0.00/M
out $0.00/M
ctx: 40,960
max out: 40,960
in: image, text
out: image
reasoning
tools
vision
structured
temp
open weights
Gemma 2 2b It
google/gemma-2-2b-it
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma 3n E2b It
google/gemma-3n-e2b-it
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma 3n E4b It
google/gemma-3n-e4b-it
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma-4-31B-IT
google/gemma-4-31b-it
in $0.00/M
out $0.00/M
ctx: 256,000
max out: 16,384
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
gliner-pii
nvidia/gliner-pii
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-5.1
z-ai/glm-5.1
in $0.00/M
out $0.00/M
ctx: 131,072
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT OSS 20B
openai/gpt-oss-20b
in $0.00/M
out $0.00/M
ctx: 131,072
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-OSS-120B
openai/gpt-oss-120b
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2 0905
moonshotai/kimi-k2-instruct-0905
in $0.00/M
out $0.00/M
ctx: 262,144
max out: 262,144
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.6
moonshotai/kimi-k2.6
in $0.00/M
out $0.00/M
ctx: 262,144
max out: 262,144
in: text, image, video
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.1 70b Instruct
meta/llama-3.1-70b-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.1 8B Instruct
meta/llama-3.1-8b-instruct
in $0.00/M
out $0.00/M
ctx: 16,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 11b Vision Instruct
meta/llama-3.2-11b-vision-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 1b Instruct
meta/llama-3.2-1b-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 3B Instruct
meta/llama-3.2-3b-instruct
in $0.00/M
out $0.00/M
ctx: 32,768
max out: 32,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.3 70b Instruct
meta/llama-3.3-70b-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 4 Maverick 17b 128e Instruct
meta/llama-4-maverick-17b-128e-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Llama Guard 4 12B
meta/llama-guard-4-12b
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
llama-3_2-nemoretriever-300m-embed-v1
nvidia/llama-3_2-nemoretriever-300m-embed-v1
in $0.00/M
out $0.00/M
ctx: 32,768
max out: 2,048
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
llama-3.1-nemotron-safety-guard-8b-v3
nvidia/llama-3_1-nemotron-safety-guard-8b-v3
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama-3.2-90B-Vision-Instruct
meta/llama-3.2-90b-vision-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
llama-nemotron-embed-vl-1b-v2
nvidia/llama-nemotron-embed-vl-1b-v2
in $0.00/M
out $0.00/M
ctx: 32,768
max out: 2,048
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
llama-nemotron-rerank-vl-1b-v2
nvidia/llama-nemotron-rerank-vl-1b-v2
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Magistral Small 2506
mistralai/magistral-small-2506
in $0.00/M
out $0.00/M
ctx: 32,768
max out: 32,768
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
magpie-tts-zeroshot
nvidia/magpie-tts-zeroshot
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: text, audio
out: audio
reasoning
tools
vision
structured
temp
open weights
MiniMax-M2.7
minimaxai/minimax-m2.7
in $0.00/M
out $0.00/M
ctx: 204,800
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Large 3 675B Instruct 2512
mistralai/mistral-large-3-675b-instruct-2512
in $0.00/M
out $0.00/M
ctx: 262,144
max out: 262,144
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Medium 3
mistralai/mistral-medium-3-instruct
in $0.00/M
out $0.00/M
ctx: 131,072
max out: 32,768
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral-7B-Instruct-v0.3
mistralai/mistral-7b-instruct-v03
in $0.00/M
out $0.00/M
ctx: 65,536
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
mistral-nemotron
mistralai/mistral-nemotron
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
mistral-small-4-119b-2603
mistralai/mistral-small-4-119b-2603
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral: Mixtral 8x22B Instruct
mistralai/mixtral-8x22b-instruct
in $0.00/M
out $0.00/M
ctx: 65,536
max out: 13,108
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral: Mixtral 8x7B Instruct
mistralai/mixtral-8x7b-instruct
in $0.00/M
out $0.00/M
ctx: 32,768
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Nemotron 3 Nano Omni
nvidia/nemotron-3-nano-omni-30b-a3b-reasoning
in $0.00/M
out $0.00/M
ctx: 256,000
max out: 65,536
in: text, image, video, audio
out: text
reasoning
tools
vision
structured
temp
open weights
Nemotron 3 Super
nvidia/nemotron-3-super-120b-a12b
in $0.20/M
out $0.80/M
ctx: 262,144
max out: 262,144
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Nemotron 3 Ultra 550B A55B
nvidia/nemotron-3-ultra-550b-a55b
in $0.50/M
out $2.50/M
cache read $0.15/M
ctx: 1,000,000
max out: 65,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
nemotron-3-content-safety
nvidia/nemotron-3-content-safety
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
nemotron-3-nano-30b-a3b
nvidia/nemotron-3-nano-30b-a3b
in $0.00/M
out $0.00/M
ctx: 131,072
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
nemotron-content-safety-reasoning-4b
nvidia/nemotron-content-safety-reasoning-4b
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
nemotron-mini-4b-instruct
nvidia/nemotron-mini-4b-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
nemotron-voicechat
nvidia/nemotron-voicechat
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text, audio
out: text
reasoning
tools
vision
structured
temp
open weights
nv-embed-v1
nvidia/nv-embed-v1
in $0.00/M
out $0.00/M
ctx: 32,768
max out: 2,048
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
nv-embedcode-7b-v1
nvidia/nv-embedcode-7b-v1
in $0.00/M
out $0.00/M
ctx: 32,768
max out: 2,048
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
nvidia-nemotron-nano-9b-v2
nvidia/nvidia-nemotron-nano-9b-v2
in $0.00/M
out $0.00/M
ctx: 131,072
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
paligemma
google/google-paligemma
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Phi 4 Multimodal
microsoft/phi-4-multimodal-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Phi-4-Mini
microsoft/phi-4-mini-instruct
in $0.00/M
out $0.00/M
ctx: 131,072
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen Image
qwen/qwen-image
in $0.00/M
out $0.00/M
ctx: 0
max out: 0
in: text, image
out: image
reasoning
tools
vision
structured
temp
open weights
Qwen Image Edit
qwen/qwen-image-edit
in $0.00/M
out $0.00/M
ctx: 0
max out: 0
in: text, image
out: image
reasoning
tools
vision
structured
temp
open weights
Qwen2.5 Coder 32b Instruct
qwen/qwen2.5-coder-32b-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Coder 480B A35B Instruct
qwen/qwen3-coder-480b-a35b-instruct
in $0.00/M
out $0.00/M
ctx: 262,144
max out: 66,536
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3-Next-80B-A3B-Instruct
qwen/qwen3-next-80b-a3b-instruct
in $0.00/M
out $0.00/M
ctx: 262,144
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.5 122B-A10B
qwen/qwen3.5-122b-a10b
in $0.00/M
out $0.00/M
ctx: 262,144
max out: 65,536
in: text, image, video, audio
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3.5-397B-A17B
qwen/qwen3.5-397b-a17b
in $0.00/M
out $0.00/M
ctx: 262,144
max out: 8,192
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
rerank-qa-mistral-4b
nvidia/rerank-qa-mistral-4b
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
riva-translate-4b-instruct-v1_1
nvidia/riva-translate-4b-instruct-v1_1
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
sarvam-m
sarvamai/sarvam-m
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
solar-10.7b-instruct
upstage/solar-10_7b-instruct
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
sparsedrive
nvidia/sparsedrive
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: video
out: text
reasoning
tools
vision
structured
temp
open weights
Step 3.5 Flash
stepfun-ai/step-3.5-flash
in $0.00/M
out $0.00/M
ctx: 256,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Step 3.7 Flash
stepfun-ai/step-3.7-flash
in $0.00/M
out $0.00/M
ctx: 256,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
streampetr
nvidia/streampetr
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: video
out: text
reasoning
tools
vision
structured
temp
open weights
studiovoice
nvidia/studiovoice
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
synthetic-video-detector
nvidia/synthetic-video-detector
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: video
out: text
reasoning
tools
vision
structured
temp
open weights
usdcode
nvidia/usdcode
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
usdvalidate
nvidia/usdvalidate
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Whisper Large v3
openai/whisper-large-v3
in $0.00/M
out $0.00/M
ctx: 0
max out: 4,096
in: audio
out: text
reasoning
tools
vision
structured
temp
open weights