id: cloudflare-ai-gateway
npm: ai-gateway-provider
env: CLOUDFLARE_API_TOKEN, CLOUDFLARE_ACCOUNT_ID, CLOUDFLARE_GATEWAY_ID
Models
BART Large CNN
workers-ai/@cf/facebook/bart-large-cnn
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
BGE Base EN v1.5
workers-ai/@cf/baai/bge-base-en-v1.5
in $0.07/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
BGE Large EN v1.5
workers-ai/@cf/baai/bge-large-en-v1.5
in $0.20/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
BGE M3
workers-ai/@cf/baai/bge-m3
in $0.01/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
BGE Reranker Base
workers-ai/@cf/baai/bge-reranker-base
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
BGE Small EN v1.5
workers-ai/@cf/baai/bge-small-en-v1.5
in $0.02/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Fable 5
anthropic/claude-fable-5
in $10.00/M
out $50.00/M
cache read $1.00/M
cache write $12.50/M
ctx: 1,000,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Haiku 3
anthropic/claude-3-haiku
in $0.25/M
out $1.25/M
cache read $0.03/M
cache write $0.30/M
ctx: 200,000
max out: 4,096
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Haiku 3.5 (latest)
anthropic/claude-3-5-haiku
in $0.80/M
out $4.00/M
cache read $0.08/M
cache write $1.00/M
ctx: 200,000
max out: 8,192
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Haiku 3.5 (latest)
anthropic/claude-3.5-haiku
in $0.80/M
out $4.00/M
cache read $0.08/M
cache write $1.00/M
ctx: 200,000
max out: 8,192
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Haiku 4.5 (latest)
anthropic/claude-haiku-4-5
in $1.00/M
out $5.00/M
cache read $0.10/M
cache write $1.25/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 3
anthropic/claude-3-opus
in $15.00/M
out $75.00/M
cache read $1.50/M
cache write $18.75/M
ctx: 200,000
max out: 4,096
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4 (latest)
anthropic/claude-opus-4
in $15.00/M
out $75.00/M
cache read $1.50/M
cache write $18.75/M
ctx: 200,000
max out: 32,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.1 (latest)
anthropic/claude-opus-4-1
in $15.00/M
out $75.00/M
cache read $1.50/M
cache write $18.75/M
ctx: 200,000
max out: 32,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.5 (latest)
anthropic/claude-opus-4-5
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.6 (latest)
anthropic/claude-opus-4-6
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 1,000,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.7
anthropic/claude-opus-4-7
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 1,000,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Opus 4.8
anthropic/claude-opus-4-8
in $5.00/M
out $25.00/M
cache read $0.50/M
cache write $6.25/M
ctx: 1,000,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 3
anthropic/claude-3-sonnet
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $0.30/M
ctx: 200,000
max out: 4,096
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 3.5 v2
anthropic/claude-3.5-sonnet
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 200,000
max out: 8,192
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4 (latest)
anthropic/claude-sonnet-4
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4.5 (latest)
anthropic/claude-sonnet-4-5
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 200,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Claude Sonnet 4.6
anthropic/claude-sonnet-4-6
in $3.00/M
out $15.00/M
cache read $0.30/M
cache write $3.75/M
ctx: 1,000,000
max out: 64,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
Deepgram Aura 2 (EN)
workers-ai/@cf/deepgram/aura-2-en
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Deepgram Aura 2 (ES)
workers-ai/@cf/deepgram/aura-2-es
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Deepgram Nova 3
workers-ai/@cf/deepgram/nova-3
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DeepSeek R1 Distill Qwen 32B
workers-ai/@cf/deepseek-ai/deepseek-r1-distill-qwen-32b
in $0.50/M
out $4.88/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
DistilBERT SST-2 INT8
workers-ai/@cf/huggingface/distilbert-sst-2-int8
in $0.03/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma 3 12B IT
workers-ai/@cf/google/gemma-3-12b-it
in $0.35/M
out $0.56/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Gemma SEA-LION v4 27B IT
workers-ai/@cf/aisingapore/gemma-sea-lion-v4-27b-it
in $0.35/M
out $0.56/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GLM-4.7-Flash
workers-ai/@cf/zai-org/glm-4.7-flash
in $0.06/M
out $0.40/M
ctx: 131,072
max out: 131,072
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT OSS 120B
workers-ai/@cf/openai/gpt-oss-120b
in $0.35/M
out $0.75/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT OSS 20B
workers-ai/@cf/openai/gpt-oss-20b
in $0.20/M
out $0.30/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-3.5-turbo
openai/gpt-3.5-turbo
in $0.50/M
out $1.50/M
cache read $1.25/M
ctx: 16,385
max out: 4,096
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4
openai/gpt-4
in $30.00/M
out $60.00/M
ctx: 8,192
max out: 8,192
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4 Turbo
openai/gpt-4-turbo
in $10.00/M
out $30.00/M
ctx: 128,000
max out: 4,096
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o
openai/gpt-4o
in $2.50/M
out $10.00/M
cache read $1.25/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-4o mini
openai/gpt-4o-mini
in $0.15/M
out $0.60/M
cache read $0.08/M
ctx: 128,000
max out: 16,384
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.1
openai/gpt-5.1
in $1.25/M
out $10.00/M
cache read $0.13/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.1 Codex
openai/gpt-5.1-codex
in $1.25/M
out $10.00/M
cache read $0.13/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2
openai/gpt-5.2
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 400,000
max out: 128,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.2 Codex
openai/gpt-5.2-codex
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 400,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.3 Codex
openai/gpt-5.3-codex
in $1.75/M
out $14.00/M
cache read $0.17/M
ctx: 400,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.4
openai/gpt-5.4
in $2.50/M
out $15.00/M
cache read $0.25/M
ctx: 1,050,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
GPT-5.5
openai/gpt-5.5
in $5.00/M
out $30.00/M
cache read $0.50/M
ctx: 1,050,000
max out: 128,000
in: text, image, pdf
out: text
reasoning
tools
vision
structured
temp
open weights
IBM Granite 4.0 H Micro
workers-ai/@cf/ibm-granite/granite-4.0-h-micro
in $0.02/M
out $0.11/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
IndicTrans2 EN-Indic 1B
workers-ai/@cf/ai4bharat/indictrans2-en-indic-1B
in $0.34/M
out $0.34/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.5
workers-ai/@cf/moonshotai/kimi-k2.5
in $0.60/M
out $3.00/M
cache read $0.10/M
ctx: 256,000
max out: 256,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Kimi K2.6
workers-ai/@cf/moonshotai/kimi-k2.6
in $0.95/M
out $4.00/M
cache read $0.16/M
ctx: 256,000
max out: 256,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 2 7B Chat FP16
workers-ai/@cf/meta/llama-2-7b-chat-fp16
in $0.56/M
out $6.67/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3 8B Instruct
workers-ai/@cf/meta/llama-3-8b-instruct
in $0.28/M
out $0.83/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3 8B Instruct AWQ
workers-ai/@cf/meta/llama-3-8b-instruct-awq
in $0.12/M
out $0.27/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.1 8B Instruct
workers-ai/@cf/meta/llama-3.1-8b-instruct
in $0.28/M
out $0.83/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.1 8B Instruct AWQ
workers-ai/@cf/meta/llama-3.1-8b-instruct-awq
in $0.12/M
out $0.27/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.1 8B Instruct FP8
workers-ai/@cf/meta/llama-3.1-8b-instruct-fp8
in $0.15/M
out $0.29/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 11B Vision Instruct
workers-ai/@cf/meta/llama-3.2-11b-vision-instruct
in $0.05/M
out $0.68/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 1B Instruct
workers-ai/@cf/meta/llama-3.2-1b-instruct
in $0.03/M
out $0.20/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.2 3B Instruct
workers-ai/@cf/meta/llama-3.2-3b-instruct
in $0.05/M
out $0.34/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 3.3 70B Instruct FP8 Fast
workers-ai/@cf/meta/llama-3.3-70b-instruct-fp8-fast
in $0.29/M
out $2.25/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama 4 Scout 17B 16E Instruct
workers-ai/@cf/meta/llama-4-scout-17b-16e-instruct
in $0.27/M
out $0.85/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Llama Guard 3 8B
workers-ai/@cf/meta/llama-guard-3-8b
in $0.48/M
out $0.03/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
M2M100 1.2B
workers-ai/@cf/meta/m2m100-1.2b
in $0.34/M
out $0.34/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral 7B Instruct v0.1
workers-ai/@cf/mistral/mistral-7b-instruct-v0.1
in $0.11/M
out $0.19/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Mistral Small 3.1 24B Instruct
workers-ai/@cf/mistralai/mistral-small-3.1-24b-instruct
in $0.35/M
out $0.56/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
MyShell MeloTTS
workers-ai/@cf/myshell-ai/melotts
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Nemotron 3 Super 120B
workers-ai/@cf/nvidia/nemotron-3-120b-a12b
in $0.50/M
out $1.50/M
ctx: 256,000
max out: 256,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
o1
openai/o1
in $15.00/M
out $60.00/M
cache read $7.50/M
ctx: 200,000
max out: 100,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
o3
openai/o3
in $2.00/M
out $8.00/M
cache read $0.50/M
ctx: 200,000
max out: 100,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
o3-mini
openai/o3-mini
in $1.10/M
out $4.40/M
cache read $0.55/M
ctx: 200,000
max out: 100,000
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
o3-pro
openai/o3-pro
in $20.00/M
out $80.00/M
ctx: 200,000
max out: 100,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
o4-mini
openai/o4-mini
in $1.10/M
out $4.40/M
cache read $0.28/M
ctx: 200,000
max out: 100,000
in: text, image
out: text
reasoning
tools
vision
structured
temp
open weights
Pipecat Smart Turn v2
workers-ai/@cf/pipecat-ai/smart-turn-v2
in $0.00/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
PLaMo Embedding 1B
workers-ai/@cf/pfnet/plamo-embedding-1b
in $0.02/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen 2.5 Coder 32B Instruct
workers-ai/@cf/qwen/qwen2.5-coder-32b-instruct
in $0.66/M
out $1.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 30B A3B FP8
workers-ai/@cf/qwen/qwen3-30b-a3b-fp8
in $0.05/M
out $0.34/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
Qwen3 Embedding 0.6B
workers-ai/@cf/qwen/qwen3-embedding-0.6b
in $0.01/M
out $0.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights
QwQ 32B
workers-ai/@cf/qwen/qwq-32b
in $0.66/M
out $1.00/M
ctx: 128,000
max out: 16,384
in: text
out: text
reasoning
tools
vision
structured
temp
open weights