omni-moderation-latest | openai | moderation | - | - | 32,768 | - | - | - | - |
omni-moderation-latest-intents | openai | moderation | - | - | 32,768 | - | - | - | - |
omni-moderation-2024-09-26 | openai | moderation | - | - | 32,768 | - | - | - | - |
gpt-4 | openai | chat | $30.00 | $60.00 | 4,096 | - | ✓ | ✓ | - |
gpt-4.1 | openai | chat | $2.00 | $8.00 | 32,768 | ✓ | ✓ | ✓ | - |
gpt-4.1-2025-04-14 | openai | chat | $2.00 | $8.00 | 32,768 | ✓ | ✓ | ✓ | - |
gpt-4.1-mini | openai | chat | $0.40 | $1.60 | 32,768 | ✓ | ✓ | ✓ | - |
gpt-4.1-mini-2025-04-14 | openai | chat | $0.40 | $1.60 | 32,768 | ✓ | ✓ | ✓ | - |
gpt-4.1-nano | openai | chat | $0.10 | $0.40 | 32,768 | ✓ | ✓ | ✓ | - |
gpt-4.1-nano-2025-04-14 | openai | chat | $0.10 | $0.40 | 32,768 | ✓ | ✓ | ✓ | - |
gpt-4o | openai | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
watsonx/ibm/granite-3-8b-instruct | watsonx | chat | $200.00 | $200.00 | 8,192 | - | ✓ | ✓ | - |
watsonx/mistralai/mistral-large | watsonx | chat | $3.00 | $10.00 | 131,072 | - | ✓ | ✓ | - |
gpt-4o-search-preview-2025-03-11 | openai | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4o-search-preview | openai | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4.5-preview | openai | chat | $75.00 | $150.00 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4.5-preview-2025-02-27 | openai | chat | $75.00 | $150.00 | 16,384 | ✓ | ✓ | ✓ | 2025-07-14 |
gpt-4o-audio-preview | openai | chat | $2.50 | $10.00 | 16,384 | - | ✓ | - | - |
gpt-4o-audio-preview-2024-12-17 | openai | chat | $2.50 | $10.00 | 16,384 | - | ✓ | - | - |
gpt-4o-audio-preview-2024-10-01 | openai | chat | $2.50 | $10.00 | 16,384 | - | ✓ | - | - |
gpt-4o-audio-preview-2025-06-03 | openai | chat | $2.50 | $10.00 | 16,384 | - | ✓ | - | - |
gpt-4o-mini-audio-preview | openai | chat | $0.15 | $0.60 | 16,384 | - | ✓ | - | - |
gpt-4o-mini-audio-preview-2024-12-17 | openai | chat | $0.15 | $0.60 | 16,384 | - | ✓ | - | - |
gpt-4o-mini | openai | chat | $0.15 | $0.60 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4o-mini-search-preview-2025-03-11 | openai | chat | $0.15 | $0.60 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4o-mini-search-preview | openai | chat | $0.15 | $0.60 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4o-mini-2024-07-18 | openai | chat | $0.15 | $0.60 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-5 | openai | chat | $1.25 | $10.00 | 128,000 | ✓ | ✓ | ✓ | - |
gpt-5-mini | openai | chat | $0.25 | $2.00 | 128,000 | ✓ | ✓ | ✓ | - |
gpt-5-nano | openai | chat | $0.05 | $0.40 | 128,000 | ✓ | ✓ | ✓ | - |
gpt-5-chat | openai | chat | $1.25 | $10.00 | 128,000 | ✓ | - | ✓ | - |
gpt-5-chat-latest | openai | chat | $1.25 | $10.00 | 128,000 | ✓ | - | ✓ | - |
gpt-5-2025-08-07 | openai | chat | $1.25 | $10.00 | 128,000 | ✓ | ✓ | ✓ | - |
gpt-5-mini-2025-08-07 | openai | chat | $0.25 | $2.00 | 128,000 | ✓ | ✓ | ✓ | - |
gpt-5-nano-2025-08-07 | openai | chat | $0.05 | $0.40 | 128,000 | ✓ | ✓ | ✓ | - |
codex-mini-latest | openai | responses | $1.50 | $6.00 | 100,000 | ✓ | ✓ | ✓ | - |
o1-pro | openai | responses | $150.00 | $600.00 | 100,000 | ✓ | ✓ | ✓ | - |
o1-pro-2025-03-19 | openai | responses | $150.00 | $600.00 | 100,000 | ✓ | ✓ | ✓ | - |
o1 | openai | chat | $15.00 | $60.00 | 100,000 | ✓ | ✓ | ✓ | - |
o1-mini | openai | chat | $1.10 | $4.40 | 65,536 | ✓ | - | ✓ | - |
computer-use-preview | azure | chat | $3.00 | $12.00 | 1,024 | ✓ | ✓ | - | - |
o3-deep-research | openai | responses | $10.00 | $40.00 | 100,000 | ✓ | ✓ | ✓ | - |
o3-deep-research-2025-06-26 | openai | responses | $10.00 | $40.00 | 100,000 | ✓ | ✓ | ✓ | - |
o3-pro | openai | responses | $20.00 | $80.00 | 100,000 | ✓ | ✓ | ✓ | - |
o3-pro-2025-06-10 | openai | responses | $20.00 | $80.00 | 100,000 | ✓ | ✓ | ✓ | - |
o3 | openai | chat | $2.00 | $8.00 | 100,000 | ✓ | ✓ | ✓ | - |
o3-2025-04-16 | openai | chat | $2.00 | $8.00 | 100,000 | ✓ | ✓ | ✓ | - |
o3-mini | openai | chat | $1.10 | $4.40 | 100,000 | - | ✓ | ✓ | - |
o3-mini-2025-01-31 | openai | chat | $1.10 | $4.40 | 100,000 | - | ✓ | ✓ | - |
o4-mini | openai | chat | $1.10 | $4.40 | 100,000 | ✓ | ✓ | ✓ | - |
o4-mini-deep-research | openai | responses | $2.00 | $8.00 | 100,000 | ✓ | ✓ | ✓ | - |
o4-mini-deep-research-2025-06-26 | openai | responses | $2.00 | $8.00 | 100,000 | ✓ | ✓ | ✓ | - |
o4-mini-2025-04-16 | openai | chat | $1.10 | $4.40 | 100,000 | ✓ | ✓ | ✓ | - |
o1-mini-2024-09-12 | openai | chat | $3.00 | $12.00 | 65,536 | ✓ | - | ✓ | - |
o1-preview | openai | chat | $15.00 | $60.00 | 32,768 | ✓ | - | ✓ | - |
o1-preview-2024-09-12 | openai | chat | $15.00 | $60.00 | 32,768 | ✓ | - | ✓ | - |
o1-2024-12-17 | openai | chat | $15.00 | $60.00 | 100,000 | ✓ | ✓ | ✓ | - |
chatgpt-4o-latest | openai | chat | $5.00 | $15.00 | 4,096 | ✓ | ✓ | ✓ | - |
gpt-4o-2024-05-13 | openai | chat | $5.00 | $15.00 | 4,096 | ✓ | ✓ | ✓ | - |
gpt-4o-2024-08-06 | openai | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4o-2024-11-20 | openai | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
gpt-4o-realtime-preview-2024-10-01 | openai | chat | $5.00 | $20.00 | 4,096 | - | ✓ | - | - |
gpt-4o-realtime-preview | openai | chat | $5.00 | $20.00 | 4,096 | - | ✓ | - | - |
gpt-4o-realtime-preview-2024-12-17 | openai | chat | $5.00 | $20.00 | 4,096 | - | ✓ | - | - |
gpt-4o-realtime-preview-2025-06-03 | openai | chat | $5.00 | $20.00 | 4,096 | - | ✓ | - | - |
gpt-4o-mini-realtime-preview | openai | chat | $0.60 | $2.40 | 4,096 | - | ✓ | - | - |
gpt-4o-mini-realtime-preview-2024-12-17 | openai | chat | $0.60 | $2.40 | 4,096 | - | ✓ | - | - |
gpt-4-turbo-preview | openai | chat | $10.00 | $30.00 | 4,096 | - | ✓ | ✓ | - |
gpt-4-0314 | openai | chat | $30.00 | $60.00 | 4,096 | - | - | ✓ | - |
gpt-4-0613 | openai | chat | $30.00 | $60.00 | 4,096 | - | ✓ | ✓ | 2025-06-06 |
gpt-4-32k | openai | chat | $60.00 | $120.00 | 4,096 | - | - | ✓ | - |
gpt-4-32k-0314 | openai | chat | $60.00 | $120.00 | 4,096 | - | - | ✓ | - |
gpt-4-32k-0613 | openai | chat | $60.00 | $120.00 | 4,096 | - | - | ✓ | - |
gpt-4-turbo | openai | chat | $10.00 | $30.00 | 4,096 | ✓ | ✓ | ✓ | - |
gpt-4-turbo-2024-04-09 | openai | chat | $10.00 | $30.00 | 4,096 | ✓ | ✓ | ✓ | - |
gpt-4-1106-preview | openai | chat | $10.00 | $30.00 | 4,096 | - | ✓ | ✓ | - |
gpt-4-0125-preview | openai | chat | $10.00 | $30.00 | 4,096 | - | ✓ | ✓ | - |
gpt-4-vision-preview | openai | chat | $10.00 | $30.00 | 4,096 | ✓ | - | ✓ | 2024-12-06 |
gpt-4-1106-vision-preview | openai | chat | $10.00 | $30.00 | 4,096 | ✓ | - | ✓ | 2024-12-06 |
gpt-3.5-turbo | openai | chat | $1.50 | $2.00 | 4,097 | - | ✓ | ✓ | - |
gpt-3.5-turbo-0301 | openai | chat | $1.50 | $2.00 | 4,097 | - | - | ✓ | - |
gpt-3.5-turbo-0613 | openai | chat | $1.50 | $2.00 | 4,097 | - | ✓ | ✓ | - |
gpt-3.5-turbo-1106 | openai | chat | $1.00 | $2.00 | 16,385 | - | ✓ | ✓ | - |
gpt-3.5-turbo-0125 | openai | chat | $0.50 | $1.50 | 16,385 | - | ✓ | ✓ | - |
gpt-3.5-turbo-16k | openai | chat | $3.00 | $4.00 | 16,385 | - | - | ✓ | - |
gpt-3.5-turbo-16k-0613 | openai | chat | $3.00 | $4.00 | 16,385 | - | - | ✓ | - |
ft:gpt-3.5-turbo | openai | chat | $3.00 | $6.00 | 4,096 | - | - | - | - |
ft:gpt-3.5-turbo-0125 | openai | chat | $3.00 | $6.00 | 4,096 | - | - | - | - |
ft:gpt-3.5-turbo-1106 | openai | chat | $3.00 | $6.00 | 4,096 | - | - | - | - |
ft:gpt-3.5-turbo-0613 | openai | chat | $3.00 | $6.00 | 4,096 | - | - | - | - |
ft:gpt-4-0613 | openai | chat | $30.00 | $60.00 | 4,096 | - | ✓ | - | - |
ft:gpt-4o-2024-08-06 | openai | chat | $3.75 | $15.00 | 16,384 | ✓ | ✓ | - | - |
ft:gpt-4o-2024-11-20 | openai | chat | $3.75 | $15.00 | 16,384 | ✓ | ✓ | ✓ | - |
ft:gpt-4o-mini-2024-07-18 | openai | chat | $0.30 | $1.20 | 16,384 | ✓ | ✓ | ✓ | - |
ft:davinci-002 | text-completion-openai | completion | $2.00 | $2.00 | 16,384 | - | - | - | - |
ft:babbage-002 | text-completion-openai | completion | $0.40 | $0.40 | 16,384 | - | - | - | - |
text-embedding-3-large | openai | embedding | $0.13 | - | 8,191 | - | - | - | - |
text-embedding-3-small | openai | embedding | $0.02 | - | 8,191 | - | - | - | - |
text-embedding-ada-002 | openai | embedding | $0.10 | - | 8,191 | - | - | - | - |
text-embedding-ada-002-v2 | openai | embedding | $0.10 | - | 8,191 | - | - | - | - |
text-moderation-stable | openai | moderation | - | - | 32,768 | - | - | - | - |
text-moderation-007 | openai | moderation | - | - | 32,768 | - | - | - | - |
text-moderation-latest | openai | moderation | - | - | 32,768 | - | - | - | - |
256-x-256/dall-e-2 | openai | image_generation | - | - | - | - | - | - | - |
512-x-512/dall-e-2 | openai | image_generation | - | - | - | - | - | - | - |
1024-x-1024/dall-e-2 | openai | image_generation | - | - | - | - | - | - | - |
hd/1024-x-1792/dall-e-3 | openai | image_generation | - | - | - | - | - | - | - |
hd/1792-x-1024/dall-e-3 | openai | image_generation | - | - | - | - | - | - | - |
hd/1024-x-1024/dall-e-3 | openai | image_generation | - | - | - | - | - | - | - |
standard/1024-x-1792/dall-e-3 | openai | image_generation | - | - | - | - | - | - | - |
standard/1792-x-1024/dall-e-3 | openai | image_generation | - | - | - | - | - | - | - |
standard/1024-x-1024/dall-e-3 | openai | image_generation | - | - | - | - | - | - | - |
gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
low/1024-x-1024/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
medium/1024-x-1024/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
high/1024-x-1024/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
low/1024-x-1536/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
medium/1024-x-1536/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
high/1024-x-1536/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
low/1536-x-1024/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
medium/1536-x-1024/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
high/1536-x-1024/gpt-image-1 | openai | image_generation | - | - | - | - | - | - | - |
gpt-4o-transcribe | openai | audio_transcription | $2.50 | $10.00 | - | - | - | - | - |
gpt-4o-mini-transcribe | openai | audio_transcription | $1.25 | $5.00 | - | - | - | - | - |
whisper-1 | openai | audio_transcription | - | - | - | - | - | - | - |
tts-1 | openai | audio_speech | - | - | - | - | - | - | - |
tts-1-hd | openai | audio_speech | - | - | - | - | - | - | - |
gpt-4o-mini-tts | openai | audio_speech | $2.50 | $10.00 | - | - | - | - | - |
azure/gpt-5 | azure | chat | $1.25 | $10.00 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-5-2025-08-07 | azure | chat | $1.25 | $10.00 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-5-mini | azure | chat | $0.25 | $2.00 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-5-mini-2025-08-07 | azure | chat | $0.25 | $2.00 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-5-nano-2025-08-07 | azure | chat | $0.05 | $0.40 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-5-nano | azure | chat | $0.05 | $0.40 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-5-chat | azure | chat | $1.25 | $10.00 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-5-chat-latest | azure | chat | $1.25 | $10.00 | 128,000 | ✓ | ✓ | ✓ | - |
azure/gpt-4o-mini-tts | azure | audio_speech | $2.50 | $10.00 | - | - | - | - | - |
azure/computer-use-preview | azure | chat | $3.00 | $12.00 | 1,024 | ✓ | ✓ | - | - |
azure/gpt-4o-audio-preview-2024-12-17 | azure | chat | $2.50 | $10.00 | 16,384 | - | ✓ | - | - |
azure/gpt-4o-mini-audio-preview-2024-12-17 | azure | chat | $2.50 | $10.00 | 16,384 | - | ✓ | - | - |
azure/gpt-4.1 | azure | chat | $2.00 | $8.00 | 32,768 | ✓ | ✓ | ✓ | - |
azure/gpt-4.1-2025-04-14 | azure | chat | $2.00 | $8.00 | 32,768 | ✓ | ✓ | ✓ | - |
azure/gpt-4.1-mini | azure | chat | $0.40 | $1.60 | 32,768 | ✓ | ✓ | ✓ | - |
azure/gpt-4.1-mini-2025-04-14 | azure | chat | $0.40 | $1.60 | 32,768 | ✓ | ✓ | ✓ | - |
azure/gpt-4.1-nano | azure | chat | $0.10 | $0.40 | 32,768 | ✓ | ✓ | ✓ | - |
azure/gpt-4.1-nano-2025-04-14 | azure | chat | $0.10 | $0.40 | 32,768 | ✓ | ✓ | ✓ | - |
azure/o3-pro | azure | responses | $20.00 | $80.00 | 100,000 | ✓ | ✓ | - | - |
azure/o3-pro-2025-06-10 | azure | responses | $20.00 | $80.00 | 100,000 | ✓ | ✓ | - | - |
azure/o3 | azure | chat | $2.00 | $8.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/o3-2025-04-16 | azure | chat | $10.00 | $40.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/o3-deep-research | azure | responses | $10.00 | $40.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/o4-mini | azure | chat | $1.10 | $4.40 | 100,000 | ✓ | ✓ | ✓ | - |
azure/gpt-4o-mini-realtime-preview-2024-12-17 | azure | chat | $0.60 | $2.40 | 4,096 | - | ✓ | - | - |
azure/eu/gpt-4o-mini-realtime-preview-2024-12-17 | azure | chat | $0.66 | $2.64 | 4,096 | - | ✓ | - | - |
azure/us/gpt-4o-mini-realtime-preview-2024-12-17 | azure | chat | $0.66 | $2.64 | 4,096 | - | ✓ | - | - |
azure/gpt-4o-realtime-preview-2024-12-17 | azure | chat | $5.00 | $20.00 | 4,096 | - | ✓ | - | - |
azure/us/gpt-4o-realtime-preview-2024-12-17 | azure | chat | $5.50 | $22.00 | 4,096 | - | ✓ | - | - |
azure/eu/gpt-4o-realtime-preview-2024-12-17 | azure | chat | $5.50 | $22.00 | 4,096 | - | ✓ | - | - |
azure/gpt-4o-realtime-preview-2024-10-01 | azure | chat | $5.00 | $20.00 | 4,096 | - | ✓ | - | - |
azure/us/gpt-4o-realtime-preview-2024-10-01 | azure | chat | $5.50 | $22.00 | 4,096 | - | ✓ | - | - |
azure/eu/gpt-4o-realtime-preview-2024-10-01 | azure | chat | $5.50 | $22.00 | 4,096 | - | ✓ | - | - |
azure/o4-mini-2025-04-16 | azure | chat | $1.10 | $4.40 | 100,000 | ✓ | ✓ | ✓ | - |
azure/o3-mini-2025-01-31 | azure | chat | $1.10 | $4.40 | 100,000 | - | - | ✓ | - |
azure/us/o3-mini-2025-01-31 | azure | chat | $1.21 | $4.84 | 100,000 | - | - | ✓ | - |
azure/eu/o3-mini-2025-01-31 | azure | chat | $1.21 | $4.84 | 100,000 | - | - | ✓ | - |
azure/tts-1 | azure | audio_speech | - | - | - | - | - | - | - |
azure/tts-1-hd | azure | audio_speech | - | - | - | - | - | - | - |
azure/whisper-1 | azure | audio_transcription | - | - | - | - | - | - | - |
azure/gpt-4o-transcribe | azure | audio_transcription | $2.50 | $10.00 | - | - | - | - | - |
azure/gpt-4o-mini-transcribe | azure | audio_transcription | $1.25 | $5.00 | - | - | - | - | - |
azure/o3-mini | azure | chat | $1.10 | $4.40 | 100,000 | - | - | ✓ | - |
azure/o1-mini | azure | chat | $1.21 | $4.84 | 65,536 | - | ✓ | ✓ | - |
azure/o1-mini-2024-09-12 | azure | chat | $1.10 | $4.40 | 65,536 | - | ✓ | ✓ | - |
azure/us/o1-mini-2024-09-12 | azure | chat | $1.21 | $4.84 | 65,536 | - | ✓ | ✓ | - |
azure/eu/o1-mini-2024-09-12 | azure | chat | $1.21 | $4.84 | 65,536 | - | ✓ | ✓ | - |
azure/o1 | azure | chat | $15.00 | $60.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/o1-2024-12-17 | azure | chat | $15.00 | $60.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/us/o1-2024-12-17 | azure | chat | $16.50 | $66.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/eu/o1-2024-12-17 | azure | chat | $16.50 | $66.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/codex-mini | azure | responses | $1.50 | $6.00 | 100,000 | ✓ | ✓ | ✓ | - |
azure/o1-preview | azure | chat | $15.00 | $60.00 | 32,768 | - | ✓ | ✓ | - |
azure/o1-preview-2024-09-12 | azure | chat | $15.00 | $60.00 | 32,768 | - | ✓ | ✓ | - |
azure/us/o1-preview-2024-09-12 | azure | chat | $16.50 | $66.00 | 32,768 | - | ✓ | ✓ | - |
azure/eu/o1-preview-2024-09-12 | azure | chat | $16.50 | $66.00 | 32,768 | - | ✓ | ✓ | - |
azure/gpt-4.5-preview | azure | chat | $75.00 | $150.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/gpt-4o | azure | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/global/gpt-4o-2024-11-20 | azure | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/gpt-4o-2024-08-06 | azure | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/global/gpt-4o-2024-08-06 | azure | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/gpt-4o-2024-11-20 | azure | chat | $2.75 | $11.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/us/gpt-4o-2024-11-20 | azure | chat | $2.75 | $11.00 | 16,384 | ✓ | ✓ | - | - |
azure/eu/gpt-4o-2024-11-20 | azure | chat | $2.75 | $11.00 | 16,384 | ✓ | ✓ | - | - |
azure/gpt-4o-2024-05-13 | azure | chat | $5.00 | $15.00 | 4,096 | ✓ | ✓ | ✓ | - |
azure/global-standard/gpt-4o-2024-08-06 | azure | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | ✓ | 2025-08-20 |
azure/us/gpt-4o-2024-08-06 | azure | chat | $2.75 | $11.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/eu/gpt-4o-2024-08-06 | azure | chat | $2.75 | $11.00 | 16,384 | ✓ | ✓ | ✓ | - |
azure/global-standard/gpt-4o-2024-11-20 | azure | chat | $2.50 | $10.00 | 16,384 | ✓ | ✓ | - | 2025-12-20 |
azure/global-standard/gpt-4o-mini | azure | chat | $0.15 | $0.60 | 16,384 | ✓ | ✓ | - | - |
azure/gpt-4o-mini | azure | chat | $0.165 | $0.66 | 16,384 | ✓ | ✓ | ✓ | - |
azure/gpt-4o-mini-2024-07-18 | azure | chat | $0.165 | $0.66 | 16,384 | ✓ | ✓ | ✓ | - |
azure/us/gpt-4o-mini-2024-07-18 | azure | chat | $0.165 | $0.66 | 16,384 | ✓ | ✓ | ✓ | - |
azure/eu/gpt-4o-mini-2024-07-18 | azure | chat | $0.165 | $0.66 | 16,384 | ✓ | ✓ | ✓ | - |
azure/gpt-4-turbo-2024-04-09 | azure | chat | $10.00 | $30.00 | 4,096 | ✓ | ✓ | - | - |
azure/gpt-4-0125-preview | azure | chat | $10.00 | $30.00 | 4,096 | - | ✓ | - | - |
azure/gpt-4-1106-preview | azure | chat | $10.00 | $30.00 | 4,096 | - | ✓ | - | - |
azure/gpt-4-0613 | azure | chat | $30.00 | $60.00 | 4,096 | - | ✓ | - | - |
azure/gpt-4-32k-0613 | azure | chat | $60.00 | $120.00 | 4,096 | - | - | - | - |
azure/gpt-4-32k | azure | chat | $60.00 | $120.00 | 4,096 | - | - | - | - |
azure/gpt-4 | azure | chat | $30.00 | $60.00 | 4,096 | - | ✓ | - | - |
azure/gpt-4-turbo | azure | chat | $10.00 | $30.00 | 4,096 | - | ✓ | - | - |
azure/gpt-4-turbo-vision-preview | azure | chat | $10.00 | $30.00 | 4,096 | ✓ | - | - | - |
azure/gpt-35-turbo-16k-0613 | azure | chat | $3.00 | $4.00 | 4,096 | - | ✓ | - | - |
azure/gpt-35-turbo-1106 | azure | chat | $1.00 | $2.00 | 4,096 | - | ✓ | - | 2025-03-31 |
azure/gpt-35-turbo-0613 | azure | chat | $1.50 | $2.00 | 4,097 | - | ✓ | - | 2025-02-13 |
azure/gpt-35-turbo-0301 | azure | chat | $0.20 | $2.00 | 4,097 | - | ✓ | - | 2025-02-13 |
azure/gpt-35-turbo-0125 | azure | chat | $0.50 | $1.50 | 4,096 | - | ✓ | - | 2025-05-31 |
azure/gpt-3.5-turbo-0125 | azure | chat | $0.50 | $1.50 | 4,096 | - | ✓ | - | 2025-03-31 |
azure/gpt-35-turbo-16k | azure | chat | $3.00 | $4.00 | 4,096 | - | - | - | - |
azure/gpt-35-turbo | azure | chat | $0.50 | $1.50 | 4,096 | - | ✓ | - | - |
azure/gpt-3.5-turbo | azure | chat | $0.50 | $1.50 | 4,096 | - | ✓ | - | - |
azure/gpt-3.5-turbo-instruct-0914 | azure_text | completion | $1.50 | $2.00 | 4,097 | - | - | - | - |
azure/gpt-35-turbo-instruct | azure_text | completion | $1.50 | $2.00 | 4,097 | - | - | - | - |
azure/gpt-35-turbo-instruct-0914 | azure_text | completion | $1.50 | $2.00 | 4,097 | - | - | - | - |
azure/mistral-large-latest | azure | chat | $8.00 | $24.00 | 32,000 | - | ✓ | - | - |
azure/mistral-large-2402 | azure | chat | $8.00 | $24.00 | 32,000 | - | ✓ | - | - |
azure/command-r-plus | azure | chat | $3.00 | $15.00 | 4,096 | - | ✓ | - | - |
azure/ada | azure | embedding | $0.10 | - | 8,191 | - | - | - | - |
azure/text-embedding-ada-002 | azure | embedding | $0.10 | - | 8,191 | - | - | - | - |
azure/text-embedding-3-large | azure | embedding | $0.13 | - | 8,191 | - | - | - | - |
azure/text-embedding-3-small | azure | embedding | $0.02 | - | 8,191 | - | - | - | - |
azure/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/low/1024-x-1024/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/medium/1024-x-1024/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/high/1024-x-1024/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/low/1024-x-1536/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/medium/1024-x-1536/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/high/1024-x-1536/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/low/1536-x-1024/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/medium/1536-x-1024/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/high/1536-x-1024/gpt-image-1 | azure | image_generation | - | - | - | - | - | - | - |
azure/standard/1024-x-1024/dall-e-3 | azure | image_generation | - | - | - | - | - | - | - |
azure/hd/1024-x-1024/dall-e-3 | azure | image_generation | - | - | - | - | - | - | - |
azure/standard/1024-x-1792/dall-e-3 | azure | image_generation | - | - | - | - | - | - | - |
azure/standard/1792-x-1024/dall-e-3 | azure | image_generation | - | - | - | - | - | - | - |
azure/hd/1024-x-1792/dall-e-3 | azure | image_generation | - | - | - | - | - | - | - |
azure/hd/1792-x-1024/dall-e-3 | azure | image_generation | - | - | - | - | - | - | - |
azure/standard/1024-x-1024/dall-e-2 | azure | image_generation | - | - | - | - | - | - | - |
azure_ai/grok-3 | azure_ai | chat | $3.30 | $16.50 | 131,072 | - | ✓ | - | - |
azure_ai/global/grok-3 | azure_ai | chat | $3.00 | $15.00 | 131,072 | - | ✓ | - | - |
azure_ai/global/grok-3-mini | azure_ai | chat | $0.25 | $1.27 | 131,072 | - | ✓ | - | - |
azure_ai/grok-3-mini | azure_ai | chat | $0.275 | $1.38 | 131,072 | - | ✓ | - | - |
azure_ai/deepseek-r1 | azure_ai | chat | $1.35 | $5.40 | 8,192 | - | - | - | - |
azure_ai/deepseek-v3 | azure_ai | chat | $1.14 | $4.56 | 8,192 | - | - | - | - |
azure_ai/deepseek-v3-0324 | azure_ai | chat | $1.14 | $4.56 | 8,192 | - | ✓ | - | - |
azure_ai/jamba-instruct | azure_ai | chat | $0.50 | $0.70 | 4,096 | - | - | - | - |
azure_ai/jais-30b-chat | azure_ai | chat | $3,200.00 | $9,710.00 | 8,192 | - | - | - | - |
azure_ai/mistral-nemo | azure_ai | chat | $0.15 | $0.15 | 4,096 | - | ✓ | - | - |
azure_ai/mistral-medium-2505 | azure_ai | chat | $0.40 | $2.00 | 8,191 | - | ✓ | - | - |
azure_ai/mistral-large | azure_ai | chat | $4.00 | $12.00 | 8,191 | - | ✓ | - | - |
azure_ai/mistral-small | azure_ai | chat | $1.00 | $3.00 | 8,191 | - | ✓ | - | - |
azure_ai/mistral-small-2503 | azure_ai | chat | $1.00 | $3.00 | 128,000 | ✓ | ✓ | - | - |
azure_ai/mistral-large-2407 | azure_ai | chat | $2.00 | $6.00 | 4,096 | - | ✓ | - | - |
azure_ai/mistral-large-latest | azure_ai | chat | $2.00 | $6.00 | 4,096 | - | ✓ | - | - |
azure_ai/ministral-3b | azure_ai | chat | $0.04 | $0.04 | 4,096 | - | ✓ | - | - |
azure_ai/Llama-3.2-11B-Vision-Instruct | azure_ai | chat | $0.37 | $0.37 | 2,048 | ✓ | ✓ | - | - |
azure_ai/Llama-3.3-70B-Instruct | azure_ai | chat | $0.71 | $0.71 | 2,048 | - | ✓ | - | - |
azure_ai/Llama-4-Scout-17B-16E-Instruct | azure_ai | chat | $0.20 | $0.78 | 16,384 | ✓ | ✓ | - | - |
azure_ai/Llama-4-Maverick-17B-128E-Instruct-FP8 | azure_ai | chat | $1.41 | $0.35 | 16,384 | ✓ | ✓ | - | - |
azure_ai/Llama-3.2-90B-Vision-Instruct | azure_ai | chat | $2.04 | $2.04 | 2,048 | ✓ | ✓ | - | - |
azure_ai/Meta-Llama-3-70B-Instruct | azure_ai | chat | $1.10 | $0.37 | 2,048 | - | - | - | - |
azure_ai/Meta-Llama-3.1-8B-Instruct | azure_ai | chat | $0.30 | $0.61 | 2,048 | - | - | - | - |
azure_ai/Meta-Llama-3.1-70B-Instruct | azure_ai | chat | $2.68 | $3.54 | 2,048 | - | - | - | - |
azure_ai/Meta-Llama-3.1-405B-Instruct | azure_ai | chat | $5.33 | $16.00 | 2,048 | - | - | - | - |
azure_ai/Phi-4-mini-instruct | azure_ai | chat | $0.075 | $0.30 | 4,096 | - | ✓ | - | - |
azure_ai/Phi-4-multimodal-instruct | azure_ai | chat | $0.08 | $0.32 | 4,096 | ✓ | ✓ | - | - |
azure_ai/Phi-4 | azure_ai | chat | $0.125 | $0.50 | 16,384 | - | ✓ | - | - |
azure_ai/Phi-3.5-mini-instruct | azure_ai | chat | $0.13 | $0.52 | 4,096 | - | - | - | - |
azure_ai/Phi-3.5-vision-instruct | azure_ai | chat | $0.13 | $0.52 | 4,096 | ✓ | - | - | - |
azure_ai/Phi-3.5-MoE-instruct | azure_ai | chat | $0.16 | $0.64 | 4,096 | - | - | - | - |
azure_ai/Phi-3-mini-4k-instruct | azure_ai | chat | $0.13 | $0.52 | 4,096 | - | - | - | - |
azure_ai/Phi-3-mini-128k-instruct | azure_ai | chat | $0.13 | $0.52 | 4,096 | - | - | - | - |
azure_ai/Phi-3-small-8k-instruct | azure_ai | chat | $0.15 | $0.60 | 4,096 | - | - | - | - |
azure_ai/Phi-3-small-128k-instruct | azure_ai | chat | $0.15 | $0.60 | 4,096 | - | - | - | - |
azure_ai/Phi-3-medium-4k-instruct | azure_ai | chat | $0.17 | $0.68 | 4,096 | - | - | - | - |
azure_ai/Phi-3-medium-128k-instruct | azure_ai | chat | $0.17 | $0.68 | 4,096 | - | - | - | - |
azure_ai/cohere-rerank-v3.5 | azure_ai | rerank | - | - | 4,096 | - | - | - | - |
azure_ai/cohere-rerank-v3-multilingual | azure_ai | rerank | - | - | 4,096 | - | - | - | - |
azure_ai/cohere-rerank-v3-english | azure_ai | rerank | - | - | 4,096 | - | - | - | - |
azure_ai/Cohere-embed-v3-english | azure_ai | embedding | $0.10 | - | 512 | - | - | - | - |
azure_ai/Cohere-embed-v3-multilingual | azure_ai | embedding | $0.10 | - | 512 | - | - | - | - |
azure_ai/embed-v-4-0 | azure_ai | embedding | $0.12 | - | 128,000 | - | - | - | - |
azure_ai/FLUX-1.1-pro | azure_ai | image_generation | - | - | - | - | - | - | - |
azure_ai/FLUX.1-Kontext-pro | azure_ai | image_generation | - | - | - | - | - | - | - |
babbage-002 | text-completion-openai | completion | $0.40 | $0.40 | 16,384 | - | - | - | - |
davinci-002 | text-completion-openai | completion | $2.00 | $2.00 | 16,384 | - | - | - | - |
gpt-3.5-turbo-instruct | text-completion-openai | completion | $1.50 | $2.00 | 4,096 | - | - | - | - |
gpt-3.5-turbo-instruct-0914 | text-completion-openai | completion | $1.50 | $2.00 | 4,097 | - | - | - | - |
mistral/mistral-tiny | mistral | chat | $0.25 | $0.25 | 8,191 | - | - | - | - |
mistral/mistral-small | mistral | chat | $0.10 | $0.30 | 8,191 | - | ✓ | - | - |
mistral/mistral-small-latest | mistral | chat | $0.10 | $0.30 | 8,191 | - | ✓ | - | - |
mistral/mistral-medium | mistral | chat | $2.70 | $8.10 | 8,191 | - | - | - | - |
mistral/mistral-medium-latest | mistral | chat | $0.40 | $2.00 | 8,191 | - | ✓ | - | - |
mistral/mistral-medium-2505 | mistral | chat | $0.40 | $2.00 | 8,191 | - | ✓ | - | - |
mistral/mistral-medium-2312 | mistral | chat | $2.70 | $8.10 | 8,191 | - | - | - | - |
mistral/mistral-large-latest | mistral | chat | $2.00 | $6.00 | 128,000 | - | ✓ | - | - |
mistral/mistral-large-2411 | mistral | chat | $2.00 | $6.00 | 128,000 | - | ✓ | - | - |
mistral/mistral-large-2402 | mistral | chat | $4.00 | $12.00 | 8,191 | - | ✓ | - | - |
mistral/mistral-large-2407 | mistral | chat | $3.00 | $9.00 | 128,000 | - | ✓ | - | - |
mistral/pixtral-large-latest | mistral | chat | $2.00 | $6.00 | 128,000 | ✓ | ✓ | - | - |
mistral/pixtral-large-2411 | mistral | chat | $2.00 | $6.00 | 128,000 | ✓ | ✓ | - | - |
mistral/pixtral-12b-2409 | mistral | chat | $0.15 | $0.15 | 128,000 | ✓ | ✓ | - | - |
mistral/open-mistral-7b | mistral | chat | $0.25 | $0.25 | 8,191 | - | - | - | - |
mistral/open-mixtral-8x7b | mistral | chat | $0.70 | $0.70 | 8,191 | - | ✓ | - | - |
mistral/open-mixtral-8x22b | mistral | chat | $2.00 | $6.00 | 8,191 | - | ✓ | - | - |
mistral/codestral-latest | mistral | chat | $1.00 | $3.00 | 8,191 | - | - | - | - |
mistral/codestral-2405 | mistral | chat | $1.00 | $3.00 | 8,191 | - | - | - | - |
mistral/open-mistral-nemo | mistral | chat | $0.30 | $0.30 | 128,000 | - | - | - | - |
mistral/open-mistral-nemo-2407 | mistral | chat | $0.30 | $0.30 | 128,000 | - | - | - | - |
mistral/open-codestral-mamba | mistral | chat | $0.25 | $0.25 | 256,000 | - | - | - | - |
mistral/codestral-mamba-latest | mistral | chat | $0.25 | $0.25 | 256,000 | - | - | - | - |
mistral/devstral-small-2505 | mistral | chat | $0.10 | $0.30 | 128,000 | - | ✓ | - | - |
mistral/devstral-small-2507 | mistral | chat | $0.10 | $0.30 | 128,000 | - | ✓ | - | - |
mistral/devstral-medium-2507 | mistral | chat | $0.40 | $2.00 | 128,000 | - | ✓ | - | - |
mistral/magistral-medium-latest | mistral | chat | $2.00 | $5.00 | 40,000 | - | ✓ | - | - |
mistral/magistral-medium-2506 | mistral | chat | $2.00 | $5.00 | 40,000 | - | ✓ | - | - |
mistral/magistral-small-latest | mistral | chat | $0.50 | $1.50 | 40,000 | - | ✓ | - | - |
mistral/magistral-small-2506 | mistral | chat | $0.50 | $1.50 | 40,000 | - | ✓ | - | - |
mistral/mistral-embed | mistral | embedding | $0.10 | - | 8,192 | - | - | - | - |
deepseek/deepseek-reasoner | deepseek | chat | $0.55 | $2.19 | 8,192 | - | ✓ | ✓ | - |
deepseek/deepseek-chat | deepseek | chat | $0.27 | $1.10 | 8,192 | - | ✓ | ✓ | - |
deepseek/deepseek-r1 | deepseek | chat | $0.55 | $2.19 | 8,192 | - | ✓ | ✓ | - |
deepseek/deepseek-v3 | deepseek | chat | $0.27 | $1.10 | 8,192 | - | ✓ | ✓ | - |
codestral/codestral-latest | codestral | chat | - | - | 8,191 | - | - | - | - |
codestral/codestral-2405 | codestral | chat | - | - | 8,191 | - | - | - | - |
text-completion-codestral/codestral-latest | text-completion-codestral | completion | - | - | 8,191 | - | - | - | - |
text-completion-codestral/codestral-2405 | text-completion-codestral | completion | - | - | 8,191 | - | - | - | - |
xai/grok-beta | xai | chat | $5.00 | $15.00 | 131,072 | ✓ | ✓ | - | - |
xai/grok-2-vision-1212 | xai | chat | $2.00 | $10.00 | 32,768 | ✓ | ✓ | - | - |
xai/grok-2-vision-latest | xai | chat | $2.00 | $10.00 | 32,768 | ✓ | ✓ | - | - |
xai/grok-2-vision | xai | chat | $2.00 | $10.00 | 32,768 | ✓ | ✓ | - | - |
xai/grok-3 | xai | chat | $3.00 | $15.00 | 131,072 | - | ✓ | - | - |
xai/grok-3-latest | xai | chat | $3.00 | $15.00 | 131,072 | - | ✓ | - | - |
xai/grok-3-beta | xai | chat | $3.00 | $15.00 | 131,072 | - | ✓ | - | - |
xai/grok-3-fast-beta | xai | chat | $5.00 | $25.00 | 131,072 | - | ✓ | - | - |
xai/grok-3-fast-latest | xai | chat | $5.00 | $25.00 | 131,072 | - | ✓ | - | - |
xai/grok-3-mini | xai | chat | $0.30 | $0.50 | 131,072 | - | ✓ | - | - |
xai/grok-3-mini-latest | xai | chat | $0.30 | $0.50 | 131,072 | - | ✓ | - | - |
xai/grok-3-mini-fast | xai | chat | $0.60 | $4.00 | 131,072 | - | ✓ | - | - |
xai/grok-3-mini-fast-latest | xai | chat | $0.60 | $4.00 | 131,072 | - | ✓ | - | - |
xai/grok-3-mini-beta | xai | chat | $0.30 | $0.50 | 131,072 | - | ✓ | - | - |
xai/grok-3-mini-fast-beta | xai | chat | $0.60 | $4.00 | 131,072 | - | ✓ | - | - |
xai/grok-vision-beta | xai | chat | $5.00 | $15.00 | 8,192 | ✓ | ✓ | - | - |
xai/grok-2-1212 | xai | chat | $2.00 | $10.00 | 131,072 | - | ✓ | - | - |
xai/grok-2 | xai | chat | $2.00 | $10.00 | 131,072 | - | ✓ | - | - |
xai/grok-2-latest | xai | chat | $2.00 | $10.00 | 131,072 | - | ✓ | - | - |
xai/grok-4 | xai | chat | $3.00 | $15.00 | 256,000 | - | ✓ | - | - |
xai/grok-4-0709 | xai | chat | $3.00 | $15.00 | 256,000 | - | ✓ | - | - |
xai/grok-4-latest | xai | chat | $3.00 | $15.00 | 256,000 | - | ✓ | - | - |
deepseek/deepseek-coder | deepseek | chat | $0.14 | $0.28 | 4,096 | - | ✓ | ✓ | - |
groq/deepseek-r1-distill-llama-70b | groq | chat | $0.75 | $0.99 | 128,000 | - | ✓ | - | - |
groq/llama-3.3-70b-versatile | groq | chat | $0.59 | $0.79 | 32,768 | - | ✓ | - | - |
groq/llama-3.3-70b-specdec | groq | chat | $0.59 | $0.99 | 8,192 | - | - | - | 2025-04-14 |
groq/llama-guard-3-8b | groq | chat | $0.20 | $0.20 | 8,192 | - | - | - | - |
groq/llama2-70b-4096 | groq | chat | $0.70 | $0.80 | 4,096 | - | ✓ | - | - |
groq/llama3-8b-8192 | groq | chat | $0.05 | $0.08 | 8,192 | - | - | - | - |
groq/llama-3.2-1b-preview | groq | chat | $0.04 | $0.04 | 8,192 | - | ✓ | - | 2025-04-14 |
groq/llama-3.2-3b-preview | groq | chat | $0.06 | $0.06 | 8,192 | - | ✓ | - | 2025-04-14 |
groq/llama-3.2-11b-text-preview | groq | chat | $0.18 | $0.18 | 8,192 | - | ✓ | - | 2024-10-28 |
groq/llama-3.2-11b-vision-preview | groq | chat | $0.18 | $0.18 | 8,192 | ✓ | ✓ | - | 2025-04-14 |
groq/llama-3.2-90b-text-preview | groq | chat | $0.90 | $0.90 | 8,192 | - | ✓ | - | 2024-11-25 |
groq/llama-3.2-90b-vision-preview | groq | chat | $0.90 | $0.90 | 8,192 | ✓ | ✓ | - | 2025-04-14 |
groq/llama3-70b-8192 | groq | chat | $0.59 | $0.79 | 8,192 | - | - | - | - |
groq/llama-3.1-8b-instant | groq | chat | $0.05 | $0.08 | 8,192 | - | ✓ | - | - |
groq/llama-3.1-70b-versatile | groq | chat | $0.59 | $0.79 | 8,192 | - | ✓ | - | 2025-01-24 |
groq/llama-3.1-405b-reasoning | groq | chat | $0.59 | $0.79 | 8,192 | - | ✓ | - | - |
groq/meta-llama/llama-4-scout-17b-16e-instruct | groq | chat | $0.11 | $0.34 | 8,192 | - | ✓ | - | - |
groq/meta-llama/llama-4-maverick-17b-128e-instruct | groq | chat | $0.20 | $0.60 | 8,192 | - | ✓ | - | - |
groq/mistral-saba-24b | groq | chat | $0.79 | $0.79 | 32,000 | - | - | - | - |
groq/mixtral-8x7b-32768 | groq | chat | $0.24 | $0.24 | 32,768 | - | ✓ | - | 2025-03-20 |
groq/gemma-7b-it | groq | chat | $0.07 | $0.07 | 8,192 | - | ✓ | - | 2024-12-18 |
groq/gemma2-9b-it | groq | chat | $0.20 | $0.20 | 8,192 | - | - | - | - |
groq/llama3-groq-70b-8192-tool-use-preview | groq | chat | $0.89 | $0.89 | 8,192 | - | ✓ | - | 2025-01-06 |
groq/llama3-groq-8b-8192-tool-use-preview | groq | chat | $0.19 | $0.19 | 8,192 | - | ✓ | - | 2025-01-06 |
groq/qwen/qwen3-32b | groq | chat | $0.29 | $0.59 | 131,000 | - | ✓ | - | - |
groq/moonshotai/kimi-k2-instruct | groq | chat | $1.00 | $3.00 | 131,072 | - | ✓ | - | - |
groq/playai-tts | groq | audio_speech | - | - | 10,000 | - | - | - | - |
groq/whisper-large-v3 | groq | audio_transcription | - | - | - | - | - | - | - |
groq/whisper-large-v3-turbo | groq | audio_transcription | - | - | - | - | - | - | - |
groq/distil-whisper-large-v3-en | groq | audio_transcription | - | - | - | - | - | - | - |
groq/openai/gpt-oss-20b | groq | chat | $0.10 | $0.50 | 32,768 | - | ✓ | - | - |
groq/openai/gpt-oss-120b | groq | chat | $0.15 | $0.75 | 32,766 | - | ✓ | - | - |
cerebras/llama3.1-8b | cerebras | chat | $0.10 | $0.10 | 128,000 | - | ✓ | - | - |
cerebras/llama3.1-70b | cerebras | chat | $0.60 | $0.60 | 128,000 | - | ✓ | - | - |
cerebras/llama-3.3-70b | cerebras | chat | $0.85 | $1.20 | 128,000 | - | ✓ | - | - |
cerebras/qwen-3-32b | cerebras | chat | $0.40 | $0.80 | 128,000 | - | ✓ | - | - |
cerebras/openai/gpt-oss-20b | cerebras | chat | $0.07 | $0.30 | 32,768 | - | ✓ | - | - |
cerebras/openai/gpt-oss-120b | cerebras | chat | $0.25 | $0.69 | 32,768 | - | ✓ | - | - |
friendliai/meta-llama-3.1-8b-instruct | friendliai | chat | $0.10 | $0.10 | 8,192 | - | ✓ | - | - |
friendliai/meta-llama-3.1-70b-instruct | friendliai | chat | $0.60 | $0.60 | 8,192 | - | ✓ | - | - |
claude-3-haiku-20240307 | anthropic | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | ✓ | 2025-03-01 |
claude-3-5-haiku-20241022 | anthropic | chat | $0.80 | $4.00 | 8,192 | ✓ | ✓ | ✓ | 2025-10-01 |
claude-3-5-haiku-latest | anthropic | chat | $1.00 | $5.00 | 8,192 | ✓ | ✓ | ✓ | 2025-10-01 |
claude-3-opus-latest | anthropic | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | ✓ | 2025-03-01 |
claude-3-opus-20240229 | anthropic | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | ✓ | 2025-03-01 |
claude-3-5-sonnet-latest | anthropic | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | 2025-06-01 |
claude-3-5-sonnet-20240620 | anthropic | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | 2025-06-01 |
claude-opus-4-20250514 | anthropic | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
claude-opus-4-1 | anthropic | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
claude-opus-4-1-20250805 | anthropic | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
claude-sonnet-4-20250514 | anthropic | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | ✓ | - |
claude-4-opus-20250514 | anthropic | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
claude-4-sonnet-20250514 | anthropic | chat | $3.00 | $15.00 | 1,000,000 | ✓ | ✓ | ✓ | - |
claude-3-7-sonnet-latest | anthropic | chat | $3.00 | $15.00 | 128,000 | ✓ | ✓ | ✓ | 2025-06-01 |
claude-3-7-sonnet-20250219 | anthropic | chat | $3.00 | $15.00 | 128,000 | ✓ | ✓ | ✓ | 2026-02-01 |
claude-3-5-sonnet-20241022 | anthropic | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | 2025-10-01 |
text-bison | vertex_ai-text-models | completion | - | - | 2,048 | - | - | - | - |
text-bison@001 | vertex_ai-text-models | completion | - | - | 1,024 | - | - | - | - |
text-bison@002 | vertex_ai-text-models | completion | - | - | 1,024 | - | - | - | - |
text-bison32k | vertex_ai-text-models | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
text-bison32k@002 | vertex_ai-text-models | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
text-unicorn | vertex_ai-text-models | completion | $10.00 | $28.00 | 1,024 | - | - | - | - |
text-unicorn@001 | vertex_ai-text-models | completion | $10.00 | $28.00 | 1,024 | - | - | - | - |
chat-bison | vertex_ai-chat-models | chat | $0.125 | $0.125 | 4,096 | - | - | - | - |
chat-bison@001 | vertex_ai-chat-models | chat | $0.125 | $0.125 | 4,096 | - | - | - | - |
chat-bison@002 | vertex_ai-chat-models | chat | $0.125 | $0.125 | 4,096 | - | - | - | 2025-04-09 |
chat-bison-32k | vertex_ai-chat-models | chat | $0.125 | $0.125 | 8,192 | - | - | - | - |
chat-bison-32k@002 | vertex_ai-chat-models | chat | $0.125 | $0.125 | 8,192 | - | - | - | - |
code-bison | vertex_ai-code-text-models | chat | $0.125 | $0.125 | 1,024 | - | - | - | - |
code-bison@001 | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
code-bison@002 | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
code-bison32k | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
code-bison-32k@002 | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
code-gecko@001 | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 64 | - | - | - | - |
code-gecko@002 | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 64 | - | - | - | - |
code-gecko | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 64 | - | - | - | - |
code-gecko-latest | vertex_ai-code-text-models | completion | $0.125 | $0.125 | 64 | - | - | - | - |
codechat-bison@latest | vertex_ai-code-chat-models | chat | $0.125 | $0.125 | 1,024 | - | - | - | - |
codechat-bison | vertex_ai-code-chat-models | chat | $0.125 | $0.125 | 1,024 | - | - | - | - |
codechat-bison@001 | vertex_ai-code-chat-models | chat | $0.125 | $0.125 | 1,024 | - | - | - | - |
codechat-bison@002 | vertex_ai-code-chat-models | chat | $0.125 | $0.125 | 1,024 | - | - | - | - |
codechat-bison-32k | vertex_ai-code-chat-models | chat | $0.125 | $0.125 | 8,192 | - | - | - | - |
codechat-bison-32k@002 | vertex_ai-code-chat-models | chat | $0.125 | $0.125 | 8,192 | - | - | - | - |
meta_llama/Llama-4-Scout-17B-16E-Instruct-FP8 | meta_llama | chat | - | - | 128,000 | - | ✓ | - | - |
meta_llama/Llama-4-Maverick-17B-128E-Instruct-FP8 | meta_llama | chat | - | - | 128,000 | - | ✓ | - | - |
meta_llama/Llama-3.3-70B-Instruct | meta_llama | chat | - | - | 128,000 | - | ✓ | - | - |
meta_llama/Llama-3.3-8B-Instruct | meta_llama | chat | - | - | 128,000 | - | ✓ | - | - |
gemini-pro | vertex_ai-language-models | chat | $0.50 | $1.50 | 8,192 | - | ✓ | - | - |
gemini-1.0-pro | vertex_ai-language-models | chat | $0.50 | $1.50 | 8,192 | - | ✓ | - | - |
gemini-1.0-pro-001 | vertex_ai-language-models | chat | $0.50 | $1.50 | 8,192 | - | ✓ | - | 2025-04-09 |
gemini-1.0-ultra | vertex_ai-language-models | chat | $0.50 | $1.50 | 8,192 | - | ✓ | - | - |
gemini-1.0-ultra-001 | vertex_ai-language-models | chat | $0.50 | $1.50 | 8,192 | - | ✓ | - | - |
gemini-1.0-pro-002 | vertex_ai-language-models | chat | $0.50 | $1.50 | 8,192 | - | ✓ | - | 2025-04-09 |
gemini-1.5-pro | vertex_ai-language-models | chat | $1.25 | $5.00 | 8,192 | ✓ | ✓ | - | - |
gemini-1.5-pro-002 | vertex_ai-language-models | chat | $1.25 | $5.00 | 8,192 | ✓ | ✓ | - | 2025-09-24 |
gemini-1.5-pro-001 | vertex_ai-language-models | chat | $1.25 | $5.00 | 8,192 | ✓ | ✓ | - | 2025-05-24 |
gemini-1.5-pro-preview-0514 | vertex_ai-language-models | chat | $0.078125 | $0.3125 | 8,192 | - | ✓ | - | - |
gemini-1.5-pro-preview-0215 | vertex_ai-language-models | chat | $0.078125 | $0.3125 | 8,192 | - | ✓ | - | - |
gemini-1.5-pro-preview-0409 | vertex_ai-language-models | chat | $0.078125 | $0.3125 | 8,192 | - | ✓ | - | - |
gemini-1.5-flash | vertex_ai-language-models | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | - | - |
gemini-1.5-flash-exp-0827 | vertex_ai-language-models | chat | $0.004688 | $0.0046875 | 8,192 | ✓ | ✓ | - | - |
gemini-1.5-flash-002 | vertex_ai-language-models | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | - | 2025-09-24 |
gemini-1.5-flash-001 | vertex_ai-language-models | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | - | 2025-05-24 |
gemini-1.5-flash-preview-0514 | vertex_ai-language-models | chat | $0.075 | $0.0046875 | 8,192 | ✓ | ✓ | - | - |
gemini-pro-experimental | vertex_ai-language-models | chat | - | - | 8,192 | - | - | - | - |
gemini-flash-experimental | vertex_ai-language-models | chat | - | - | 8,192 | - | - | - | - |
gemini-pro-vision | vertex_ai-vision-models | chat | $0.50 | $1.50 | 2,048 | ✓ | ✓ | - | - |
gemini-1.0-pro-vision | vertex_ai-vision-models | chat | $0.50 | $1.50 | 2,048 | ✓ | ✓ | - | - |
gemini-1.0-pro-vision-001 | vertex_ai-vision-models | chat | $0.50 | $1.50 | 2,048 | ✓ | ✓ | - | 2025-04-09 |
medlm-medium | vertex_ai-language-models | chat | - | - | 8,192 | - | - | - | - |
medlm-large | vertex_ai-language-models | chat | - | - | 1,024 | - | - | - | - |
gemini-2.5-pro-exp-03-25 | vertex_ai-language-models | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.0-pro-exp-02-05 | vertex_ai-language-models | chat | $1.25 | $10.00 | 8,192 | ✓ | ✓ | ✓ | - |
gemini-2.0-flash-exp | vertex_ai-language-models | chat | $0.15 | $0.60 | 8,192 | ✓ | ✓ | ✓ | - |
gemini-2.0-flash-001 | vertex_ai-language-models | chat | $0.15 | $0.60 | 8,192 | ✓ | ✓ | ✓ | 2026-02-05 |
gemini-2.0-flash-thinking-exp | vertex_ai-language-models | chat | - | - | 8,192 | ✓ | ✓ | ✓ | - |
gemini-2.0-flash-thinking-exp-01-21 | vertex_ai-language-models | chat | - | - | 65,536 | ✓ | - | ✓ | - |
gemini-2.5-pro | vertex_ai-language-models | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-pro-exp-03-25 | gemini | chat | - | - | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-pro | gemini | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-flash | gemini | chat | $0.30 | $2.50 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-flash-image-preview | gemini | chat | $0.30 | $2.50 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-flash | vertex_ai-language-models | chat | $0.30 | $2.50 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-live-001 | gemini | chat | $0.35 | $1.50 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-flash-preview-tts | gemini | chat | $0.15 | $0.60 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-flash-preview-05-20 | gemini | chat | $0.30 | $2.50 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-flash-preview-04-17 | gemini | chat | $0.15 | $0.60 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-flash-lite-preview-06-17 | gemini | chat | $0.10 | $0.40 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-flash-lite | gemini | chat | $0.10 | $0.40 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-flash-image-preview | vertex_ai-language-models | chat | $0.30 | $2.50 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-flash-preview-05-20 | vertex_ai-language-models | chat | $0.30 | $2.50 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-flash-preview-04-17 | vertex_ai-language-models | chat | $0.15 | $0.60 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-flash-lite-preview-06-17 | vertex_ai-language-models | chat | $0.10 | $0.40 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-flash-lite | vertex_ai-language-models | chat | $0.10 | $0.40 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.0-flash | vertex_ai-language-models | chat | $0.10 | $0.40 | 8,192 | ✓ | ✓ | ✓ | - |
gemini-2.0-flash-lite | vertex_ai-language-models | chat | $0.075 | $0.30 | - | ✓ | ✓ | ✓ | - |
gemini-2.0-flash-lite-001 | vertex_ai-language-models | chat | $0.075 | $0.30 | - | ✓ | ✓ | ✓ | 2026-02-25 |
gemini-2.5-pro-preview-06-05 | vertex_ai-language-models | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-pro-preview-05-06 | vertex_ai-language-models | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.5-pro-preview-03-25 | vertex_ai-language-models | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini-2.0-flash-preview-image-generation | vertex_ai-language-models | chat | $0.10 | $0.40 | 8,192 | ✓ | ✓ | ✓ | - |
gemini-2.5-pro-preview-tts | vertex_ai-language-models | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-pro-exp-02-05 | gemini | chat | - | - | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-preview-image-generation | gemini | chat | $0.10 | $0.40 | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash | gemini | chat | $0.10 | $0.40 | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-lite | gemini | chat | $0.075 | $0.30 | - | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-001 | gemini | chat | $0.10 | $0.40 | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-pro-preview-tts | gemini | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-pro-preview-06-05 | gemini | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-pro-preview-05-06 | gemini | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.5-pro-preview-03-25 | gemini | chat | $1.25 | $10.00 | 65,535 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-exp | gemini | chat | - | - | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-lite-preview-02-05 | gemini | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-thinking-exp | gemini | chat | - | - | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-2.0-flash-thinking-exp-01-21 | gemini | chat | - | - | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemma-3-27b-it | gemini | chat | - | - | 8,192 | ✓ | ✓ | - | - |
gemini/learnlm-1.5-pro-experimental | gemini | chat | - | - | 8,192 | ✓ | ✓ | - | - |
vertex_ai/claude-opus-4-1 | vertex_ai-anthropic_models | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
vertex_ai/claude-opus-4-1@20250805 | vertex_ai-anthropic_models | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
vertex_ai/claude-3-sonnet | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
gemini-2.0-flash-live-preview-04-09 | vertex_ai-language-models | chat | $0.50 | $2.00 | 65,535 | ✓ | ✓ | ✓ | - |
vertex_ai/claude-3-sonnet@20240229 | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
vertex_ai/claude-3-5-sonnet | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | - | - |
vertex_ai/claude-3-5-sonnet@20240620 | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | - | - |
vertex_ai/claude-3-5-sonnet-v2 | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | - | - |
vertex_ai/claude-3-5-sonnet-v2@20241022 | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | - | - |
vertex_ai/claude-3-7-sonnet@20250219 | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | 2025-06-01 |
vertex_ai/claude-opus-4 | vertex_ai-anthropic_models | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
vertex_ai/claude-opus-4@20250514 | vertex_ai-anthropic_models | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
vertex_ai/claude-sonnet-4 | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | ✓ | - |
vertex_ai/claude-sonnet-4@20250514 | vertex_ai-anthropic_models | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | ✓ | - |
vertex_ai/claude-3-haiku | vertex_ai-anthropic_models | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | - | - |
vertex_ai/claude-3-haiku@20240307 | vertex_ai-anthropic_models | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | - | - |
vertex_ai/claude-3-5-haiku | vertex_ai-anthropic_models | chat | $1.00 | $5.00 | 8,192 | - | ✓ | - | - |
vertex_ai/claude-3-5-haiku@20241022 | vertex_ai-anthropic_models | chat | $1.00 | $5.00 | 8,192 | - | ✓ | - | - |
vertex_ai/claude-3-opus | vertex_ai-anthropic_models | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
vertex_ai/claude-3-opus@20240229 | vertex_ai-anthropic_models | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
vertex_ai/deepseek-ai/deepseek-r1-0528-maas | vertex_ai-deepseek_models | chat | $1.35 | $5.40 | 8,192 | - | ✓ | ✓ | - |
vertex_ai/qwen/qwen3-coder-480b-a35b-instruct-maas | vertex_ai-qwen_models | chat | $1.00 | $4.00 | 32,768 | - | ✓ | - | - |
vertex_ai/qwen/qwen3-235b-a22b-instruct-2507-maas | vertex_ai-qwen_models | chat | $0.25 | $1.00 | 16,384 | - | ✓ | - | - |
vertex_ai/meta/llama3-405b-instruct-maas | vertex_ai-llama_models | chat | - | - | 32,000 | - | - | - | - |
vertex_ai/meta/llama-4-scout-17b-16e-instruct-maas | vertex_ai-llama_models | chat | $0.25 | $0.70 | 10,000,000 | - | ✓ | - | - |
vertex_ai/meta/llama-4-scout-17b-128e-instruct-maas | vertex_ai-llama_models | chat | $0.25 | $0.70 | 10,000,000 | - | ✓ | - | - |
vertex_ai/meta/llama-4-maverick-17b-128e-instruct-maas | vertex_ai-llama_models | chat | $0.35 | $1.15 | 1,000,000 | - | ✓ | - | - |
vertex_ai/meta/llama-4-maverick-17b-16e-instruct-maas | vertex_ai-llama_models | chat | $0.35 | $1.15 | 1,000,000 | - | ✓ | - | - |
vertex_ai/meta/llama3-70b-instruct-maas | vertex_ai-llama_models | chat | - | - | 32,000 | - | - | - | - |
vertex_ai/meta/llama3-8b-instruct-maas | vertex_ai-llama_models | chat | - | - | 32,000 | - | - | - | - |
vertex_ai/meta/llama-3.1-8b-instruct-maas | vertex_ai-llama_models | chat | - | - | 128,000 | ✓ | - | - | - |
vertex_ai/meta/llama-3.1-70b-instruct-maas | vertex_ai-llama_models | chat | - | - | 128,000 | ✓ | - | - | - |
vertex_ai/meta/llama-3.1-405b-instruct-maas | vertex_ai-llama_models | chat | $5.00 | $16.00 | 128,000 | ✓ | - | - | - |
vertex_ai/meta/llama-3.2-90b-vision-instruct-maas | vertex_ai-llama_models | chat | - | - | 128,000 | ✓ | - | - | - |
vertex_ai/mistral-large@latest | vertex_ai-mistral_models | chat | $2.00 | $6.00 | 8,191 | - | ✓ | - | - |
vertex_ai/mistral-large@2411-001 | vertex_ai-mistral_models | chat | $2.00 | $6.00 | 8,191 | - | ✓ | - | - |
vertex_ai/mistral-large-2411 | vertex_ai-mistral_models | chat | $2.00 | $6.00 | 8,191 | - | ✓ | - | - |
vertex_ai/mistral-large@2407 | vertex_ai-mistral_models | chat | $2.00 | $6.00 | 8,191 | - | ✓ | - | - |
vertex_ai/mistral-nemo@latest | vertex_ai-mistral_models | chat | $0.15 | $0.15 | 128,000 | - | ✓ | - | - |
vertex_ai/mistral-small-2503@001 | vertex_ai-mistral_models | chat | $1.00 | $3.00 | 8,191 | - | ✓ | - | - |
vertex_ai/mistral-small-2503 | vertex_ai-mistral_models | chat | $1.00 | $3.00 | 128,000 | ✓ | ✓ | - | - |
vertex_ai/jamba-1.5-mini@001 | vertex_ai-ai21_models | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
vertex_ai/jamba-1.5-large@001 | vertex_ai-ai21_models | chat | $2.00 | $8.00 | 256,000 | - | - | - | - |
vertex_ai/jamba-1.5 | vertex_ai-ai21_models | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
vertex_ai/jamba-1.5-mini | vertex_ai-ai21_models | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
vertex_ai/jamba-1.5-large | vertex_ai-ai21_models | chat | $2.00 | $8.00 | 256,000 | - | - | - | - |
vertex_ai/mistral-nemo@2407 | vertex_ai-mistral_models | chat | $3.00 | $3.00 | 128,000 | - | ✓ | - | - |
vertex_ai/codestral@latest | vertex_ai-mistral_models | chat | $0.20 | $0.60 | 128,000 | - | ✓ | - | - |
vertex_ai/codestral@2405 | vertex_ai-mistral_models | chat | $0.20 | $0.60 | 128,000 | - | ✓ | - | - |
vertex_ai/codestral-2501 | vertex_ai-mistral_models | chat | $0.20 | $0.60 | 128,000 | - | ✓ | - | - |
vertex_ai/imagegeneration@006 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-4.0-generate-001 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-4.0-generate-preview-06-06 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-4.0-ultra-generate-preview-06-06 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-4.0-ultra-generate-001 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-4.0-fast-generate-001 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-4.0-fast-generate-preview-06-06 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-3.0-generate-002 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-3.0-generate-001 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
vertex_ai/imagen-3.0-fast-generate-001 | vertex_ai-image-models | image_generation | - | - | - | - | - | - | - |
text-embedding-004 | vertex_ai-embedding-models | embedding | $0.10 | - | 2,048 | - | - | - | - |
gemini-embedding-001 | vertex_ai-embedding-models | embedding | $0.15 | - | 2,048 | - | - | - | - |
text-embedding-005 | vertex_ai-embedding-models | embedding | $0.10 | - | 2,048 | - | - | - | - |
text-multilingual-embedding-002 | vertex_ai-embedding-models | embedding | $0.10 | - | 2,048 | - | - | - | - |
multimodalembedding | vertex_ai-embedding-models | embedding | $0.80 | - | 2,048 | - | - | - | - |
multimodalembedding@001 | vertex_ai-embedding-models | embedding | $0.80 | - | 2,048 | - | - | - | - |
text-embedding-large-exp-03-07 | vertex_ai-embedding-models | embedding | $0.10 | - | 8,192 | - | - | - | - |
textembedding-gecko | vertex_ai-embedding-models | embedding | $0.10 | - | 3,072 | - | - | - | - |
textembedding-gecko-multilingual | vertex_ai-embedding-models | embedding | $0.10 | - | 3,072 | - | - | - | - |
textembedding-gecko-multilingual@001 | vertex_ai-embedding-models | embedding | $0.10 | - | 3,072 | - | - | - | - |
textembedding-gecko@001 | vertex_ai-embedding-models | embedding | $0.10 | - | 3,072 | - | - | - | - |
textembedding-gecko@003 | vertex_ai-embedding-models | embedding | $0.10 | - | 3,072 | - | - | - | - |
text-embedding-preview-0409 | vertex_ai-embedding-models | embedding | $0.00625 | - | 3,072 | - | - | - | - |
text-multilingual-embedding-preview-0409 | vertex_ai-embedding-models | embedding | $0.00625 | - | 3,072 | - | - | - | - |
palm/chat-bison | palm | chat | $0.125 | $0.125 | 4,096 | - | - | - | - |
palm/chat-bison-001 | palm | chat | $0.125 | $0.125 | 4,096 | - | - | - | - |
palm/text-bison | palm | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
palm/text-bison-001 | palm | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
palm/text-bison-safety-off | palm | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
palm/text-bison-safety-recitation-off | palm | completion | $0.125 | $0.125 | 1,024 | - | - | - | - |
gemini/gemini-1.5-flash-002 | gemini | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | ✓ | 2025-09-24 |
gemini/gemini-1.5-flash-001 | gemini | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | ✓ | 2025-05-24 |
gemini/gemini-1.5-flash | gemini | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-1.5-flash-latest | gemini | chat | $0.075 | $0.30 | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-1.5-flash-8b | gemini | chat | - | - | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-1.5-flash-8b-exp-0924 | gemini | chat | - | - | 8,192 | ✓ | ✓ | ✓ | - |
gemini/gemini-exp-1114 | gemini | chat | - | - | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-exp-1206 | gemini | chat | - | - | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-1.5-flash-exp-0827 | gemini | chat | - | - | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-1.5-flash-8b-exp-0827 | gemini | chat | - | - | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-pro | gemini | chat | $0.35 | $1.05 | 8,192 | - | ✓ | - | - |
gemini/gemini-1.5-pro | gemini | chat | $3.50 | $10.50 | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-1.5-pro-002 | gemini | chat | $3.50 | $10.50 | 8,192 | ✓ | ✓ | ✓ | 2025-09-24 |
gemini/gemini-1.5-pro-001 | gemini | chat | $3.50 | $10.50 | 8,192 | ✓ | ✓ | ✓ | 2025-05-24 |
gemini/gemini-1.5-pro-exp-0801 | gemini | chat | $3.50 | $10.50 | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-1.5-pro-exp-0827 | gemini | chat | - | - | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-1.5-pro-latest | gemini | chat | $3.50 | $1.05 | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-pro-vision | gemini | chat | $0.35 | $1.05 | 2,048 | ✓ | ✓ | - | - |
gemini/gemini-gemma-2-27b-it | gemini | chat | $0.35 | $1.05 | 8,192 | ✓ | ✓ | - | - |
gemini/gemini-gemma-2-9b-it | gemini | chat | $0.35 | $1.05 | 8,192 | ✓ | ✓ | - | - |
gemini/imagen-4.0-generate-001 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-4.0-generate-preview-06-06 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-4.0-ultra-generate-001 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-4.0-ultra-generate-preview-06-06 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-4.0-fast-generate-001 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-4.0-fast-generate-preview-06-06 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-3.0-generate-002 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-3.0-generate-001 | gemini | image_generation | - | - | - | - | - | - | - |
gemini/imagen-3.0-fast-generate-001 | gemini | image_generation | - | - | - | - | - | - | - |
command-a-03-2025 | cohere_chat | chat | $2.50 | $10.00 | 8,000 | - | ✓ | - | - |
command-r | cohere_chat | chat | $0.15 | $0.60 | 4,096 | - | ✓ | - | - |
command-r-08-2024 | cohere_chat | chat | $0.15 | $0.60 | 4,096 | - | ✓ | - | - |
command-r7b-12-2024 | cohere_chat | chat | $0.15 | $0.0375 | 4,096 | - | ✓ | - | - |
command-light | cohere_chat | chat | $0.30 | $0.60 | 4,096 | - | - | - | - |
command-r-plus | cohere_chat | chat | $2.50 | $10.00 | 4,096 | - | ✓ | - | - |
command-r-plus-08-2024 | cohere_chat | chat | $2.50 | $10.00 | 4,096 | - | ✓ | - | - |
command-nightly | cohere | completion | $1.00 | $2.00 | 4,096 | - | - | - | - |
command | cohere | completion | $1.00 | $2.00 | 4,096 | - | - | - | - |
rerank-v3.5 | cohere | rerank | - | - | 4,096 | - | - | - | - |
rerank-english-v3.0 | cohere | rerank | - | - | 4,096 | - | - | - | - |
rerank-multilingual-v3.0 | cohere | rerank | - | - | 4,096 | - | - | - | - |
rerank-english-v2.0 | cohere | rerank | - | - | 4,096 | - | - | - | - |
rerank-multilingual-v2.0 | cohere | rerank | - | - | 4,096 | - | - | - | - |
embed-english-light-v3.0 | cohere | embedding | $0.10 | - | 1,024 | - | - | - | - |
embed-multilingual-v3.0 | cohere | embedding | $0.10 | - | 1,024 | - | - | - | - |
embed-english-v2.0 | cohere | embedding | $0.10 | - | 4,096 | - | - | - | - |
embed-english-light-v2.0 | cohere | embedding | $0.10 | - | 1,024 | - | - | - | - |
embed-multilingual-v2.0 | cohere | embedding | $0.10 | - | 768 | - | - | - | - |
embed-english-v3.0 | cohere | embedding | $0.10 | - | 1,024 | - | - | - | - |
replicate/meta/llama-2-13b | replicate | chat | $0.10 | $0.50 | 4,096 | - | - | - | - |
replicate/meta/llama-2-13b-chat | replicate | chat | $0.10 | $0.50 | 4,096 | - | - | - | - |
replicate/meta/llama-2-70b | replicate | chat | $0.65 | $2.75 | 4,096 | - | - | - | - |
replicate/meta/llama-2-70b-chat | replicate | chat | $0.65 | $2.75 | 4,096 | - | - | - | - |
replicate/meta/llama-2-7b | replicate | chat | $0.05 | $0.25 | 4,096 | - | - | - | - |
replicate/meta/llama-2-7b-chat | replicate | chat | $0.05 | $0.25 | 4,096 | - | - | - | - |
replicate/meta/llama-3-70b | replicate | chat | $0.65 | $2.75 | 8,192 | - | - | - | - |
replicate/meta/llama-3-70b-instruct | replicate | chat | $0.65 | $2.75 | 8,192 | - | - | - | - |
replicate/meta/llama-3-8b | replicate | chat | $0.05 | $0.25 | 8,086 | - | - | - | - |
replicate/meta/llama-3-8b-instruct | replicate | chat | $0.05 | $0.25 | 8,086 | - | - | - | - |
replicate/mistralai/mistral-7b-v0.1 | replicate | chat | $0.05 | $0.25 | 4,096 | - | - | - | - |
replicate/mistralai/mistral-7b-instruct-v0.2 | replicate | chat | $0.05 | $0.25 | 4,096 | - | - | - | - |
replicate/mistralai/mixtral-8x7b-instruct-v0.1 | replicate | chat | $0.30 | $1.00 | 4,096 | - | - | - | - |
openrouter/deepseek/deepseek-r1-0528 | openrouter | chat | $0.50 | $2.15 | 8,192 | - | ✓ | ✓ | - |
openrouter/deepseek/deepseek-chat-v3.1 | openrouter | chat | $0.20 | $0.80 | 8,192 | - | ✓ | ✓ | - |
openrouter/x-ai/grok-4 | openrouter | chat | $3.00 | $15.00 | 256,000 | - | ✓ | - | - |
openrouter/bytedance/ui-tars-1.5-7b | openrouter | chat | $0.10 | $0.20 | 2,048 | - | - | - | - |
openrouter/deepseek/deepseek-r1 | openrouter | chat | $0.55 | $2.19 | 8,192 | - | ✓ | ✓ | - |
openrouter/deepseek/deepseek-chat | openrouter | chat | $0.14 | $0.28 | 8,192 | - | - | ✓ | - |
openrouter/deepseek/deepseek-chat-v3-0324 | openrouter | chat | $0.14 | $0.28 | 8,192 | - | - | ✓ | - |
openrouter/deepseek/deepseek-coder | openrouter | chat | $0.14 | $0.28 | 8,192 | - | - | ✓ | - |
openrouter/microsoft/wizardlm-2-8x22b:nitro | openrouter | chat | $1.00 | $1.00 | 65,536 | - | - | - | - |
openrouter/google/gemini-2.5-pro | openrouter | chat | $1.25 | $10.00 | 8,192 | ✓ | ✓ | - | - |
openrouter/google/gemini-pro-1.5 | openrouter | chat | $2.50 | $7.50 | 8,192 | ✓ | ✓ | - | - |
openrouter/google/gemini-2.0-flash-001 | openrouter | chat | $0.10 | $0.40 | 8,192 | ✓ | ✓ | - | - |
openrouter/google/gemini-2.5-flash | openrouter | chat | $0.30 | $2.50 | 8,192 | ✓ | ✓ | - | - |
openrouter/mistralai/mixtral-8x22b-instruct | openrouter | chat | $0.65 | $0.65 | 65,536 | - | - | - | - |
openrouter/cohere/command-r-plus | openrouter | chat | $3.00 | $15.00 | 128,000 | - | - | - | - |
openrouter/databricks/dbrx-instruct | openrouter | chat | $0.60 | $0.60 | 32,768 | - | - | - | - |
openrouter/anthropic/claude-3-haiku | openrouter | chat | $0.25 | $1.25 | 200,000 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-3-5-haiku | openrouter | chat | $1.00 | $5.00 | 200,000 | - | ✓ | - | - |
openrouter/anthropic/claude-3-haiku-20240307 | openrouter | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-3-5-haiku-20241022 | openrouter | chat | $1.00 | $5.00 | 8,192 | - | ✓ | - | - |
openrouter/anthropic/claude-3.5-sonnet | openrouter | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-3.5-sonnet:beta | openrouter | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-3.7-sonnet | openrouter | chat | $3.00 | $15.00 | 128,000 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-3.7-sonnet:beta | openrouter | chat | $3.00 | $15.00 | 128,000 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-3-sonnet | openrouter | chat | $3.00 | $15.00 | 200,000 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-sonnet-4 | openrouter | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-opus-4 | openrouter | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | - | - |
openrouter/anthropic/claude-opus-4.1 | openrouter | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | - | - |
openrouter/mistralai/mistral-large | openrouter | chat | $8.00 | $24.00 | 32,000 | - | - | - | - |
openrouter/mistralai/mistral-small-3.1-24b-instruct | openrouter | chat | $0.10 | $0.30 | 32,000 | - | - | - | - |
openrouter/mistralai/mistral-small-3.2-24b-instruct | openrouter | chat | $0.10 | $0.30 | 32,000 | - | - | - | - |
openrouter/cognitivecomputations/dolphin-mixtral-8x7b | openrouter | chat | $0.50 | $0.50 | 32,769 | - | - | - | - |
openrouter/google/gemini-pro-vision | openrouter | chat | $0.125 | $0.375 | 45,875 | ✓ | ✓ | - | - |
openrouter/fireworks/firellava-13b | openrouter | chat | $0.20 | $0.20 | 4,096 | - | - | - | - |
openrouter/meta-llama/llama-3-8b-instruct:free | openrouter | chat | - | - | 8,192 | - | - | - | - |
openrouter/meta-llama/llama-3-8b-instruct:extended | openrouter | chat | $0.225 | $2.25 | 16,384 | - | - | - | - |
openrouter/meta-llama/llama-3-70b-instruct:nitro | openrouter | chat | $0.90 | $0.90 | 8,192 | - | - | - | - |
openrouter/meta-llama/llama-3-70b-instruct | openrouter | chat | $0.59 | $0.79 | 8,192 | - | - | - | - |
openrouter/openai/o1 | openrouter | chat | $15.00 | $60.00 | 100,000 | ✓ | ✓ | ✓ | - |
openrouter/openai/o1-mini | openrouter | chat | $3.00 | $12.00 | 65,536 | - | ✓ | - | - |
openrouter/openai/o1-mini-2024-09-12 | openrouter | chat | $3.00 | $12.00 | 65,536 | - | ✓ | - | - |
openrouter/openai/o1-preview | openrouter | chat | $15.00 | $60.00 | 32,768 | - | ✓ | - | - |
openrouter/openai/o1-preview-2024-09-12 | openrouter | chat | $15.00 | $60.00 | 32,768 | - | ✓ | - | - |
openrouter/openai/o3-mini | openrouter | chat | $1.10 | $4.40 | 65,536 | - | ✓ | - | - |
openrouter/openai/o3-mini-high | openrouter | chat | $1.10 | $4.40 | 65,536 | - | ✓ | - | - |
openrouter/openai/gpt-4o | openrouter | chat | $2.50 | $10.00 | 4,096 | ✓ | ✓ | - | - |
openrouter/openai/gpt-4o-2024-05-13 | openrouter | chat | $5.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
openrouter/openai/gpt-4-vision-preview | openrouter | chat | $10.00 | $30.00 | 130,000 | ✓ | ✓ | - | - |
openrouter/openai/gpt-3.5-turbo | openrouter | chat | $1.50 | $2.00 | 4,095 | - | - | - | - |
openrouter/openai/gpt-3.5-turbo-16k | openrouter | chat | $3.00 | $4.00 | 16,383 | - | - | - | - |
openrouter/openai/gpt-4 | openrouter | chat | $30.00 | $60.00 | 8,192 | - | - | - | - |
openrouter/openai/gpt-5-mini | openrouter | chat | $0.25 | $2.00 | 128,000 | - | - | - | - |
openrouter/openai/gpt-5-nano | openrouter | chat | $0.05 | $0.40 | 128,000 | - | - | - | - |
openrouter/openai/gpt-5-chat | openrouter | chat | $1.25 | $10.00 | 128,000 | - | - | - | - |
openrouter/openai/gpt-oss-20b | openrouter | chat | $0.18 | $0.80 | 32,768 | - | ✓ | - | - |
openrouter/openai/gpt-oss-120b | openrouter | chat | $0.18 | $0.80 | 32,768 | - | ✓ | - | - |
openrouter/anthropic/claude-instant-v1 | openrouter | chat | $1.63 | $5.51 | 100,000 | - | - | - | - |
openrouter/anthropic/claude-2 | openrouter | chat | $11.02 | $32.68 | 100,000 | - | - | - | - |
openrouter/anthropic/claude-3-opus | openrouter | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
openrouter/google/palm-2-chat-bison | openrouter | chat | $0.50 | $0.50 | 25,804 | - | - | - | - |
openrouter/google/palm-2-codechat-bison | openrouter | chat | $0.50 | $0.50 | 20,070 | - | - | - | - |
openrouter/meta-llama/llama-2-13b-chat | openrouter | chat | $0.20 | $0.20 | 4,096 | - | - | - | - |
openrouter/meta-llama/llama-2-70b-chat | openrouter | chat | $1.50 | $1.50 | 4,096 | - | - | - | - |
openrouter/meta-llama/codellama-34b-instruct | openrouter | chat | $0.50 | $0.50 | 8,192 | - | - | - | - |
openrouter/nousresearch/nous-hermes-llama2-13b | openrouter | chat | $0.20 | $0.20 | 4,096 | - | - | - | - |
openrouter/mancer/weaver | openrouter | chat | $5.625 | $5.625 | 8,000 | - | - | - | - |
openrouter/gryphe/mythomax-l2-13b | openrouter | chat | $1.875 | $1.875 | 8,192 | - | - | - | - |
openrouter/jondurbin/airoboros-l2-70b-2.1 | openrouter | chat | $13.875 | $13.875 | 4,096 | - | - | - | - |
openrouter/undi95/remm-slerp-l2-13b | openrouter | chat | $1.875 | $1.875 | 6,144 | - | - | - | - |
openrouter/pygmalionai/mythalion-13b | openrouter | chat | $1.875 | $1.875 | 4,096 | - | - | - | - |
openrouter/mistralai/mistral-7b-instruct | openrouter | chat | $0.13 | $0.13 | 8,192 | - | - | - | - |
openrouter/mistralai/mistral-7b-instruct:free | openrouter | chat | - | - | 8,192 | - | - | - | - |
openrouter/qwen/qwen-2.5-coder-32b-instruct | openrouter | chat | $0.18 | $0.18 | 33,792 | - | - | - | - |
openrouter/qwen/qwen-vl-plus | openrouter | chat | $0.21 | $0.63 | 8,192 | - | - | - | - |
openrouter/qwen/qwen3-coder | openrouter | chat | $1.00 | $5.00 | 1,000,000 | - | - | - | - |
openrouter/switchpoint/router | openrouter | chat | $0.85 | $3.40 | 131,072 | - | - | - | - |
j2-ultra | ai21 | completion | $15.00 | $15.00 | 8,192 | - | - | - | - |
jamba-1.5-mini@001 | ai21 | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
jamba-1.5-large@001 | ai21 | chat | $2.00 | $8.00 | 256,000 | - | - | - | - |
jamba-1.5 | ai21 | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
jamba-1.5-mini | ai21 | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
jamba-1.5-large | ai21 | chat | $2.00 | $8.00 | 256,000 | - | - | - | - |
jamba-large-1.6 | ai21 | chat | $2.00 | $8.00 | 256,000 | - | - | - | - |
jamba-large-1.7 | ai21 | chat | $2.00 | $8.00 | 256,000 | - | - | - | - |
jamba-mini-1.6 | ai21 | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
jamba-mini-1.7 | ai21 | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
j2-mid | ai21 | completion | $10.00 | $10.00 | 8,192 | - | - | - | - |
j2-light | ai21 | completion | $3.00 | $3.00 | 8,192 | - | - | - | - |
dolphin | nlp_cloud | completion | $0.50 | $0.50 | 16,384 | - | - | - | - |
chatdolphin | nlp_cloud | chat | $0.50 | $0.50 | 16,384 | - | - | - | - |
luminous-base | aleph_alpha | completion | $30.00 | $33.00 | 2,048 | - | - | - | - |
luminous-base-control | aleph_alpha | chat | $37.50 | $41.25 | 2,048 | - | - | - | - |
luminous-extended | aleph_alpha | completion | $45.00 | $49.50 | 2,048 | - | - | - | - |
luminous-extended-control | aleph_alpha | chat | $56.25 | $61.875 | 2,048 | - | - | - | - |
luminous-supreme | aleph_alpha | completion | $175.00 | $192.50 | 2,048 | - | - | - | - |
luminous-supreme-control | aleph_alpha | chat | $218.75 | $240.625 | 2,048 | - | - | - | - |
ai21.j2-mid-v1 | bedrock | chat | $12.50 | $12.50 | 8,191 | - | - | - | - |
ai21.j2-ultra-v1 | bedrock | chat | $18.80 | $18.80 | 8,191 | - | - | - | - |
ai21.jamba-instruct-v1:0 | bedrock | chat | $0.50 | $0.70 | 4,096 | - | - | - | - |
ai21.jamba-1-5-large-v1:0 | bedrock | chat | $2.00 | $8.00 | 256,000 | - | - | - | - |
ai21.jamba-1-5-mini-v1:0 | bedrock | chat | $0.20 | $0.40 | 256,000 | - | - | - | - |
amazon.rerank-v1:0 | bedrock | rerank | - | - | 32,000 | - | - | - | - |
amazon.titan-text-lite-v1 | bedrock | chat | $0.30 | $0.40 | 4,000 | - | - | - | - |
amazon.titan-text-express-v1 | bedrock | chat | $1.30 | $1.70 | 8,000 | - | - | - | - |
amazon.titan-text-premier-v1:0 | bedrock | chat | $0.50 | $1.50 | 32,000 | - | - | - | - |
amazon.titan-embed-text-v1 | bedrock | embedding | $0.10 | - | 8,192 | - | - | - | - |
amazon.titan-embed-text-v2:0 | bedrock | embedding | $0.20 | - | 8,192 | - | - | - | - |
amazon.titan-embed-image-v1 | bedrock | embedding | $0.80 | - | 128 | - | - | - | - |
mistral.mistral-7b-instruct-v0:2 | bedrock | chat | $0.15 | $0.20 | 8,191 | - | - | - | - |
mistral.mixtral-8x7b-instruct-v0:1 | bedrock | chat | $0.45 | $0.70 | 8,191 | - | - | - | - |
mistral.mistral-large-2402-v1:0 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | ✓ | - | - |
mistral.mistral-large-2407-v1:0 | bedrock | chat | $3.00 | $9.00 | 8,191 | - | ✓ | - | - |
mistral.mistral-small-2402-v1:0 | bedrock | chat | $1.00 | $3.00 | 8,191 | - | ✓ | - | - |
eu.mistral.pixtral-large-2502-v1:0 | bedrock_converse | chat | $2.00 | $6.00 | 128,000 | - | ✓ | - | - |
us.mistral.pixtral-large-2502-v1:0 | bedrock_converse | chat | $2.00 | $6.00 | 128,000 | - | ✓ | - | - |
bedrock/us-west-2/mistral.mixtral-8x7b-instruct-v0:1 | bedrock | chat | $0.45 | $0.70 | 8,191 | - | - | - | - |
bedrock/us-east-1/mistral.mixtral-8x7b-instruct-v0:1 | bedrock | chat | $0.45 | $0.70 | 8,191 | - | - | - | - |
bedrock/eu-west-3/mistral.mixtral-8x7b-instruct-v0:1 | bedrock | chat | $0.59 | $0.91 | 8,191 | - | - | - | - |
bedrock/us-west-2/mistral.mistral-7b-instruct-v0:2 | bedrock | chat | $0.15 | $0.20 | 8,191 | - | - | - | - |
bedrock/us-east-1/mistral.mistral-7b-instruct-v0:2 | bedrock | chat | $0.15 | $0.20 | 8,191 | - | - | - | - |
bedrock/eu-west-3/mistral.mistral-7b-instruct-v0:2 | bedrock | chat | $0.20 | $0.26 | 8,191 | - | - | - | - |
bedrock/us-east-1/mistral.mistral-large-2402-v1:0 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | ✓ | - | - |
bedrock/us-west-2/mistral.mistral-large-2402-v1:0 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | ✓ | - | - |
bedrock/eu-west-3/mistral.mistral-large-2402-v1:0 | bedrock | chat | $10.40 | $31.20 | 8,191 | - | ✓ | - | - |
amazon.nova-micro-v1:0 | bedrock_converse | chat | $0.035 | $0.14 | 10,000 | - | ✓ | ✓ | - |
us.amazon.nova-micro-v1:0 | bedrock_converse | chat | $0.035 | $0.14 | 10,000 | - | ✓ | ✓ | - |
eu.amazon.nova-micro-v1:0 | bedrock_converse | chat | $0.046 | $0.184 | 10,000 | - | ✓ | ✓ | - |
amazon.nova-lite-v1:0 | bedrock_converse | chat | $0.06 | $0.24 | 10,000 | ✓ | ✓ | ✓ | - |
us.amazon.nova-lite-v1:0 | bedrock_converse | chat | $0.06 | $0.24 | 10,000 | ✓ | ✓ | ✓ | - |
eu.amazon.nova-lite-v1:0 | bedrock_converse | chat | $0.078 | $0.312 | 10,000 | ✓ | ✓ | ✓ | - |
amazon.nova-pro-v1:0 | bedrock_converse | chat | $0.80 | $3.20 | 10,000 | ✓ | ✓ | ✓ | - |
us.amazon.nova-pro-v1:0 | bedrock_converse | chat | $0.80 | $3.20 | 10,000 | ✓ | ✓ | ✓ | - |
1024-x-1024/50-steps/bedrock/amazon.nova-canvas-v1:0 | bedrock | image_generation | - | - | - | - | - | - | - |
eu.amazon.nova-pro-v1:0 | bedrock_converse | chat | $1.05 | $4.20 | 10,000 | ✓ | ✓ | ✓ | - |
apac.amazon.nova-micro-v1:0 | bedrock_converse | chat | $0.037 | $0.148 | 10,000 | - | ✓ | ✓ | - |
apac.amazon.nova-lite-v1:0 | bedrock_converse | chat | $0.063 | $0.252 | 10,000 | ✓ | ✓ | ✓ | - |
apac.amazon.nova-pro-v1:0 | bedrock_converse | chat | $0.84 | $3.36 | 10,000 | ✓ | ✓ | ✓ | - |
us.amazon.nova-premier-v1:0 | bedrock_converse | chat | $2.50 | $12.50 | 10,000 | ✓ | ✓ | - | - |
anthropic.claude-3-sonnet-20240229-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
bedrock/invoke/anthropic.claude-3-5-sonnet-20240620-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
anthropic.claude-3-5-sonnet-20240620-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
openai.gpt-oss-20b-1:0 | bedrock_converse | chat | $0.07 | $0.30 | 128,000 | - | - | - | - |
openai.gpt-oss-120b-1:0 | bedrock_converse | chat | $0.15 | $0.60 | 128,000 | - | - | - | - |
anthropic.claude-opus-4-1-20250805-v1:0 | bedrock_converse | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
anthropic.claude-opus-4-20250514-v1:0 | bedrock_converse | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
anthropic.claude-sonnet-4-20250514-v1:0 | bedrock_converse | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | ✓ | - |
anthropic.claude-3-7-sonnet-20250219-v1:0 | bedrock_converse | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | - |
anthropic.claude-3-5-sonnet-20241022-v2:0 | bedrock | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | - |
anthropic.claude-3-haiku-20240307-v1:0 | bedrock | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | - | - |
anthropic.claude-3-5-haiku-20241022-v1:0 | bedrock | chat | $0.80 | $4.00 | 8,192 | - | ✓ | ✓ | - |
anthropic.claude-3-opus-20240229-v1:0 | bedrock | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
us.anthropic.claude-3-sonnet-20240229-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
us.anthropic.claude-3-5-sonnet-20240620-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
us.anthropic.claude-3-5-sonnet-20241022-v2:0 | bedrock | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | - |
us.anthropic.claude-3-7-sonnet-20250219-v1:0 | bedrock_converse | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | - |
us.anthropic.claude-opus-4-1-20250805-v1:0 | bedrock_converse | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
us.anthropic.claude-opus-4-20250514-v1:0 | bedrock_converse | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
us.anthropic.claude-sonnet-4-20250514-v1:0 | bedrock_converse | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | ✓ | - |
us.anthropic.claude-3-haiku-20240307-v1:0 | bedrock | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | - | - |
us.anthropic.claude-3-5-haiku-20241022-v1:0 | bedrock | chat | $0.80 | $4.00 | 8,192 | - | ✓ | ✓ | - |
us.anthropic.claude-3-opus-20240229-v1:0 | bedrock | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
eu.anthropic.claude-3-sonnet-20240229-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
eu.anthropic.claude-3-5-sonnet-20240620-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
eu.anthropic.claude-3-5-sonnet-20241022-v2:0 | bedrock | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | - |
eu.anthropic.claude-3-7-sonnet-20250219-v1:0 | bedrock | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | - |
eu.anthropic.claude-3-haiku-20240307-v1:0 | bedrock | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | - | - |
eu.anthropic.claude-opus-4-1-20250805-v1:0 | bedrock_converse | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
eu.anthropic.claude-opus-4-20250514-v1:0 | bedrock_converse | chat | $15.00 | $75.00 | 32,000 | ✓ | ✓ | ✓ | - |
eu.anthropic.claude-sonnet-4-20250514-v1:0 | bedrock_converse | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | ✓ | - |
apac.anthropic.claude-3-haiku-20240307-v1:0 | bedrock | chat | $0.25 | $1.25 | 4,096 | ✓ | ✓ | - | - |
apac.anthropic.claude-3-sonnet-20240229-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
apac.anthropic.claude-3-5-sonnet-20240620-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | ✓ | ✓ | - | - |
apac.anthropic.claude-3-5-sonnet-20241022-v2:0 | bedrock | chat | $3.00 | $15.00 | 8,192 | ✓ | ✓ | ✓ | - |
apac.anthropic.claude-sonnet-4-20250514-v1:0 | bedrock_converse | chat | $3.00 | $15.00 | 64,000 | ✓ | ✓ | ✓ | - |
eu.anthropic.claude-3-5-haiku-20241022-v1:0 | bedrock | chat | $0.25 | $1.25 | 8,192 | - | ✓ | ✓ | - |
eu.anthropic.claude-3-opus-20240229-v1:0 | bedrock | chat | $15.00 | $75.00 | 4,096 | ✓ | ✓ | - | - |
anthropic.claude-v1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/us-east-1/anthropic.claude-v1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/us-west-2/anthropic.claude-v1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/anthropic.claude-v1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/anthropic.claude-v1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/eu-central-1/1-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/6-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-east-1/1-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-east-1/6-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/1-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/6-month-commitment/anthropic.claude-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
anthropic.claude-v2 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/us-east-1/anthropic.claude-v2 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/us-west-2/anthropic.claude-v2 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/anthropic.claude-v2 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/anthropic.claude-v2 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-east-1/1-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-east-1/6-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/1-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/6-month-commitment/anthropic.claude-v2 | bedrock | chat | - | - | 8,191 | - | - | - | - |
anthropic.claude-v2:1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/us-east-1/anthropic.claude-v2:1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/us-west-2/anthropic.claude-v2:1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/anthropic.claude-v2:1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/anthropic.claude-v2:1 | bedrock | chat | $8.00 | $24.00 | 8,191 | - | - | - | - |
bedrock/eu-central-1/1-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/6-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-east-1/1-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-east-1/6-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/1-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/6-month-commitment/anthropic.claude-v2:1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
anthropic.claude-instant-v1 | bedrock | chat | $0.80 | $2.40 | 8,191 | - | - | - | - |
bedrock/us-east-1/anthropic.claude-instant-v1 | bedrock | chat | $0.80 | $2.40 | 8,191 | - | - | - | - |
bedrock/us-east-1/1-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-east-1/6-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/1-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/6-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/us-west-2/anthropic.claude-instant-v1 | bedrock | chat | $0.80 | $2.40 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/anthropic.claude-instant-v1 | bedrock | chat | $2.23 | $7.55 | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/1-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/ap-northeast-1/6-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/anthropic.claude-instant-v1 | bedrock | chat | $2.48 | $8.38 | 8,191 | - | - | - | - |
bedrock/eu-central-1/1-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
bedrock/eu-central-1/6-month-commitment/anthropic.claude-instant-v1 | bedrock | chat | - | - | 8,191 | - | - | - | - |
cohere.rerank-v3-5:0 | bedrock | rerank | - | - | 32,000 | - | - | - | - |
cohere.command-text-v14 | bedrock | chat | $1.50 | $2.00 | 4,096 | - | - | - | - |
bedrock/*/1-month-commitment/cohere.command-text-v14 | bedrock | chat | - | - | 4,096 | - | - | - | - |
bedrock/*/6-month-commitment/cohere.command-text-v14 | bedrock | chat | - | - | 4,096 | - | - | - | - |
cohere.command-light-text-v14 | bedrock | chat | $0.30 | $0.60 | 4,096 | - | - | - | - |
bedrock/*/1-month-commitment/cohere.command-light-text-v14 | bedrock | chat | - | - | 4,096 | - | - | - | - |
bedrock/*/6-month-commitment/cohere.command-light-text-v14 | bedrock | chat | - | - | 4,096 | - | - | - | - |
cohere.command-r-plus-v1:0 | bedrock | chat | $3.00 | $15.00 | 4,096 | - | - | - | - |
cohere.command-r-v1:0 | bedrock | chat | $0.50 | $1.50 | 4,096 | - | - | - | - |
cohere.embed-english-v3 | bedrock | embedding | $0.10 | - | 512 | - | - | - | - |
cohere.embed-multilingual-v3 | bedrock | embedding | $0.10 | - | 512 | - | - | - | - |
us.deepseek.r1-v1:0 | bedrock_converse | chat | $1.35 | $5.40 | 4,096 | - | - | - | - |
meta.llama3-3-70b-instruct-v1:0 | bedrock_converse | chat | $0.72 | $0.72 | 4,096 | - | ✓ | - | - |
meta.llama2-13b-chat-v1 | bedrock | chat | $0.75 | $1.00 | 4,096 | - | - | - | - |
meta.llama2-70b-chat-v1 | bedrock | chat | $1.95 | $2.56 | 4,096 | - | - | - | - |
meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.30 | $0.60 | 8,192 | - | - | - | - |
bedrock/us-east-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.30 | $0.60 | 8,192 | - | - | - | - |
bedrock/us-west-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.30 | $0.60 | 8,192 | - | - | - | - |
bedrock/ap-south-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.36 | $0.72 | 8,192 | - | - | - | - |
bedrock/ca-central-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.35 | $0.69 | 8,192 | - | - | - | - |
bedrock/eu-west-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.32 | $0.65 | 8,192 | - | - | - | - |
bedrock/eu-west-2/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.39 | $0.78 | 8,192 | - | - | - | - |
bedrock/sa-east-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.50 | $1.01 | 8,192 | - | - | - | - |
meta.llama3-70b-instruct-v1:0 | bedrock | chat | $2.65 | $3.50 | 8,192 | - | - | - | - |
bedrock/us-east-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $2.65 | $3.50 | 8,192 | - | - | - | - |
bedrock/us-west-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $2.65 | $3.50 | 8,192 | - | - | - | - |
bedrock/ap-south-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $3.18 | $4.20 | 8,192 | - | - | - | - |
bedrock/ca-central-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $3.05 | $4.03 | 8,192 | - | - | - | - |
bedrock/eu-west-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $2.86 | $3.78 | 8,192 | - | - | - | - |
bedrock/eu-west-2/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $3.45 | $4.55 | 8,192 | - | - | - | - |
bedrock/sa-east-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $4.45 | $5.88 | 8,192 | - | - | - | - |
meta.llama3-1-8b-instruct-v1:0 | bedrock | chat | $0.22 | $0.22 | 128,000 | - | ✓ | - | - |
us.meta.llama3-1-8b-instruct-v1:0 | bedrock | chat | $0.22 | $0.22 | 128,000 | - | ✓ | - | - |
meta.llama3-1-70b-instruct-v1:0 | bedrock | chat | $0.99 | $0.99 | 128,000 | - | ✓ | - | - |
us.meta.llama3-1-70b-instruct-v1:0 | bedrock | chat | $0.99 | $0.99 | 128,000 | - | ✓ | - | - |
meta.llama3-1-405b-instruct-v1:0 | bedrock | chat | $5.32 | $16.00 | 128,000 | - | ✓ | - | - |
us.meta.llama3-1-405b-instruct-v1:0 | bedrock | chat | $5.32 | $16.00 | 128,000 | - | ✓ | - | - |
meta.llama3-2-1b-instruct-v1:0 | bedrock | chat | $0.10 | $0.10 | 128,000 | - | ✓ | - | - |
us.meta.llama3-2-1b-instruct-v1:0 | bedrock | chat | $0.10 | $0.10 | 128,000 | - | ✓ | - | - |
eu.meta.llama3-2-1b-instruct-v1:0 | bedrock | chat | $0.13 | $0.13 | 128,000 | - | ✓ | - | - |
meta.llama3-2-3b-instruct-v1:0 | bedrock | chat | $0.15 | $0.15 | 128,000 | - | ✓ | - | - |
us.meta.llama3-2-3b-instruct-v1:0 | bedrock | chat | $0.15 | $0.15 | 128,000 | - | ✓ | - | - |
eu.meta.llama3-2-3b-instruct-v1:0 | bedrock | chat | $0.19 | $0.19 | 128,000 | - | ✓ | - | - |
meta.llama3-2-11b-instruct-v1:0 | bedrock | chat | $0.35 | $0.35 | 128,000 | ✓ | ✓ | - | - |
us.meta.llama3-2-11b-instruct-v1:0 | bedrock | chat | $0.35 | $0.35 | 128,000 | ✓ | ✓ | - | - |
meta.llama3-2-90b-instruct-v1:0 | bedrock | chat | $2.00 | $2.00 | 128,000 | ✓ | ✓ | - | - |
us.meta.llama3-2-90b-instruct-v1:0 | bedrock | chat | $2.00 | $2.00 | 128,000 | ✓ | ✓ | - | - |
us.meta.llama3-3-70b-instruct-v1:0 | bedrock_converse | chat | $0.72 | $0.72 | 4,096 | - | ✓ | - | - |
meta.llama4-maverick-17b-instruct-v1:0 | bedrock_converse | chat | $0.24 | $0.97 | 4,096 | - | ✓ | - | - |
us.meta.llama4-maverick-17b-instruct-v1:0 | bedrock_converse | chat | $0.24 | $0.97 | 4,096 | - | ✓ | - | - |
meta.llama4-scout-17b-instruct-v1:0 | bedrock_converse | chat | $0.17 | $0.66 | 4,096 | - | ✓ | - | - |
us.meta.llama4-scout-17b-instruct-v1:0 | bedrock_converse | chat | $0.17 | $0.66 | 4,096 | - | ✓ | - | - |
512-x-512/50-steps/stability.stable-diffusion-xl-v0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
512-x-512/max-steps/stability.stable-diffusion-xl-v0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
max-x-max/50-steps/stability.stable-diffusion-xl-v0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
max-x-max/max-steps/stability.stable-diffusion-xl-v0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
1024-x-1024/50-steps/stability.stable-diffusion-xl-v1 | bedrock | image_generation | - | - | 77 | - | - | - | - |
1024-x-1024/max-steps/stability.stable-diffusion-xl-v1 | bedrock | image_generation | - | - | 77 | - | - | - | - |
stability.sd3-large-v1:0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
stability.sd3-5-large-v1:0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
stability.stable-image-core-v1:0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
stability.stable-image-core-v1:1 | bedrock | image_generation | - | - | 77 | - | - | - | - |
stability.stable-image-ultra-v1:0 | bedrock | image_generation | - | - | 77 | - | - | - | - |
stability.stable-image-ultra-v1:1 | bedrock | image_generation | - | - | 77 | - | - | - | - |
sagemaker/meta-textgeneration-llama-2-7b | sagemaker | completion | - | - | 4,096 | - | - | - | - |
sagemaker/meta-textgeneration-llama-2-7b-f | sagemaker | chat | - | - | 4,096 | - | - | - | - |
sagemaker/meta-textgeneration-llama-2-13b | sagemaker | completion | - | - | 4,096 | - | - | - | - |
sagemaker/meta-textgeneration-llama-2-13b-f | sagemaker | chat | - | - | 4,096 | - | - | - | - |
sagemaker/meta-textgeneration-llama-2-70b | sagemaker | completion | - | - | 4,096 | - | - | - | - |
sagemaker/meta-textgeneration-llama-2-70b-b-f | sagemaker | chat | - | - | 4,096 | - | - | - | - |
together-ai-up-to-4b | together_ai | chat | $0.10 | $0.10 | - | - | - | - | - |
together-ai-4.1b-8b | together_ai | chat | $0.20 | $0.20 | - | - | - | - | - |
together-ai-8.1b-21b | together_ai | chat | $0.30 | $0.30 | 1,000 | - | - | - | - |
together-ai-21.1b-41b | together_ai | chat | $0.80 | $0.80 | - | - | - | - | - |
together-ai-41.1b-80b | together_ai | chat | $0.90 | $0.90 | - | - | - | - | - |
together-ai-81.1b-110b | together_ai | chat | $1.80 | $1.80 | - | - | - | - | - |
together-ai-embedding-up-to-150m | together_ai | embedding | $0.008 | - | - | - | - | - | - |
together-ai-embedding-151m-to-350m | together_ai | embedding | $0.016 | - | - | - | - | - | - |
together_ai/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo | together_ai | chat | $0.18 | $0.18 | - | - | ✓ | - | - |
together_ai/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo | together_ai | chat | $0.88 | $0.88 | - | - | ✓ | - | - |
together_ai/meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo | together_ai | chat | $3.50 | $3.50 | - | - | ✓ | - | - |
together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo | together_ai | chat | $0.88 | $0.88 | - | - | ✓ | - | - |
together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo-Free | together_ai | chat | - | - | - | - | ✓ | - | - |
together_ai/mistralai/Mixtral-8x7B-Instruct-v0.1 | together_ai | chat | $0.60 | $0.60 | - | - | ✓ | - | - |
together_ai/mistralai/Mistral-7B-Instruct-v0.1 | together_ai | chat | - | - | - | - | ✓ | - | - |
together_ai/togethercomputer/CodeLlama-34b-Instruct | together_ai | chat | - | - | - | - | ✓ | - | - |
together_ai/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 | together_ai | chat | $0.27 | $0.85 | - | - | ✓ | - | - |
together_ai/meta-llama/Llama-4-Scout-17B-16E-Instruct | together_ai | chat | $0.18 | $0.59 | - | - | ✓ | - | - |
together_ai/meta-llama/Llama-3.2-3B-Instruct-Turbo | together_ai | chat | - | - | - | - | ✓ | - | - |
together_ai/Qwen/Qwen2.5-7B-Instruct-Turbo | together_ai | chat | - | - | - | - | ✓ | - | - |
together_ai/Qwen/Qwen2.5-72B-Instruct-Turbo | together_ai | chat | - | - | - | - | ✓ | - | - |
together_ai/Qwen/Qwen3-235B-A22B-Instruct-2507-tput | together_ai | chat | $0.20 | $6.00 | - | - | - | - | - |
together_ai/Qwen/Qwen3-Coder-480B-A35B-Instruct-FP8 | together_ai | chat | $2.00 | $2.00 | - | - | - | - | - |
together_ai/Qwen/Qwen3-235B-A22B-Thinking-2507 | together_ai | chat | $0.65 | $3.00 | - | - | - | - | - |
together_ai/Qwen/Qwen3-235B-A22B-fp8-tput | together_ai | chat | $0.20 | $0.60 | - | - | - | - | - |
together_ai/deepseek-ai/DeepSeek-V3 | together_ai | chat | $1.25 | $1.25 | 8,192 | - | ✓ | - | - |
together_ai/deepseek-ai/DeepSeek-R1 | together_ai | chat | $3.00 | $7.00 | 20,480 | - | ✓ | - | - |
together_ai/deepseek-ai/DeepSeek-R1-0528-tput | together_ai | chat | $0.55 | $2.19 | - | - | - | - | - |
together_ai/mistralai/Mistral-Small-24B-Instruct-2501 | together_ai | chat | - | - | - | - | ✓ | - | - |
together_ai/moonshotai/Kimi-K2-Instruct | together_ai | chat | $1.00 | $3.00 | - | - | ✓ | - | - |
together_ai/openai/gpt-oss-120b | together_ai | chat | $0.15 | $0.60 | - | - | - | - | - |
together_ai/OpenAI/gpt-oss-20B | together_ai | chat | $0.05 | $0.20 | - | - | - | - | - |
together_ai/zai-org/GLM-4.5-Air-FP8 | together_ai | chat | $0.20 | $1.10 | - | - | - | - | - |
ollama/codegemma | ollama | completion | - | - | 8,192 | - | - | - | - |
ollama/codegeex4 | ollama | chat | - | - | 32,768 | - | - | - | - |
ollama/deepseek-coder-v2-instruct | ollama | chat | - | - | 32,768 | - | ✓ | - | - |
ollama/deepseek-coder-v2-base | ollama | completion | - | - | 8,192 | - | ✓ | - | - |
ollama/deepseek-coder-v2-lite-instruct | ollama | chat | - | - | 32,768 | - | ✓ | - | - |
ollama/deepseek-coder-v2-lite-base | ollama | completion | - | - | 8,192 | - | ✓ | - | - |
ollama/internlm2_5-20b-chat | ollama | chat | - | - | 32,768 | - | ✓ | - | - |
ollama/llama2 | ollama | chat | - | - | 4,096 | - | - | - | - |
ollama/llama2:7b | ollama | chat | - | - | 4,096 | - | - | - | - |
ollama/llama2:13b | ollama | chat | - | - | 4,096 | - | - | - | - |
ollama/llama2:70b | ollama | chat | - | - | 4,096 | - | - | - | - |
ollama/llama2-uncensored | ollama | completion | - | - | 4,096 | - | - | - | - |
ollama/llama3 | ollama | chat | - | - | 8,192 | - | - | - | - |
ollama/llama3:8b | ollama | chat | - | - | 8,192 | - | - | - | - |
ollama/llama3:70b | ollama | chat | - | - | 8,192 | - | - | - | - |
ollama/llama3.1 | ollama | chat | - | - | 32,768 | - | ✓ | - | - |
ollama/mistral-large-instruct-2407 | ollama | chat | - | - | 65,536 | - | ✓ | - | - |
ollama/mistral | ollama | completion | - | - | 8,192 | - | ✓ | - | - |
ollama/mistral-7B-Instruct-v0.1 | ollama | chat | - | - | 8,192 | - | ✓ | - | - |
ollama/mistral-7B-Instruct-v0.2 | ollama | chat | - | - | 32,768 | - | ✓ | - | - |
ollama/mixtral-8x7B-Instruct-v0.1 | ollama | chat | - | - | 32,768 | - | ✓ | - | - |
ollama/mixtral-8x22B-Instruct-v0.1 | ollama | chat | - | - | 65,536 | - | ✓ | - | - |
ollama/codellama | ollama | completion | - | - | 4,096 | - | - | - | - |
ollama/orca-mini | ollama | completion | - | - | 4,096 | - | - | - | - |
ollama/vicuna | ollama | completion | - | - | 2,048 | - | - | - | - |
deepinfra/Austism/chronos-hermes-13b-v2 | deepinfra | chat | $0.13 | $0.13 | 4,096 | - | - | - | - |
deepinfra/Gryphe/MythoMax-L2-13b | deepinfra | chat | $0.072 | $0.072 | 4,096 | - | - | - | - |
deepinfra/Gryphe/MythoMax-L2-13b-turbo | deepinfra | chat | $0.13 | $0.13 | 4,096 | - | - | - | - |
deepinfra/KoboldAI/LLaMA2-13B-Tiefighter | deepinfra | chat | $0.10 | $0.10 | 4,096 | - | - | - | - |
deepinfra/NousResearch/Hermes-3-Llama-3.1-405B | deepinfra | chat | $0.70 | $0.80 | 131,072 | - | - | - | - |
deepinfra/NousResearch/Hermes-3-Llama-3.1-70B | deepinfra | chat | $0.10 | $0.28 | 131,072 | - | - | - | - |
deepinfra/NovaSky-AI/Sky-T1-32B-Preview | deepinfra | chat | $0.12 | $0.18 | 32,768 | - | - | - | - |
deepinfra/Phind/Phind-CodeLlama-34B-v2 | deepinfra | chat | $0.60 | $0.60 | 4,096 | - | - | - | - |
deepinfra/Qwen/QVQ-72B-Preview | deepinfra | chat | $0.25 | $0.50 | 32,000 | - | - | - | - |
deepinfra/Qwen/QwQ-32B | deepinfra | chat | $0.075 | $0.15 | 131,072 | - | - | - | - |
deepinfra/Qwen/QwQ-32B-Preview | deepinfra | chat | $0.12 | $0.18 | 32,768 | - | - | - | - |
deepinfra/Qwen/Qwen2-72B-Instruct | deepinfra | chat | $0.35 | $0.40 | 32,768 | - | - | - | - |
deepinfra/Qwen/Qwen2-7B-Instruct | deepinfra | chat | $0.055 | $0.055 | 32,768 | - | - | - | - |
deepinfra/Qwen/Qwen2.5-72B-Instruct | deepinfra | chat | $0.12 | $0.39 | 32,768 | - | - | - | - |
deepinfra/Qwen/Qwen2.5-7B-Instruct | deepinfra | chat | $0.04 | $0.10 | 32,768 | - | - | - | - |
deepinfra/Qwen/Qwen2.5-Coder-32B-Instruct | deepinfra | chat | $0.06 | $0.15 | 32,768 | - | - | - | - |
deepinfra/Qwen/Qwen2.5-Coder-7B | deepinfra | chat | $0.025 | $0.05 | 32,768 | - | - | - | - |
deepinfra/Qwen/Qwen2.5-VL-32B-Instruct | deepinfra | chat | $0.20 | $0.60 | 128,000 | - | - | - | - |
deepinfra/Qwen/Qwen3-14B | deepinfra | chat | $0.06 | $0.24 | 40,960 | - | - | - | - |
deepinfra/Qwen/Qwen3-235B-A22B | deepinfra | chat | $0.13 | $0.60 | 40,960 | - | - | - | - |
deepinfra/Qwen/Qwen3-235B-A22B-Instruct-2507 | deepinfra | chat | $0.13 | $0.60 | 262,144 | - | - | - | - |
deepinfra/Qwen/Qwen3-235B-A22B-Thinking-2507 | deepinfra | chat | $0.13 | $0.60 | 262,144 | - | - | - | - |
deepinfra/Qwen/Qwen3-30B-A3B | deepinfra | chat | $0.08 | $0.29 | 40,960 | - | - | - | - |
deepinfra/Qwen/Qwen3-32B | deepinfra | chat | $0.10 | $0.30 | 40,960 | - | - | - | - |
deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct | deepinfra | chat | $0.40 | $1.60 | 262,144 | - | - | - | - |
deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo | deepinfra | chat | $0.30 | $1.20 | 262,144 | - | - | - | - |
deepinfra/Sao10K/L3-70B-Euryale-v2.1 | deepinfra | chat | $0.70 | $0.80 | 8,192 | - | - | - | - |
deepinfra/Sao10K/L3-8B-Lunaris-v1 | deepinfra | chat | $0.03 | $0.06 | 8,192 | - | - | - | - |
deepinfra/Sao10K/L3-8B-Lunaris-v1-Turbo | deepinfra | chat | $0.02 | $0.05 | 8,192 | - | - | - | - |
deepinfra/Sao10K/L3.1-70B-Euryale-v2.2 | deepinfra | chat | $0.65 | $0.75 | 131,072 | - | - | - | - |
deepinfra/Sao10K/L3.3-70B-Euryale-v2.3 | deepinfra | chat | $0.65 | $0.75 | 131,072 | - | - | - | - |
deepinfra/allenai/olmOCR-7B-0725-FP8 | deepinfra | chat | $0.27 | $1.50 | 16,384 | - | - | - | - |
deepinfra/anthropic/claude-3-7-sonnet-latest | deepinfra | chat | $3.30 | $16.50 | 200,000 | - | - | - | - |
deepinfra/anthropic/claude-4-opus | deepinfra | chat | $16.50 | $82.50 | 200,000 | - | - | - | - |
deepinfra/anthropic/claude-4-sonnet | deepinfra | chat | $3.30 | $16.50 | 200,000 | - | - | - | - |
deepinfra/bigcode/starcoder2-15b-instruct-v0.1 | deepinfra | chat | $0.15 | $0.15 | 4,096 | - | - | - | - |
deepinfra/cognitivecomputations/dolphin-2.6-mixtral-8x7b | deepinfra | chat | $0.24 | $0.24 | 32,768 | - | - | - | - |
deepinfra/cognitivecomputations/dolphin-2.9.1-llama-3-70b | deepinfra | chat | $0.35 | $0.40 | 8,192 | - | - | - | - |
deepinfra/deepinfra/airoboros-70b | deepinfra | chat | $0.70 | $0.90 | 4,096 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-Prover-V2-671B | deepinfra | chat | $0.50 | $2.18 | 163,840 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-R1 | deepinfra | chat | $0.45 | $2.15 | 163,840 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-R1-0528 | deepinfra | chat | $0.50 | $2.15 | 163,840 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-R1-0528-Turbo | deepinfra | chat | $1.00 | $3.00 | 32,768 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-R1-Distill-Llama-70B | deepinfra | chat | $0.10 | $0.40 | 131,072 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B | deepinfra | chat | $0.075 | $0.15 | 131,072 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-R1-Turbo | deepinfra | chat | $1.00 | $3.00 | 163,840 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-V3 | deepinfra | chat | $0.38 | $0.89 | 163,840 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-V3-0324 | deepinfra | chat | $0.28 | $0.88 | 163,840 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-V3-0324-Turbo | deepinfra | chat | $1.00 | $3.00 | 32,768 | - | - | - | - |
deepinfra/deepseek-ai/DeepSeek-V3.1 | deepinfra | chat | $0.30 | $1.00 | 163,840 | - | - | - | - |
deepinfra/google/codegemma-7b-it | deepinfra | chat | $0.07 | $0.07 | 8,192 | - | - | - | - |
deepinfra/google/gemini-1.5-flash | deepinfra | chat | $0.075 | $0.30 | 1,000,000 | - | - | - | - |
deepinfra/google/gemini-1.5-flash-8b | deepinfra | chat | $0.0375 | $0.15 | 1,000,000 | - | - | - | - |
deepinfra/google/gemini-2.0-flash-001 | deepinfra | chat | $0.10 | $0.40 | 1,000,000 | - | - | - | - |
deepinfra/google/gemini-2.5-flash | deepinfra | chat | $0.21 | $1.75 | 1,000,000 | - | - | - | - |
deepinfra/google/gemini-2.5-pro | deepinfra | chat | $0.875 | $7.00 | 1,000,000 | - | - | - | - |
deepinfra/google/gemma-1.1-7b-it | deepinfra | chat | $0.07 | $0.07 | 8,192 | - | - | - | - |
deepinfra/google/gemma-2-27b-it | deepinfra | chat | $0.27 | $0.27 | 8,192 | - | - | - | - |
deepinfra/google/gemma-2-9b-it | deepinfra | chat | $0.03 | $0.06 | 8,192 | - | - | - | - |
deepinfra/google/gemma-3-12b-it | deepinfra | chat | $0.05 | $0.10 | 131,072 | - | - | - | - |
deepinfra/google/gemma-3-27b-it | deepinfra | chat | $0.09 | $0.17 | 131,072 | - | - | - | - |
deepinfra/google/gemma-3-4b-it | deepinfra | chat | $0.02 | $0.04 | 131,072 | - | - | - | - |
deepinfra/lizpreciatior/lzlv_70b_fp16_hf | deepinfra | chat | $0.35 | $0.40 | 4,096 | - | - | - | - |
deepinfra/mattshumer/Reflection-Llama-3.1-70B | deepinfra | chat | $0.35 | $0.40 | 8,192 | - | - | - | - |
deepinfra/meta-llama/Llama-2-13b-chat-hf | deepinfra | chat | $0.13 | $0.13 | 4,096 | - | - | - | - |
deepinfra/meta-llama/Llama-2-70b-chat-hf | deepinfra | chat | $0.64 | $0.80 | 4,096 | - | - | - | - |
deepinfra/meta-llama/Llama-3.2-11B-Vision-Instruct | deepinfra | chat | $0.049 | $0.049 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Llama-3.2-1B-Instruct | deepinfra | chat | $0.005 | $0.01 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Llama-3.2-3B-Instruct | deepinfra | chat | $0.012 | $0.024 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Llama-3.2-90B-Vision-Instruct | deepinfra | chat | $0.35 | $0.40 | 32,768 | - | - | - | - |
deepinfra/meta-llama/Llama-3.3-70B-Instruct | deepinfra | chat | $0.23 | $0.40 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Llama-3.3-70B-Instruct-Turbo | deepinfra | chat | $0.038 | $0.12 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 | deepinfra | chat | $0.15 | $0.60 | 1,048,576 | - | - | - | - |
deepinfra/meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo | deepinfra | chat | $0.50 | $0.50 | 8,192 | - | - | - | - |
deepinfra/meta-llama/Llama-4-Scout-17B-16E-Instruct | deepinfra | chat | $0.08 | $0.30 | 327,680 | - | - | - | - |
deepinfra/meta-llama/Llama-Guard-3-8B | deepinfra | chat | $0.055 | $0.055 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Llama-Guard-4-12B | deepinfra | chat | $0.18 | $0.18 | 163,840 | - | - | - | - |
deepinfra/meta-llama/Meta-Llama-3-70B-Instruct | deepinfra | chat | $0.30 | $0.40 | 8,192 | - | - | - | - |
deepinfra/meta-llama/Meta-Llama-3-8B-Instruct | deepinfra | chat | $0.03 | $0.06 | 8,192 | - | - | - | - |
deepinfra/meta-llama/Meta-Llama-3.1-405B-Instruct | deepinfra | chat | $0.80 | $0.80 | 32,768 | - | - | - | - |
deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct | deepinfra | chat | $0.23 | $0.40 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo | deepinfra | chat | $0.10 | $0.28 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct | deepinfra | chat | $0.03 | $0.05 | 131,072 | - | - | - | - |
deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo | deepinfra | chat | $0.015 | $0.02 | 131,072 | - | - | - | - |
deepinfra/microsoft/Phi-3-medium-4k-instruct | deepinfra | chat | $0.14 | $0.14 | 4,096 | - | - | - | - |
deepinfra/microsoft/Phi-4-multimodal-instruct | deepinfra | chat | $0.05 | $0.10 | 131,072 | - | - | - | - |
deepinfra/microsoft/WizardLM-2-7B | deepinfra | chat | $0.055 | $0.055 | 32,768 | - | - | - | - |
deepinfra/microsoft/WizardLM-2-8x22B | deepinfra | chat | $0.48 | $0.48 | 65,536 | - | - | - | - |
deepinfra/microsoft/phi-4 | deepinfra | chat | $0.07 | $0.14 | 16,384 | - | - | - | - |
deepinfra/microsoft/phi-4-reasoning-plus | deepinfra | chat | $0.07 | $0.35 | 32,768 | - | - | - | - |
deepinfra/mistralai/Devstral-Small-2505 | deepinfra | chat | $0.06 | $0.12 | 128,000 | - | - | - | - |
deepinfra/mistralai/Devstral-Small-2507 | deepinfra | chat | $0.07 | $0.28 | 128,000 | - | - | - | - |
deepinfra/mistralai/Mistral-7B-Instruct-v0.1 | deepinfra | chat | $0.055 | $0.055 | 32,768 | - | - | - | - |
deepinfra/mistralai/Mistral-7B-Instruct-v0.2 | deepinfra | chat | $0.055 | $0.055 | 32,768 | - | - | - | - |
deepinfra/mistralai/Mistral-7B-Instruct-v0.3 | deepinfra | chat | $0.028 | $0.054 | 32,768 | - | - | - | - |
deepinfra/mistralai/Mistral-Nemo-Instruct-2407 | deepinfra | chat | $0.02 | $0.04 | 131,072 | - | - | - | - |
deepinfra/mistralai/Mistral-Small-24B-Instruct-2501 | deepinfra | chat | $0.05 | $0.08 | 32,768 | - | - | - | - |
deepinfra/mistralai/Mistral-Small-3.1-24B-Instruct-2503 | deepinfra | chat | $0.05 | $0.10 | 128,000 | - | - | - | - |
deepinfra/mistralai/Mistral-Small-3.2-24B-Instruct-2506 | deepinfra | chat | $0.05 | $0.10 | 128,000 | - | - | - | - |
deepinfra/mistralai/Mixtral-8x22B-Instruct-v0.1 | deepinfra | chat | $0.65 | $0.65 | 65,536 | - | - | - | - |
deepinfra/mistralai/Mixtral-8x7B-Instruct-v0.1 | deepinfra | chat | $0.08 | $0.24 | 32,768 | - | - | - | - |
deepinfra/moonshotai/Kimi-K2-Instruct | deepinfra | chat | $0.50 | $2.00 | 131,072 | - | - | - | - |
deepinfra/nvidia/Llama-3.1-Nemotron-70B-Instruct | deepinfra | chat | $0.12 | $0.30 | 131,072 | - | - | - | - |
deepinfra/nvidia/Nemotron-4-340B-Instruct | deepinfra | chat | $4.20 | $4.20 | 4,096 | - | - | - | - |
deepinfra/openai/gpt-oss-120b | deepinfra | chat | $0.09 | $0.45 | 131,072 | - | - | - | - |
deepinfra/openai/gpt-oss-20b | deepinfra | chat | $0.04 | $0.16 | 131,072 | - | - | - | - |
deepinfra/openbmb/MiniCPM-Llama3-V-2_5 | deepinfra | chat | $0.34 | $0.34 | 8,192 | - | - | - | - |
deepinfra/openchat/openchat-3.6-8b | deepinfra | chat | $0.055 | $0.055 | 8,192 | - | - | - | - |
deepinfra/openchat/openchat_3.5 | deepinfra | chat | $0.055 | $0.055 | 8,192 | - | - | - | - |
deepinfra/zai-org/GLM-4.5 | deepinfra | chat | $0.55 | $2.00 | 131,072 | - | - | - | - |
deepinfra/zai-org/GLM-4.5-Air | deepinfra | chat | $0.20 | $1.10 | 131,072 | - | - | - | - |
perplexity/codellama-34b-instruct | perplexity | chat | $0.35 | $1.40 | 16,384 | - | - | - | - |
perplexity/codellama-70b-instruct | perplexity | chat | $0.70 | $2.80 | 16,384 | - | - | - | - |
perplexity/llama-3.1-70b-instruct | perplexity | chat | $1.00 | $1.00 | 131,072 | - | - | - | - |
perplexity/llama-3.1-8b-instruct | perplexity | chat | $0.20 | $0.20 | 131,072 | - | - | - | - |
perplexity/llama-3.1-sonar-huge-128k-online | perplexity | chat | $5.00 | $5.00 | 127,072 | - | - | - | 2025-02-22 |
perplexity/llama-3.1-sonar-large-128k-online | perplexity | chat | $1.00 | $1.00 | 127,072 | - | - | - | 2025-02-22 |
perplexity/llama-3.1-sonar-large-128k-chat | perplexity | chat | $1.00 | $1.00 | 131,072 | - | - | - | 2025-02-22 |
perplexity/llama-3.1-sonar-small-128k-chat | perplexity | chat | $0.20 | $0.20 | 131,072 | - | - | - | 2025-02-22 |
perplexity/llama-3.1-sonar-small-128k-online | perplexity | chat | $0.20 | $0.20 | 127,072 | - | - | - | 2025-02-22 |
perplexity/pplx-7b-chat | perplexity | chat | $0.07 | $0.28 | 8,192 | - | - | - | - |
perplexity/pplx-70b-chat | perplexity | chat | $0.70 | $2.80 | 4,096 | - | - | - | - |
perplexity/pplx-7b-online | perplexity | chat | - | $0.28 | 4,096 | - | - | - | - |
perplexity/pplx-70b-online | perplexity | chat | - | $2.80 | 4,096 | - | - | - | - |
perplexity/llama-2-70b-chat | perplexity | chat | $0.70 | $2.80 | 4,096 | - | - | - | - |
perplexity/mistral-7b-instruct | perplexity | chat | $0.07 | $0.28 | 4,096 | - | - | - | - |
perplexity/mixtral-8x7b-instruct | perplexity | chat | $0.07 | $0.28 | 4,096 | - | - | - | - |
perplexity/sonar-small-chat | perplexity | chat | $0.07 | $0.28 | 16,384 | - | - | - | - |
perplexity/sonar-small-online | perplexity | chat | - | $0.28 | 12,000 | - | - | - | - |
perplexity/sonar-medium-chat | perplexity | chat | $0.60 | $1.80 | 16,384 | - | - | - | - |
perplexity/sonar-medium-online | perplexity | chat | - | $1.80 | 12,000 | - | - | - | - |
perplexity/sonar | perplexity | chat | $1.00 | $1.00 | 128,000 | - | - | - | - |
perplexity/sonar-pro | perplexity | chat | $3.00 | $15.00 | 8,000 | - | - | - | - |
perplexity/sonar-reasoning | perplexity | chat | $1.00 | $5.00 | 128,000 | - | - | - | - |
perplexity/sonar-reasoning-pro | perplexity | chat | $2.00 | $8.00 | 128,000 | - | - | - | - |
perplexity/sonar-deep-research | perplexity | chat | $2.00 | $8.00 | 128,000 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/llama-v3p2-1b-instruct | fireworks_ai | chat | $0.10 | $0.10 | 16,384 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/llama-v3p2-3b-instruct | fireworks_ai | chat | $0.10 | $0.10 | 16,384 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/llama-v3p1-8b-instruct | fireworks_ai | chat | $0.10 | $0.10 | 16,384 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/llama-v3p2-11b-vision-instruct | fireworks_ai | chat | $0.20 | $0.20 | 16,384 | ✓ | - | - | - |
fireworks_ai/accounts/fireworks/models/llama-v3p2-90b-vision-instruct | fireworks_ai | chat | $0.90 | $0.90 | 16,384 | ✓ | - | - | - |
fireworks_ai/accounts/fireworks/models/firefunction-v2 | fireworks_ai | chat | $0.90 | $0.90 | 8,192 | - | ✓ | - | - |
fireworks_ai/accounts/fireworks/models/mixtral-8x22b-instruct-hf | fireworks_ai | chat | $1.20 | $1.20 | 65,536 | - | ✓ | - | - |
fireworks_ai/accounts/fireworks/models/qwen2-72b-instruct | fireworks_ai | chat | $0.90 | $0.90 | 32,768 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/qwen2p5-coder-32b-instruct | fireworks_ai | chat | $0.90 | $0.90 | 4,096 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/yi-large | fireworks_ai | chat | $3.00 | $3.00 | 32,768 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/deepseek-coder-v2-instruct | fireworks_ai | chat | $1.20 | $1.20 | 65,536 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/deepseek-v3 | fireworks_ai | chat | $0.90 | $0.90 | 8,192 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/deepseek-v3-0324 | fireworks_ai | chat | $0.90 | $0.90 | 163,840 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/deepseek-r1 | fireworks_ai | chat | $3.00 | $8.00 | 20,480 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/deepseek-r1-basic | fireworks_ai | chat | $0.55 | $2.19 | 20,480 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/deepseek-r1-0528 | fireworks_ai | chat | $3.00 | $8.00 | 160,000 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/deepseek-v3p1 | fireworks_ai | chat | $0.56 | $1.68 | 8,192 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/kimi-k2-instruct | fireworks_ai | chat | $0.60 | $2.50 | 131,072 | - | ✓ | - | - |
fireworks_ai/accounts/fireworks/models/llama-v3p1-405b-instruct | fireworks_ai | chat | $3.00 | $3.00 | 16,384 | - | ✓ | - | - |
fireworks_ai/accounts/fireworks/models/llama4-maverick-instruct-basic | fireworks_ai | chat | $0.22 | $0.88 | 131,072 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/llama4-scout-instruct-basic | fireworks_ai | chat | $0.15 | $0.60 | 131,072 | - | - | - | - |
fireworks_ai/accounts/fireworks/models/glm-4p5 | fireworks_ai | chat | $0.55 | $2.19 | 96,000 | - | ✓ | - | - |
fireworks_ai/accounts/fireworks/models/glm-4p5-air | fireworks_ai | chat | $0.22 | $0.88 | 96,000 | - | ✓ | - | - |
fireworks_ai/accounts/fireworks/models/gpt-oss-120b | fireworks_ai | chat | $0.15 | $0.60 | 131,072 | - | ✓ | - | - |
fireworks_ai/accounts/fireworks/models/gpt-oss-20b | fireworks_ai | chat | $0.05 | $0.20 | 131,072 | - | ✓ | - | - |
fireworks_ai/nomic-ai/nomic-embed-text-v1.5 | fireworks_ai-embedding-models | embedding | $0.008 | - | 8,192 | - | - | - | - |
fireworks_ai/nomic-ai/nomic-embed-text-v1 | fireworks_ai-embedding-models | embedding | $0.008 | - | 8,192 | - | - | - | - |
fireworks_ai/WhereIsAI/UAE-Large-V1 | fireworks_ai-embedding-models | embedding | $0.016 | - | 512 | - | - | - | - |
fireworks_ai/thenlper/gte-large | fireworks_ai-embedding-models | embedding | $0.016 | - | 512 | - | - | - | - |
fireworks_ai/thenlper/gte-base | fireworks_ai-embedding-models | embedding | $0.008 | - | 512 | - | - | - | - |
fireworks-ai-up-to-4b | fireworks_ai | chat | $0.20 | $0.20 | - | - | - | - | - |
fireworks-ai-4.1b-to-16b | fireworks_ai | chat | $0.20 | $0.20 | - | - | - | - | - |
fireworks-ai-above-16b | fireworks_ai | chat | $0.90 | $0.90 | - | - | - | - | - |
fireworks-ai-moe-up-to-56b | fireworks_ai | chat | $0.50 | $0.50 | - | - | - | - | - |
fireworks-ai-56b-to-176b | fireworks_ai | chat | $1.20 | $1.20 | - | - | - | - | - |
fireworks-ai-default | fireworks_ai | chat | - | - | - | - | - | - | - |
fireworks-ai-embedding-up-to-150m | fireworks_ai-embedding-models | chat | $0.008 | - | - | - | - | - | - |
fireworks-ai-embedding-150m-to-350m | fireworks_ai-embedding-models | chat | $0.016 | - | - | - | - | - | - |
anyscale/mistralai/Mistral-7B-Instruct-v0.1 | anyscale | chat | $0.15 | $0.15 | 16,384 | - | ✓ | - | - |
anyscale/mistralai/Mixtral-8x7B-Instruct-v0.1 | anyscale | chat | $0.15 | $0.15 | 16,384 | - | ✓ | - | - |
anyscale/mistralai/Mixtral-8x22B-Instruct-v0.1 | anyscale | chat | $0.90 | $0.90 | 65,536 | - | ✓ | - | - |
anyscale/HuggingFaceH4/zephyr-7b-beta | anyscale | chat | $0.15 | $0.15 | 16,384 | - | - | - | - |
anyscale/google/gemma-7b-it | anyscale | chat | $0.15 | $0.15 | 8,192 | - | - | - | - |
anyscale/meta-llama/Llama-2-7b-chat-hf | anyscale | chat | $0.15 | $0.15 | 4,096 | - | - | - | - |
anyscale/meta-llama/Llama-2-13b-chat-hf | anyscale | chat | $0.25 | $0.25 | 4,096 | - | - | - | - |
anyscale/meta-llama/Llama-2-70b-chat-hf | anyscale | chat | $1.00 | $1.00 | 4,096 | - | - | - | - |
anyscale/codellama/CodeLlama-34b-Instruct-hf | anyscale | chat | $1.00 | $1.00 | 4,096 | - | - | - | - |
anyscale/codellama/CodeLlama-70b-Instruct-hf | anyscale | chat | $1.00 | $1.00 | 4,096 | - | - | - | - |
anyscale/meta-llama/Meta-Llama-3-8B-Instruct | anyscale | chat | $0.15 | $0.15 | 8,192 | - | - | - | - |
anyscale/meta-llama/Meta-Llama-3-70B-Instruct | anyscale | chat | $1.00 | $1.00 | 8,192 | - | - | - | - |
cloudflare/@cf/meta/llama-2-7b-chat-fp16 | cloudflare | chat | $1.923 | $1.923 | 3,072 | - | - | - | - |
cloudflare/@cf/meta/llama-2-7b-chat-int8 | cloudflare | chat | $1.923 | $1.923 | 2,048 | - | - | - | - |
cloudflare/@cf/mistral/mistral-7b-instruct-v0.1 | cloudflare | chat | $1.923 | $1.923 | 8,192 | - | - | - | - |
cloudflare/@hf/thebloke/codellama-7b-instruct-awq | cloudflare | chat | $1.923 | $1.923 | 4,096 | - | - | - | - |
v0/v0-1.0-md | v0 | chat | $3.00 | $15.00 | 128,000 | ✓ | ✓ | - | - |
v0/v0-1.5-md | v0 | chat | $3.00 | $15.00 | 128,000 | ✓ | ✓ | - | - |
v0/v0-1.5-lg | v0 | chat | $15.00 | $75.00 | 512,000 | ✓ | ✓ | - | - |
lambda_ai/deepseek-llama3.3-70b | lambda_ai | chat | $0.20 | $0.60 | 131,072 | - | ✓ | - | - |
lambda_ai/deepseek-r1-0528 | lambda_ai | chat | $0.20 | $0.60 | 131,072 | - | ✓ | - | - |
lambda_ai/deepseek-r1-671b | lambda_ai | chat | $0.80 | $0.80 | 131,072 | - | ✓ | - | - |
lambda_ai/deepseek-v3-0324 | lambda_ai | chat | $0.20 | $0.60 | 131,072 | - | ✓ | - | - |
lambda_ai/hermes3-405b | lambda_ai | chat | $0.80 | $0.80 | 131,072 | - | ✓ | - | - |
lambda_ai/hermes3-70b | lambda_ai | chat | $0.12 | $0.30 | 131,072 | - | ✓ | - | - |
lambda_ai/hermes3-8b | lambda_ai | chat | $0.025 | $0.04 | 131,072 | - | ✓ | - | - |
lambda_ai/lfm-40b | lambda_ai | chat | $0.10 | $0.20 | 131,072 | - | ✓ | - | - |
lambda_ai/lfm-7b | lambda_ai | chat | $0.025 | $0.04 | 131,072 | - | ✓ | - | - |
lambda_ai/llama-4-maverick-17b-128e-instruct-fp8 | lambda_ai | chat | $0.05 | $0.10 | 131,072 | - | ✓ | - | - |
lambda_ai/llama-4-scout-17b-16e-instruct | lambda_ai | chat | $0.05 | $0.10 | 16,384 | - | ✓ | - | - |
lambda_ai/llama3.1-405b-instruct-fp8 | lambda_ai | chat | $0.80 | $0.80 | 131,072 | - | ✓ | - | - |
lambda_ai/llama3.1-70b-instruct-fp8 | lambda_ai | chat | $0.12 | $0.30 | 131,072 | - | ✓ | - | - |
lambda_ai/llama3.1-8b-instruct | lambda_ai | chat | $0.025 | $0.04 | 131,072 | - | ✓ | - | - |
lambda_ai/llama3.1-nemotron-70b-instruct-fp8 | lambda_ai | chat | $0.12 | $0.30 | 131,072 | - | ✓ | - | - |
lambda_ai/llama3.2-11b-vision-instruct | lambda_ai | chat | $0.015 | $0.025 | 131,072 | ✓ | ✓ | - | - |
lambda_ai/llama3.2-3b-instruct | lambda_ai | chat | $0.015 | $0.025 | 131,072 | - | ✓ | - | - |
lambda_ai/llama3.3-70b-instruct-fp8 | lambda_ai | chat | $0.12 | $0.30 | 131,072 | - | ✓ | - | - |
lambda_ai/qwen25-coder-32b-instruct | lambda_ai | chat | $0.05 | $0.10 | 131,072 | - | ✓ | - | - |
lambda_ai/qwen3-32b-fp8 | lambda_ai | chat | $0.05 | $0.10 | 131,072 | - | ✓ | - | - |
hyperbolic/moonshotai/Kimi-K2-Instruct | hyperbolic | chat | $2.00 | $2.00 | 131,072 | - | ✓ | - | - |
hyperbolic/deepseek-ai/DeepSeek-R1-0528 | hyperbolic | chat | $0.25 | $0.25 | 131,072 | - | ✓ | - | - |
hyperbolic/Qwen/Qwen3-235B-A22B | hyperbolic | chat | $2.00 | $2.00 | 131,072 | - | ✓ | - | - |
hyperbolic/deepseek-ai/DeepSeek-V3-0324 | hyperbolic | chat | $0.40 | $0.40 | 32,768 | - | ✓ | - | - |
hyperbolic/Qwen/QwQ-32B | hyperbolic | chat | $0.20 | $0.20 | 131,072 | - | ✓ | - | - |
hyperbolic/deepseek-ai/DeepSeek-R1 | hyperbolic | chat | $0.40 | $0.40 | 32,768 | - | ✓ | - | - |
hyperbolic/deepseek-ai/DeepSeek-V3 | hyperbolic | chat | $0.20 | $0.20 | 32,768 | - | ✓ | - | - |
hyperbolic/meta-llama/Llama-3.3-70B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 131,072 | - | ✓ | - | - |
hyperbolic/Qwen/Qwen2.5-Coder-32B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 32,768 | - | ✓ | - | - |
hyperbolic/meta-llama/Llama-3.2-3B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 32,768 | - | ✓ | - | - |
hyperbolic/Qwen/Qwen2.5-72B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 131,072 | - | ✓ | - | - |
hyperbolic/meta-llama/Meta-Llama-3-70B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 131,072 | - | ✓ | - | - |
hyperbolic/NousResearch/Hermes-3-Llama-3.1-70B | hyperbolic | chat | $0.12 | $0.30 | 32,768 | - | ✓ | - | - |
hyperbolic/meta-llama/Meta-Llama-3.1-405B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 32,768 | - | ✓ | - | - |
hyperbolic/meta-llama/Meta-Llama-3.1-8B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 32,768 | - | ✓ | - | - |
hyperbolic/meta-llama/Meta-Llama-3.1-70B-Instruct | hyperbolic | chat | $0.12 | $0.30 | 32,768 | - | ✓ | - | - |
voyage/voyage-lite-01 | voyage | embedding | $0.10 | - | 4,096 | - | - | - | - |
voyage/voyage-large-2 | voyage | embedding | $0.12 | - | 16,000 | - | - | - | - |
voyage/voyage-finance-2 | voyage | embedding | $0.12 | - | 32,000 | - | - | - | - |
voyage/voyage-lite-02-instruct | voyage | embedding | $0.10 | - | 4,000 | - | - | - | - |
voyage/voyage-law-2 | voyage | embedding | $0.12 | - | 16,000 | - | - | - | - |
voyage/voyage-code-2 | voyage | embedding | $0.12 | - | 16,000 | - | - | - | - |
voyage/voyage-2 | voyage | embedding | $0.10 | - | 4,000 | - | - | - | - |
voyage/voyage-3-large | voyage | embedding | $0.18 | - | 32,000 | - | - | - | - |
voyage/voyage-3 | voyage | embedding | $0.06 | - | 32,000 | - | - | - | - |
voyage/voyage-3-lite | voyage | embedding | $0.02 | - | 32,000 | - | - | - | - |
voyage/voyage-code-3 | voyage | embedding | $0.18 | - | 32,000 | - | - | - | - |
voyage/voyage-multimodal-3 | voyage | embedding | $0.12 | - | 32,000 | - | - | - | - |
voyage/voyage-context-3 | voyage | embedding | $0.18 | - | 120,000 | - | - | - | - |
voyage/rerank-2 | voyage | rerank | $0.05 | - | 16,000 | - | - | - | - |
voyage/rerank-2-lite | voyage | rerank | $0.02 | - | 8,000 | - | - | - | - |
databricks/databricks-claude-3-7-sonnet | databricks | chat | $2.50 | $17.857 | 200,000 | - | ✓ | - | - |
databricks/databricks-meta-llama-3-1-405b-instruct | databricks | chat | $5.00 | $15.00002 | 128,000 | - | - | - | - |
databricks/databricks-meta-llama-3-3-70b-instruct | databricks | chat | $1.00002 | $2.99999 | 128,000 | - | - | - | - |
databricks/databricks-llama-4-maverick | databricks | chat | $5.00 | $15.00 | 128,000 | - | - | - | - |
databricks/databricks-meta-llama-3-70b-instruct | databricks | chat | $1.00002 | $2.99999 | 128,000 | - | - | - | - |
databricks/databricks-llama-2-70b-chat | databricks | chat | $0.50001 | $1.50 | 4,096 | - | - | - | - |
databricks/databricks-mixtral-8x7b-instruct | databricks | chat | $0.50001 | $0.99902 | 4,096 | - | - | - | - |
databricks/databricks-mpt-30b-instruct | databricks | chat | $0.99902 | $0.99902 | 8,192 | - | - | - | - |
databricks/databricks-mpt-7b-instruct | databricks | chat | $0.50001 | - | 8,192 | - | - | - | - |
databricks/databricks-bge-large-en | databricks | embedding | $0.10003 | - | 512 | - | - | - | - |
databricks/databricks-gte-large-en | databricks | embedding | $0.12999 | - | 8,192 | - | - | - | - |
sambanova/Meta-Llama-3.1-8B-Instruct | sambanova | chat | $0.10 | $0.20 | 16,384 | - | ✓ | - | - |
sambanova/Meta-Llama-3.1-405B-Instruct | sambanova | chat | $5.00 | $10.00 | 16,384 | - | ✓ | - | - |
sambanova/Meta-Llama-3.2-1B-Instruct | sambanova | chat | $0.04 | $0.08 | 16,384 | - | - | - | - |
sambanova/Meta-Llama-3.2-3B-Instruct | sambanova | chat | $0.08 | $0.16 | 4,096 | - | - | - | - |
sambanova/Llama-4-Maverick-17B-128E-Instruct | sambanova | chat | $0.63 | $1.80 | 131,072 | ✓ | ✓ | - | - |
sambanova/Llama-4-Scout-17B-16E-Instruct | sambanova | chat | $0.40 | $0.70 | 8,192 | - | ✓ | - | - |
sambanova/Meta-Llama-3.3-70B-Instruct | sambanova | chat | $0.60 | $1.20 | 131,072 | - | ✓ | - | - |
sambanova/Meta-Llama-Guard-3-8B | sambanova | chat | $0.30 | $0.30 | 16,384 | - | - | - | - |
sambanova/Qwen3-32B | sambanova | chat | $0.40 | $0.80 | 8,192 | - | ✓ | - | - |
sambanova/QwQ-32B | sambanova | chat | $0.50 | $1.00 | 16,384 | - | - | - | - |
sambanova/Qwen2-Audio-7B-Instruct | sambanova | chat | $0.50 | $100.00 | 4,096 | - | - | - | - |
sambanova/DeepSeek-R1-Distill-Llama-70B | sambanova | chat | $0.70 | $1.40 | 131,072 | - | - | - | - |
sambanova/DeepSeek-R1 | sambanova | chat | $5.00 | $7.00 | 32,768 | - | - | - | - |
sambanova/DeepSeek-V3-0324 | sambanova | chat | $3.00 | $4.50 | 32,768 | - | ✓ | - | - |
assemblyai/nano | assemblyai | audio_transcription | - | - | - | - | - | - | - |
assemblyai/best | assemblyai | audio_transcription | - | - | - | - | - | - | - |
jina-reranker-v2-base-multilingual | jina_ai | rerank | $0.018 | $0.018 | 1,024 | - | - | - | - |
snowflake/deepseek-r1 | snowflake | chat | - | - | 32,768 | - | - | - | - |
snowflake/snowflake-arctic | snowflake | chat | - | - | 4,096 | - | - | - | - |
snowflake/claude-3-5-sonnet | snowflake | chat | - | - | 18,000 | - | - | - | - |
snowflake/mistral-large | snowflake | chat | - | - | 32,000 | - | - | - | - |
snowflake/mistral-large2 | snowflake | chat | - | - | 128,000 | - | - | - | - |
snowflake/reka-flash | snowflake | chat | - | - | 100,000 | - | - | - | - |
snowflake/reka-core | snowflake | chat | - | - | 32,000 | - | - | - | - |
snowflake/jamba-instruct | snowflake | chat | - | - | 256,000 | - | - | - | - |
snowflake/jamba-1.5-mini | snowflake | chat | - | - | 256,000 | - | - | - | - |
snowflake/jamba-1.5-large | snowflake | chat | - | - | 256,000 | - | - | - | - |
snowflake/mixtral-8x7b | snowflake | chat | - | - | 32,000 | - | - | - | - |
snowflake/llama2-70b-chat | snowflake | chat | - | - | 4,096 | - | - | - | - |
snowflake/llama3-8b | snowflake | chat | - | - | 8,000 | - | - | - | - |
snowflake/llama3-70b | snowflake | chat | - | - | 8,000 | - | - | - | - |
snowflake/llama3.1-8b | snowflake | chat | - | - | 128,000 | - | - | - | - |
snowflake/llama3.1-70b | snowflake | chat | - | - | 128,000 | - | - | - | - |
snowflake/llama3.3-70b | snowflake | chat | - | - | 128,000 | - | - | - | - |
snowflake/snowflake-llama-3.3-70b | snowflake | chat | - | - | 8,000 | - | - | - | - |
snowflake/llama3.1-405b | snowflake | chat | - | - | 128,000 | - | - | - | - |
snowflake/snowflake-llama-3.1-405b | snowflake | chat | - | - | 8,000 | - | - | - | - |
snowflake/llama3.2-1b | snowflake | chat | - | - | 128,000 | - | - | - | - |
snowflake/llama3.2-3b | snowflake | chat | - | - | 128,000 | - | - | - | - |
snowflake/mistral-7b | snowflake | chat | - | - | 32,000 | - | - | - | - |
snowflake/gemma-7b | snowflake | chat | - | - | 8,000 | - | - | - | - |
gradient_ai/anthropic-claude-3.7-sonnet | gradient_ai | chat | $3.00 | $15.00 | 1,024 | - | - | - | - |
gradient_ai/anthropic-claude-3.5-sonnet | gradient_ai | chat | $3.00 | $15.00 | 1,024 | - | - | - | - |
gradient_ai/anthropic-claude-3.5-haiku | gradient_ai | chat | $0.80 | $4.00 | 1,024 | - | - | - | - |
gradient_ai/anthropic-claude-3-opus | gradient_ai | chat | $15.00 | $75.00 | 1,024 | - | - | - | - |
gradient_ai/deepseek-r1-distill-llama-70b | gradient_ai | chat | $0.99 | $0.99 | 8,000 | - | - | - | - |
gradient_ai/llama3.3-70b-instruct | gradient_ai | chat | $0.65 | $0.65 | 2,048 | - | - | - | - |
gradient_ai/llama3-8b-instruct | gradient_ai | chat | $0.20 | $0.20 | 512 | - | - | - | - |
gradient_ai/mistral-nemo-instruct-2407 | gradient_ai | chat | $0.30 | $0.30 | 512 | - | - | - | - |
gradient_ai/openai-o3 | gradient_ai | chat | $2.00 | $8.00 | 100,000 | - | - | - | - |
gradient_ai/openai-o3-mini | gradient_ai | chat | $1.10 | $4.40 | 100,000 | - | - | - | - |
gradient_ai/openai-gpt-4o | gradient_ai | chat | - | - | 16,384 | - | - | - | - |
gradient_ai/openai-gpt-4o-mini | gradient_ai | chat | - | - | 16,384 | - | - | - | - |
gradient_ai/alibaba-qwen3-32b | gradient_ai | chat | - | - | 2,048 | - | - | - | - |
nscale/meta-llama/Llama-4-Scout-17B-16E-Instruct | nscale | chat | $0.09 | $0.29 | - | - | - | - | - |
nscale/Qwen/Qwen2.5-Coder-3B-Instruct | nscale | chat | $0.01 | $0.03 | - | - | - | - | - |
nscale/Qwen/Qwen2.5-Coder-7B-Instruct | nscale | chat | $0.01 | $0.03 | - | - | - | - | - |
nscale/Qwen/Qwen2.5-Coder-32B-Instruct | nscale | chat | $0.06 | $0.20 | - | - | - | - | - |
nscale/Qwen/QwQ-32B | nscale | chat | $0.18 | $0.20 | - | - | - | - | - |
nscale/deepseek-ai/DeepSeek-R1-Distill-Llama-70B | nscale | chat | $0.375 | $0.375 | - | - | - | - | - |
nscale/deepseek-ai/DeepSeek-R1-Distill-Llama-8B | nscale | chat | $0.025 | $0.025 | - | - | - | - | - |
nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-1.5B | nscale | chat | $0.09 | $0.09 | - | - | - | - | - |
nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B | nscale | chat | $0.20 | $0.20 | - | - | - | - | - |
nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B | nscale | chat | $0.07 | $0.07 | - | - | - | - | - |
nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B | nscale | chat | $0.15 | $0.15 | - | - | - | - | - |
nscale/mistralai/mixtral-8x22b-instruct-v0.1 | nscale | chat | $0.60 | $0.60 | - | - | - | - | - |
nscale/meta-llama/Llama-3.1-8B-Instruct | nscale | chat | $0.03 | $0.03 | - | - | - | - | - |
nscale/meta-llama/Llama-3.3-70B-Instruct | nscale | chat | $0.20 | $0.20 | - | - | - | - | - |
nscale/black-forest-labs/FLUX.1-schnell | nscale | image_generation | - | - | - | - | - | - | - |
nscale/stabilityai/stable-diffusion-xl-base-1.0 | nscale | image_generation | - | - | - | - | - | - | - |
featherless_ai/featherless-ai/Qwerky-72B | featherless_ai | chat | - | - | 32,768 | - | - | - | - |
featherless_ai/featherless-ai/Qwerky-QwQ-32B | featherless_ai | chat | - | - | 32,768 | - | - | - | - |
deepgram/nova-3 | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-3-general | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-3-medical | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2 | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-general | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-meeting | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-phonecall | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-voicemail | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-finance | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-conversationalai | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-video | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-drivethru | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-automotive | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-2-atc | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-general | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/nova-phonecall | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/enhanced | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/enhanced-general | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/enhanced-meeting | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/enhanced-phonecall | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/enhanced-finance | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base-general | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base-meeting | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base-phonecall | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base-voicemail | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base-finance | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base-conversationalai | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/base-video | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/whisper | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/whisper-tiny | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/whisper-base | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/whisper-small | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/whisper-medium | deepgram | audio_transcription | - | - | - | - | - | - | - |
deepgram/whisper-large | deepgram | audio_transcription | - | - | - | - | - | - | - |
elevenlabs/scribe_v1 | elevenlabs | audio_transcription | - | - | - | - | - | - | - |
elevenlabs/scribe_v1_experimental | elevenlabs | audio_transcription | - | - | - | - | - | - | - |
bedrock/us-gov-east-1/amazon.titan-embed-text-v1 | bedrock | embedding | $0.10 | - | 8,192 | - | - | - | - |
bedrock/us-gov-east-1/amazon.titan-embed-text-v2:0 | bedrock | embedding | $0.20 | - | 8,192 | - | - | - | - |
bedrock/us-gov-east-1/amazon.titan-text-express-v1 | bedrock | chat | $1.30 | $1.70 | 8,000 | - | - | - | - |
bedrock/us-gov-east-1/amazon.titan-text-lite-v1 | bedrock | chat | $0.30 | $0.40 | 4,000 | - | - | - | - |
bedrock/us-gov-east-1/amazon.titan-text-premier-v1:0 | bedrock | chat | $0.50 | $1.50 | 32,000 | - | - | - | - |
bedrock/us-gov-east-1/anthropic.claude-3-5-sonnet-20240620-v1:0 | bedrock | chat | $3.60 | $18.00 | 8,192 | ✓ | ✓ | - | - |
bedrock/us-gov-east-1/anthropic.claude-3-haiku-20240307-v1:0 | bedrock | chat | $0.30 | $1.50 | 4,096 | ✓ | ✓ | - | - |
bedrock/us-gov-east-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $2.65 | $3.50 | 2,048 | - | - | - | - |
bedrock/us-gov-east-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.30 | $2.65 | 2,048 | - | - | - | - |
bedrock/us-gov-west-1/amazon.titan-embed-text-v1 | bedrock | embedding | $0.10 | - | 8,192 | - | - | - | - |
bedrock/us-gov-west-1/amazon.titan-embed-text-v2:0 | bedrock | embedding | $0.20 | - | 8,192 | - | - | - | - |
bedrock/us-gov-west-1/amazon.titan-text-express-v1 | bedrock | chat | $1.30 | $1.70 | 8,000 | - | - | - | - |
bedrock/us-gov-west-1/amazon.titan-text-lite-v1 | bedrock | chat | $0.30 | $0.40 | 4,000 | - | - | - | - |
bedrock/us-gov-west-1/amazon.titan-text-premier-v1:0 | bedrock | chat | $0.50 | $1.50 | 32,000 | - | - | - | - |
bedrock/us-gov-west-1/anthropic.claude-3-5-sonnet-20240620-v1:0 | bedrock | chat | $3.60 | $18.00 | 8,192 | ✓ | ✓ | - | - |
bedrock/us-gov-west-1/anthropic.claude-3-haiku-20240307-v1:0 | bedrock | chat | $0.30 | $1.50 | 4,096 | ✓ | ✓ | - | - |
bedrock/us-gov-west-1/meta.llama3-70b-instruct-v1:0 | bedrock | chat | $2.65 | $3.50 | 2,048 | - | - | - | - |
bedrock/us-gov-west-1/meta.llama3-8b-instruct-v1:0 | bedrock | chat | $0.30 | $2.65 | 2,048 | - | - | - | - |
bedrock/us-gov-east-1/amazon.nova-pro-v1:0 | bedrock | chat | $0.96 | $3.84 | 10,000 | ✓ | ✓ | ✓ | - |
bedrock/us-gov-west-1/amazon.nova-pro-v1:0 | bedrock | chat | $0.96 | $3.84 | 10,000 | ✓ | ✓ | ✓ | - |
dashscope/qwen-max | dashscope | chat | - | - | 32,768 | - | ✓ | - | - |
dashscope/qwen-plus-latest | dashscope | chat | - | - | 131,072 | - | ✓ | - | - |
dashscope/qwen-turbo-latest | dashscope | chat | - | - | 131,072 | - | ✓ | - | - |
dashscope/qwen3-30b-a3b | dashscope | chat | - | - | 131,072 | - | ✓ | - | - |
moonshot/moonshot-v1-8k | moonshot | chat | $0.20 | $2.00 | 8,192 | - | ✓ | - | - |
moonshot/moonshot-v1-32k | moonshot | chat | $1.00 | $3.00 | 32,768 | - | ✓ | - | - |
moonshot/moonshot-v1-128k | moonshot | chat | $2.00 | $5.00 | 131,072 | - | ✓ | - | - |
moonshot/moonshot-v1-auto | moonshot | chat | $2.00 | $5.00 | 131,072 | - | ✓ | - | - |
moonshot/kimi-k2-0711-preview | moonshot | chat | $0.60 | $2.50 | 131,072 | - | ✓ | - | - |
moonshot/moonshot-v1-32k-0430 | moonshot | chat | $1.00 | $3.00 | 32,768 | - | ✓ | - | - |
moonshot/moonshot-v1-128k-0430 | moonshot | chat | $2.00 | $5.00 | 131,072 | - | ✓ | - | - |
moonshot/moonshot-v1-8k-0430 | moonshot | chat | $0.20 | $2.00 | 8,192 | - | ✓ | - | - |
moonshot/kimi-latest | moonshot | chat | $2.00 | $5.00 | 131,072 | ✓ | ✓ | - | - |
moonshot/kimi-latest-8k | moonshot | chat | $0.20 | $2.00 | 8,192 | ✓ | ✓ | - | - |
moonshot/kimi-latest-32k | moonshot | chat | $1.00 | $3.00 | 32,768 | ✓ | ✓ | - | - |
moonshot/kimi-latest-128k | moonshot | chat | $2.00 | $5.00 | 131,072 | ✓ | ✓ | - | - |
moonshot/kimi-thinking-preview | moonshot | chat | $30.00 | $30.00 | 131,072 | ✓ | - | - | - |
moonshot/moonshot-v1-8k-vision-preview | moonshot | chat | $0.20 | $2.00 | 8,192 | ✓ | ✓ | - | - |
moonshot/moonshot-v1-32k-vision-preview | moonshot | chat | $1.00 | $3.00 | 32,768 | ✓ | ✓ | - | - |
moonshot/moonshot-v1-128k-vision-preview | moonshot | chat | $2.00 | $5.00 | 131,072 | ✓ | ✓ | - | - |
recraft/recraftv3 | recraft | image_generation | - | - | - | - | - | - | - |
recraft/recraftv2 | recraft | image_generation | - | - | - | - | - | - | - |
morph/morph-v3-fast | morph | chat | $0.80 | $1.20 | 16,000 | - | - | - | - |
morph/morph-v3-large | morph | chat | $0.90 | $1.90 | 16,000 | - | - | - | - |
oci/meta.llama-4-maverick-17b-128e-instruct-fp8 | oci | chat | $0.72 | $0.72 | 512,000 | - | ✓ | - | - |
oci/meta.llama-4-scout-17b-16e-instruct | oci | chat | $0.72 | $0.72 | 192,000 | - | ✓ | - | - |
oci/meta.llama-3.3-70b-instruct | oci | chat | $0.72 | $0.72 | 128,000 | - | ✓ | - | - |
oci/meta.llama-3.2-90b-vision-instruct | oci | chat | $2.00 | $2.00 | 128,000 | - | ✓ | - | - |
oci/meta.llama-3.1-405b-instruct | oci | chat | $10.68 | $10.68 | 128,000 | - | ✓ | - | - |
oci/xai.grok-4 | oci | chat | $3.00 | $0.15 | 128,000 | - | ✓ | - | - |
oci/xai.grok-3 | oci | chat | $3.00 | $0.15 | 131,072 | - | ✓ | - | - |
oci/xai.grok-3-mini | oci | chat | $0.30 | $0.50 | 131,072 | - | ✓ | - | - |
oci/xai.grok-3-fast | oci | chat | $5.00 | $25.00 | 131,072 | - | ✓ | - | - |
oci/xai.grok-3-mini-fast | oci | chat | $0.60 | $4.00 | 131,072 | - | ✓ | - | - |
aiml/flux/kontext-pro/text-to-image | aiml | image_generation | - | - | - | - | - | - | - |
aiml/flux/kontext-max/text-to-image | aiml | image_generation | - | - | - | - | - | - | - |
aiml/flux-pro/v1.1-ultra | aiml | image_generation | - | - | - | - | - | - | - |
aiml/flux-pro/v1.1 | aiml | image_generation | - | - | - | - | - | - | - |
aiml/flux-realism | aiml | image_generation | - | - | - | - | - | - | - |
aiml/flux/schnell | aiml | image_generation | - | - | - | - | - | - | - |
aiml/flux/dev | aiml | image_generation | - | - | - | - | - | - | - |
aiml/flux-pro | aiml | image_generation | - | - | - | - | - | - | - |
aiml/dall-e-3 | aiml | image_generation | - | - | - | - | - | - | - |
aiml/dall-e-2 | aiml | image_generation | - | - | - | - | - | - | - |