D
DeepInfra
197 models available
197 models
Provider | Model ID | Input $/M | Output $/M | Cache Read $/M | Cache Write $/M | Features | Verified | Updated | |
|---|---|---|---|---|---|---|---|---|---|
allenai/Olmo-3.1-32B-Instruct | $0.20 | $0.60 | — | — | — | — | 5d ago | ||
allenai/olmOCR-2-7B-1025 | $0.09 | $0.19 | — | — | — | — | 1mo ago | ||
anthropic/claude-3-7-sonnet-latest | $3.30 | $16.50 | $0.33 | — | — | — | 1mo ago | ||
anthropic/claude-4-opus | $16.50 | $82.50 | — | — | — | — | 5d ago | ||
anthropic/claude-4-sonnet | $3.30 | $16.50 | — | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-OCR | $0.03 | $0.10 | — | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-R1-0528 | $0.50 | $2.15 | $0.40 | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-R1-0528-Turbo | $1.00 | $3.00 | — | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-R1-Distill-Llama-70B | $0.70 | $0.80 | — | — | — | — | 5d ago | ||
deepseek-ai/DeepSeek-V3 | $0.32 | $0.89 | — | — | — | — | 5d ago | ||
deepseek-ai/DeepSeek-V3-0324 | $0.20 | $0.77 | $0.11 | — | — | — | 5d ago | ||
deepseek-ai/DeepSeek-V3.1 | $0.21 | $0.79 | $0.17 | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-V3.1-Terminus | $0.21 | $0.79 | $0.17 | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-V3.2 | $0.26 | $0.38 | $0.13 | — | — | — | 5d ago | ||
google/gemini-1.5-flash | $0.07 | $0.30 | — | — | — | — | 1mo ago | ||
google/gemini-1.5-flash-8b | $0.04 | $0.15 | — | — | — | — | 1mo ago | ||
google/gemini-2.0-flash-001 | $0.10 | $0.40 | — | — | — | — | 1mo ago | ||
google/gemini-2.5-flash | $0.30 | $2.50 | — | — | — | — | 1mo ago | ||
google/gemini-2.5-pro | $1.25 | $10.00 | — | — | — | — | 1mo ago | ||
google/gemma-3-12b-it | $0.04 | $0.13 | — | — | — | — | 1mo ago | ||
google/gemma-3-27b-it | $0.08 | $0.16 | — | — | — | — | 5d ago | ||
google/gemma-3-4b-it | $0.04 | $0.08 | — | — | — | — | 1mo ago | ||
Gryphe/MythoMax-L2-13b | $0.40 | $0.40 | — | — | — | — | 5d ago | ||
lizpreciatior/lzlv_70b_fp16_hf | $0.35 | $0.40 | — | — | — | — | 1mo ago | ||
meta-llama/Llama-3.2-11B-Vision-Instruct | $0.05 | $0.05 | — | — | — | — | 1mo ago | ||
meta-llama/Llama-3.2-3B-Instruct | $0.02 | $0.02 | — | — | — | — | 1mo ago | ||
meta-llama/Llama-3.3-70B-Instruct-Turbo | $0.10 | $0.32 | — | — | — | — | 5d ago | ||
meta-llama/Llama-4-Maverick-17B-128E-Instruct-FP8 | $0.15 | $0.60 | — | — | — | — | 1mo ago | ||
meta-llama/Llama-4-Scout-17B-16E-Instruct | $0.08 | $0.30 | — | — | — | — | 1mo ago | ||
meta-llama/Llama-Guard-4-12B | $0.18 | $0.18 | — | — | — | — | 1mo ago | ||
meta-llama/Meta-Llama-3-70B-Instruct | $0.23 | $0.40 | — | — | — | — | 1mo ago | ||
meta-llama/Meta-Llama-3-8B-Instruct | $0.03 | $0.04 | — | — | — | — | 5d ago | ||
meta-llama/Meta-Llama-3.1-405B-Instruct | $0.09 | $0.09 | — | — | — | — | 1mo ago | ||
meta-llama/Meta-Llama-3.1-70B-Instruct | $0.40 | $0.40 | — | — | — | — | 1mo ago | ||
meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo | $0.40 | $0.40 | — | — | — | — | 1mo ago | ||
meta-llama/Meta-Llama-3.1-8B-Instruct | $0.02 | $0.05 | — | — | — | — | 5d ago | ||
meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo | $0.02 | $0.03 | — | — | — | — | 1mo ago | ||
meta-llama/Meta-Llama-3.3-70B-Instruct | $0.23 | $0.04 | — | — | — | — | 1mo ago | ||
meta-llama/Meta-Llama-3.3-70B-Instruct-Turbo | $0.12 | $0.03 | — | — | — | — | 1mo ago | ||
microsoft/phi-4 | $0.07 | $0.14 | — | — | — | — | 1mo ago | ||
microsoft/WizardLM-2-7B | $0.06 | $0.06 | — | — | — | — | 1mo ago | ||
microsoft/WizardLM-2-8x22B | $0.48 | $0.48 | — | — | — | — | 1mo ago | ||
MiniMaxAI/MiniMax-M2 | $0.27 | $1.15 | — | — | — | — | 1mo ago | ||
MiniMaxAI/MiniMax-M2.1 | $0.27 | $0.95 | $0.03 | — | — | — | 5d ago | ||
mistralai/Mistral-7B-Instruct-v0.3 | $0.03 | $0.06 | — | — | — | — | 1mo ago | ||
mistralai/Mistral-Nemo-Instruct-2407 | $0.02 | $0.04 | — | — | — | — | 1mo ago | ||
mistralai/Mistral-Small-24B-Instruct-2501 | $0.05 | $0.08 | — | — | — | — | 1mo ago | ||
mistralai/Mistral-Small-3.2-24B-Instruct-2506 | $0.07 | $0.20 | — | — | — | — | 1mo ago | ||
mistralai/Mixtral-8x7B-Instruct-v0.1 | $0.54 | $0.54 | — | — | — | — | 1mo ago | ||
moonshotai/Kimi-K2-Instruct-0905 | $0.40 | $2.00 | $0.40 | — | — | — | 5d ago | ||
moonshotai/Kimi-K2-Thinking | $0.47 | $2.00 | $0.14 | — | — | — | 1mo ago | ||
moonshotai/Kimi-K2.5 | $0.45 | $2.25 | $0.07 | — | — | — | 5d ago | ||
NousResearch/Hermes-3-Llama-3.1-405B | $1.00 | $1.00 | — | — | — | — | 1mo ago | ||
NousResearch/Hermes-3-Llama-3.1-70B | $0.30 | $0.30 | — | — | — | — | 1mo ago | ||
nvidia/Llama-3.1-Nemotron-70B-Instruct | $1.20 | $1.20 | — | — | — | — | 1mo ago | ||
nvidia/Llama-3.3-Nemotron-Super-49B-v1.5 | $0.10 | $0.40 | — | — | — | — | 1mo ago | ||
nvidia/Nemotron-3-Nano-30B-A3B | $0.05 | $0.20 | — | — | — | — | 5d ago | ||
nvidia/NVIDIA-Nemotron-Nano-12B-v2-VL | $0.20 | $0.60 | — | — | — | — | 1mo ago | ||
nvidia/NVIDIA-Nemotron-Nano-9B-v2 | $0.04 | $0.16 | — | — | — | — | 1mo ago | ||
openai/gpt-oss-120b | $0.04 | $0.19 | — | — | — | — | 1mo ago | ||
openai/gpt-oss-120b-Turbo | $0.15 | $0.60 | — | — | — | — | 1mo ago | ||
openai/gpt-oss-20b | $0.03 | $0.14 | — | — | — | — | 1mo ago | ||
openchat/openchat_3.5 | $0.06 | $0.06 | — | — | — | — | 1mo ago | ||
PaddlePaddle/PaddleOCR-VL-0.9B | $0.14 | $0.80 | — | — | — | — | 1mo ago | ||
Qwen/Qwen2.5-72B-Instruct | $0.12 | $0.39 | — | — | — | — | 1mo ago | ||
Qwen/Qwen2.5-VL-32B-Instruct | $0.20 | $0.60 | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-14B | $0.12 | $0.24 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-235B-A22B-Instruct-2507 | $0.07 | $0.10 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-235B-A22B-Thinking-2507 | $0.23 | $2.30 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-30B-A3B | $0.08 | $0.28 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-32B | $0.08 | $0.28 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-Coder-480B-A35B-Instruct | $0.40 | $1.60 | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Coder-480B-A35B-Instruct-Turbo | $0.22 | $1.00 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-Max | $1.20 | $6.00 | $0.24 | — | — | — | 5d ago | ||
Qwen/Qwen3-Max-Thinking | $1.20 | $6.00 | $0.24 | — | — | — | 5d ago | ||
Qwen/Qwen3-Next-80B-A3B-Instruct | $0.09 | $1.10 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-VL-235B-A22B-Instruct | $0.20 | $0.88 | — | — | — | — | 5d ago | ||
Qwen/Qwen3-VL-30B-A3B-Instruct | $0.15 | $0.60 | — | — | — | — | 1mo ago | ||
Sao10K/L3-8B-Lunaris-v1-Turbo | $0.04 | $0.05 | — | — | — | — | 1mo ago | ||
Sao10K/L3.1-70B-Euryale-v2.2 | $0.85 | $0.85 | — | — | — | — | 1mo ago | ||
Sao10K/L3.3-70B-Euryale-v2.3 | $0.85 | $0.85 | — | — | — | — | 1mo ago | ||
zai-org/GLM-4.6 | $0.43 | $1.74 | $0.08 | — | — | — | 5d ago | ||
zai-org/GLM-4.6V | $0.30 | $0.90 | — | — | — | — | 5d ago | ||
zai-org/GLM-4.7 | $0.40 | $1.75 | $0.08 | — | — | — | 5d ago | ||
zai-org/GLM-4.7-Flash | $0.06 | $0.40 | $0.01 | — | — | — | 5d ago | ||
zai-org/GLM-5 | $0.80 | $2.56 | $0.16 | — | — | — | 5d ago | ||
01-ai/Yi-34B-Chat | — | — | — | — | — | — | 1mo ago | ||
allenai/olmOCR-7B-0725-FP8 | — | — | — | — | — | — | 1mo ago | ||
Austism/chronos-hermes-13b-v2 | — | — | — | — | — | — | 1mo ago | ||
BAAI/bge-base-en-v1.5 | — | — | — | — | — | — | 1mo ago | ||
BAAI/bge-en-icl | — | — | — | — | — | — | 1mo ago | ||
BAAI/bge-large-en-v1.5 | — | — | — | — | — | — | 1mo ago | ||
BAAI/bge-m3 | — | — | — | — | — | — | 1mo ago | ||
BAAI/bge-m3-multi | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX-1-dev | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX-1-Redux-dev | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX-1-schnell | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX-1.1-pro | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX-2-dev | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX-2-klein-4b | — | — | — | — | — | — | 5d ago | ||
black-forest-labs/FLUX-2-klein-9b | — | — | — | — | — | — | 5d ago | ||
black-forest-labs/FLUX-2-pro | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX-pro | — | — | — | — | — | — | 1mo ago | ||
black-forest-labs/FLUX.1-Kontext-dev | — | — | — | — | — | — | 1mo ago | ||
bosonai/HiggsAudioV2.5 | — | — | — | — | — | — | 2w ago | ||
Bria/blur_background | — | — | — | — | — | — | 1mo ago | ||
Bria/Bria-3.2 | — | — | — | — | — | — | 1mo ago | ||
Bria/Bria-3.2-vector | — | — | — | — | — | — | 1mo ago | ||
Bria/enhance | — | — | — | — | — | — | 1mo ago | ||
Bria/erase | — | — | — | — | — | — | 1mo ago | ||
Bria/erase_foreground | — | — | — | — | — | — | 1mo ago | ||
Bria/expand | — | — | — | — | — | — | 1mo ago | ||
Bria/fibo | — | — | — | — | — | — | 1mo ago | ||
Bria/fibo_edit | — | — | — | — | — | — | 5d ago | ||
Bria/gen_fill | — | — | — | — | — | — | 1mo ago | ||
Bria/remove_background | — | — | — | — | — | — | 1mo ago | ||
Bria/replace_background | — | — | — | — | — | — | 1mo ago | ||
ByteDance/SeeDance-T2V | — | — | — | — | — | — | 1mo ago | ||
ByteDance/Seedream-4 | — | — | — | — | — | — | 1mo ago | ||
canopylabs/orpheus-3b-0.1-ft | — | — | — | — | — | — | 1mo ago | ||
codellama/CodeLlama-34b-Instruct-hf | — | — | — | — | — | — | 1mo ago | ||
codellama/CodeLlama-70b-Instruct-hf | — | — | — | — | — | — | 1mo ago | ||
cognitivecomputations/dolphin-2.6-mixtral-8x7b | — | — | — | — | — | — | 1mo ago | ||
deepinfra/airoboros-70b | — | — | — | — | — | — | 1mo ago | ||
DeepInfra/pygmalion-13b-4bit-128g | — | — | — | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-R1 | — | — | — | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-R1-Distill-Qwen-32B | — | — | — | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-R1-Turbo | — | — | — | — | — | — | 1mo ago | ||
deepseek-ai/DeepSeek-V3-0324-Turbo | — | — | — | — | — | — | 1mo ago | ||
deepseek-ai/Janus-Pro-1B | — | — | — | — | — | — | 1mo ago | ||
deepseek-ai/Janus-Pro-7B | — | — | — | — | — | — | 1mo ago | ||
EleutherAI/pythia-2.8b | — | — | — | — | — | — | 1mo ago | ||
google/embeddinggemma-300m | — | — | — | — | — | — | 1mo ago | ||
google/gemma-7b-it | — | — | — | — | — | — | 1mo ago | ||
hexgrad/Kokoro-82M | — | — | — | — | — | — | 1mo ago | ||
intfloat/e5-base-v2 | — | — | — | — | — | — | 1mo ago | ||
intfloat/e5-large-v2 | — | — | — | — | — | — | 1mo ago | ||
intfloat/multilingual-e5-large | — | — | — | — | — | — | 1mo ago | ||
intfloat/multilingual-e5-large-instruct | — | — | — | — | — | — | 1mo ago | ||
jondurbin/airoboros-l2-70b-gpt4-1.4.1 | — | — | — | — | — | — | 1mo ago | ||
llava-hf/llava-1.5-7b-hf | — | — | — | — | — | — | 1mo ago | ||
meta-llama/Llama-2-13b-chat-hf | — | — | — | — | — | — | 1mo ago | ||
meta-llama/Llama-2-70b-chat-hf | — | — | — | — | — | — | 1mo ago | ||
meta-llama/Llama-2-7b-chat-hf | — | — | — | — | — | — | 1mo ago | ||
meta-llama/Llama-3.2-90B-Vision-Instruct | — | — | — | — | — | — | 1mo ago | ||
meta-llama/Llama-3.3-70B-Instruct | — | — | — | — | — | — | 1mo ago | ||
meta-llama/Llama-4-Maverick-17B-128E-Instruct-Turbo | — | — | — | — | — | — | 1mo ago | ||
meta-llama/Llama-Guard-3-8B | — | — | — | — | — | — | 1mo ago | ||
mistralai/Devstral-Small-2507 | — | — | — | — | — | — | 1mo ago | ||
mistralai/Mistral-7B-Instruct-v0.1 | — | — | — | — | — | — | 1mo ago | ||
mistralai/Mistral-Small-3.1-24B-Instruct-2503 | — | — | — | — | — | — | 1mo ago | ||
mistralai/Voxtral-Mini-3B-2507 | — | — | — | — | — | — | 1mo ago | ||
mistralai/Voxtral-Small-24B-2507 | — | — | — | — | — | — | 1mo ago | ||
moonshotai/Kimi-K2-Instruct | — | — | — | — | — | — | 1mo ago | ||
openai/clip-vit-base-patch32 | — | — | — | — | — | — | 1mo ago | ||
openai/clip-vit-large-patch14-336 | — | — | — | — | — | — | 1mo ago | ||
openai/whisper-large-v3 | — | — | — | — | — | — | 1mo ago | ||
openai/whisper-large-v3-turbo | — | — | — | — | — | — | 1mo ago | ||
Phind/Phind-CodeLlama-34B-v2 | — | — | — | — | — | — | 1mo ago | ||
PrunaAI/p-image | — | — | — | — | — | — | 1mo ago | ||
PrunaAI/p-image-Edit | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen-Image-Edit | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen2.5-7B-Instruct | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen2.5-Coder-32B-Instruct | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-235B-A22B | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Embedding-0.6B | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Embedding-0.6B-batch | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Embedding-4B | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Embedding-4B-batch | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Embedding-8B | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Embedding-8B-batch | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Reranker-0.6B | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Reranker-4B | — | — | — | — | — | — | 1mo ago | ||
Qwen/Qwen3-Reranker-8B | — | — | — | — | — | — | 1mo ago | ||
Qwen/QwQ-32B | — | — | — | — | — | — | 1mo ago | ||
ResembleAI/chatterbox | — | — | — | — | — | — | 1mo ago | ||
ResembleAI/chatterbox-turbo | — | — | — | — | — | — | 2w ago | ||
sentence-transformers/all-MiniLM-L12-v2 | — | — | — | — | — | — | 1mo ago | ||
sentence-transformers/all-MiniLM-L6-v2 | — | — | — | — | — | — | 1mo ago | ||
sentence-transformers/all-mpnet-base-v2 | — | — | — | — | — | — | 1mo ago | ||
sentence-transformers/clip-ViT-B-32 | — | — | — | — | — | — | 1mo ago | ||
sentence-transformers/clip-ViT-B-32-multilingual-v1 | — | — | — | — | — | — | 1mo ago | ||
sentence-transformers/multi-qa-mpnet-base-dot-v1 | — | — | — | — | — | — | 1mo ago | ||
sentence-transformers/paraphrase-MiniLM-L6-v2 | — | — | — | — | — | — | 1mo ago | ||
sesame/csm-1b | — | — | — | — | — | — | 1mo ago | ||
shibing624/text2vec-base-chinese | — | — | — | — | — | — | 1mo ago | ||
stabilityai/sd3.5 | — | — | — | — | — | — | 1mo ago | ||
stabilityai/sd3.5-medium | — | — | — | — | — | — | 1mo ago | ||
stabilityai/sdxl-turbo | — | — | — | — | — | — | 1mo ago | ||
thenlper/gte-base | — | — | — | — | — | — | 1mo ago | ||
thenlper/gte-large | — | — | — | — | — | — | 1mo ago | ||
Wan-AI/Wan2.1-T2V-1.3B | — | — | — | — | — | — | 1mo ago | ||
Wan-AI/Wan2.1-T2V-14B | — | — | — | — | — | — | 1mo ago | ||
zai-org/GLM-4.5 | — | — | — | — | — | — | 1mo ago | ||
zai-org/GLM-4.5-Air | — | — | — | — | — | — | 1mo ago | ||
Zyphra/Zonos-v0.1-hybrid | — | — | — | — | — | — | 1mo ago | ||
Zyphra/Zonos-v0.1-transformer | — | — | — | — | — | — | 1mo ago |