nvidia
Models from nvidia
Models (87)
abacusai/dracarys-llama-3.1-70b-instruct
nvidia/abacusai/dracarys-llama-3.1-70b-instruct
Free
33K ctx
deepseek-ai/deepseek-coder-6.7b-instruct
nvidia/deepseek-ai/deepseek-coder-6.7b-instruct
Free
33K ctx
deepseek-ai/deepseek-v4-flash
nvidia/deepseek-ai/deepseek-v4-flash
$0.13/M
1M ctx
deepseek-ai/deepseek-v4-flash
nvidia/deepseek-ai/deepseek-v4-flash
$0.13/M
1M ctx
deepseek-ai/deepseek-v4-pro
nvidia/deepseek-ai/deepseek-v4-pro
$0.43/M
1M ctx
deepseek-ai/deepseek-v4-pro
nvidia/deepseek-ai/deepseek-v4-pro
$0.43/M
1M ctx
google/codegemma-1.1-7b
nvidia/google/codegemma-1.1-7b
Free
33K ctx
google/codegemma-7b
nvidia/google/codegemma-7b
Free
33K ctx
google/gemma-2-2b-it
nvidia/google/gemma-2-2b-it
Free
33K ctx
google/gemma-2b
nvidia/google/gemma-2b
Free
33K ctx
google/gemma-3-12b-it
nvidia/google/gemma-3-12b-it
$0.04/M
131K ctx
google/gemma-3-4b-it
nvidia/google/gemma-3-4b-it
$0.04/M
131K ctx
google/gemma-3n-e2b-it
nvidia/google/gemma-3n-e2b-it
Free
33K ctx
google/gemma-3n-e4b-it
nvidia/google/gemma-3n-e4b-it
$0.06/M
33K ctx
google/gemma-4-31b-it
nvidia/google/gemma-4-31b-it
$0.12/M
262K ctx
google/recurrentgemma-2b
nvidia/google/recurrentgemma-2b
Free
33K ctx
meta/codellama-70b
nvidia/meta/codellama-70b
Free
33K ctx
meta/llama-3.1-70b-instruct
nvidia/meta/llama-3.1-70b-instruct
$0.40/M
131K ctx
meta/llama-3.1-8b-instruct
nvidia/meta/llama-3.1-8b-instruct
$0.02/M
16K ctx
meta/llama-3.2-11b-vision-instruct
nvidia/meta/llama-3.2-11b-vision-instruct
$0.24/M
131K ctx
meta/llama-3.2-1b-instruct
nvidia/meta/llama-3.2-1b-instruct
$0.03/M
60K ctx
meta/llama-3.2-3b-instruct
nvidia/meta/llama-3.2-3b-instruct
$0.05/M
80K ctx
meta/llama-3.2-90b-vision-instruct
nvidia/meta/llama-3.2-90b-vision-instruct
Free
33K ctx
meta/llama-3.3-70b-instruct
nvidia/meta/llama-3.3-70b-instruct
$0.10/M
131K ctx
meta/llama-4-maverick-17b-128e-instruct
nvidia/meta/llama-4-maverick-17b-128e-instruct
Free
33K ctx
meta/llama-guard-4-12b
nvidia/meta/llama-guard-4-12b
$0.18/M
164K ctx
meta/llama2-70b
nvidia/meta/llama2-70b
Free
33K ctx
mistralai/codestral-22b-instruct-v0.1
nvidia/mistralai/codestral-22b-instruct-v0.1
Free
33K ctx
mistralai/ministral-14b-instruct-2512
nvidia/mistralai/ministral-14b-instruct-2512
Free
33K ctx
mistralai/mistral-7b-instruct-v0.3
nvidia/mistralai/mistral-7b-instruct-v0.3
Free
33K ctx
mistralai/mistral-large
nvidia/mistralai/mistral-large
$2.00/M
128K ctx
mistralai/mistral-large-2-instruct
nvidia/mistralai/mistral-large-2-instruct
Free
33K ctx
mistralai/mistral-large-3-675b-instruct-2512
nvidia/mistralai/mistral-large-3-675b-instruct-2512
Free
33K ctx
mistralai/mistral-medium-3.5-128b
nvidia/mistralai/mistral-medium-3.5-128b
Free
33K ctx
mistralai/mistral-nemotron
nvidia/mistralai/mistral-nemotron
Free
33K ctx
mistralai/mistral-small-4-119b-2603
nvidia/mistralai/mistral-small-4-119b-2603
Free
33K ctx
mistralai/mixtral-8x22b-instruct-v0.1
nvidia/mistralai/mixtral-8x22b-instruct-v0.1
Free
33K ctx
mistralai/mixtral-8x22b-v0.1
nvidia/mistralai/mixtral-8x22b-v0.1
Free
33K ctx
mistralai/mixtral-8x7b-instruct-v0.1
nvidia/mistralai/mixtral-8x7b-instruct-v0.1
Free
33K ctx
nv-mistralai/mistral-nemo-12b-instruct
nvidia/nv-mistralai/mistral-nemo-12b-instruct
Free
33K ctx
NVIDIA: Llama 3.3 Nemotron Super 49B V1.5
nvidia/llama-3.3-nemotron-super-49b-v1.5
$0.10/M
131K ctx
NVIDIA: Nemotron 3 Nano 30B A3B
nvidia/nemotron-3-nano-30b-a3b
$0.05/M
262K ctx
NVIDIA: Nemotron 3 Nano 30B A3B (free)
nvidia/nemotron-3-nano-30b-a3b:free
Free
256K ctx
NVIDIA: Nemotron 3 Nano Omni (free)
nvidia/nemotron-3-nano-omni-30b-a3b-reasoning:free
Free
256K ctx
NVIDIA: Nemotron 3 Super
nvidia/nemotron-3-super-120b-a12b
$0.09/M
262K ctx
NVIDIA: Nemotron 3 Super (free)
nvidia/nemotron-3-super-120b-a12b:free
Free
262K ctx
NVIDIA: Nemotron Nano 12B 2 VL (free)
nvidia/nemotron-nano-12b-v2-vl:free
Free
128K ctx
NVIDIA: Nemotron Nano 9B V2
nvidia/nemotron-nano-9b-v2
$0.04/M
131K ctx
NVIDIA: Nemotron Nano 9B V2 (free)
nvidia/nemotron-nano-9b-v2:free
Free
128K ctx
nvidia/llama-3.1-nemoguard-8b-content-safety
nvidia/nvidia/llama-3.1-nemoguard-8b-content-safety
Free
33K ctx
nvidia/llama-3.1-nemoguard-8b-topic-control
nvidia/nvidia/llama-3.1-nemoguard-8b-topic-control
Free
33K ctx
nvidia/llama-3.1-nemotron-51b-instruct
nvidia/nvidia/llama-3.1-nemotron-51b-instruct
Free
33K ctx
nvidia/llama-3.1-nemotron-70b-instruct
nvidia/nvidia/llama-3.1-nemotron-70b-instruct
Free
33K ctx
nvidia/llama-3.1-nemotron-nano-8b-v1
nvidia/nvidia/llama-3.1-nemotron-nano-8b-v1
Free
33K ctx
nvidia/llama-3.1-nemotron-nano-vl-8b-v1
nvidia/nvidia/llama-3.1-nemotron-nano-vl-8b-v1
Free
33K ctx
nvidia/llama-3.1-nemotron-safety-guard-8b-v3
nvidia/nvidia/llama-3.1-nemotron-safety-guard-8b-v3
Free
33K ctx
nvidia/llama-3.1-nemotron-ultra-253b-v1
nvidia/nvidia/llama-3.1-nemotron-ultra-253b-v1
Free
33K ctx
nvidia/llama-3.2-nemoretriever-1b-vlm-embed-v1
nvidia/nvidia/llama-3.2-nemoretriever-1b-vlm-embed-v1
Free
33K ctx
nvidia/llama-3.2-nemoretriever-300m-embed-v1
nvidia/nvidia/llama-3.2-nemoretriever-300m-embed-v1
Free
33K ctx
nvidia/llama-3.2-nv-embedqa-1b-v1
nvidia/nvidia/llama-3.2-nv-embedqa-1b-v1
Free
33K ctx
nvidia/llama-3.2-nv-embedqa-1b-v2
nvidia/nvidia/llama-3.2-nv-embedqa-1b-v2
Free
33K ctx
nvidia/llama-3.3-nemotron-super-49b-v1
nvidia/nvidia/llama-3.3-nemotron-super-49b-v1
Free
33K ctx
nvidia/llama-3.3-nemotron-super-49b-v1.5
nvidia/nvidia/llama-3.3-nemotron-super-49b-v1.5
$0.10/M
131K ctx
nvidia/llama-nemotron-embed-1b-v2
nvidia/nvidia/llama-nemotron-embed-1b-v2
Free
33K ctx
nvidia/llama-nemotron-embed-vl-1b-v2
nvidia/nvidia/llama-nemotron-embed-vl-1b-v2
Free
33K ctx
nvidia/llama3-chatqa-1.5-70b
nvidia/nvidia/llama3-chatqa-1.5-70b
Free
33K ctx
nvidia/mistral-nemo-minitron-8b-8k-instruct
nvidia/nvidia/mistral-nemo-minitron-8b-8k-instruct
Free
33K ctx
nvidia/nemotron-3-content-safety
nvidia/nvidia/nemotron-3-content-safety
Free
33K ctx
nvidia/nemotron-3-nano-30b-a3b
nvidia/nvidia/nemotron-3-nano-30b-a3b
$0.05/M
262K ctx
nvidia/nemotron-3-nano-omni-30b-a3b-reasoning
nvidia/nvidia/nemotron-3-nano-omni-30b-a3b-reasoning
Free
33K ctx
nvidia/nemotron-3-nano-omni-30b-a3b-reasoning
nvidia/nvidia/nemotron-3-nano-omni-30b-a3b-reasoning
Free
33K ctx
nvidia/nemotron-3-super-120b-a12b
nvidia/nvidia/nemotron-3-super-120b-a12b
$0.09/M
262K ctx
nvidia/nemotron-3-super-120b-a12b
nvidia/nvidia/nemotron-3-super-120b-a12b
$0.09/M
262K ctx
nvidia/nemotron-4-340b-instruct
nvidia/nvidia/nemotron-4-340b-instruct
Free
33K ctx
nvidia/nemotron-4-340b-reward
nvidia/nvidia/nemotron-4-340b-reward
Free
33K ctx
nvidia/nemotron-content-safety-reasoning-4b
nvidia/nvidia/nemotron-content-safety-reasoning-4b
Free
33K ctx
nvidia/nemotron-mini-4b-instruct
nvidia/nvidia/nemotron-mini-4b-instruct
Free
33K ctx
nvidia/nemotron-nano-12b-v2-vl
nvidia/nvidia/nemotron-nano-12b-v2-vl
Free
33K ctx
nvidia/nemotron-nano-3-30b-a3b
nvidia/nvidia/nemotron-nano-3-30b-a3b
Free
33K ctx
nvidia/nemotron-parse
nvidia/nvidia/nemotron-parse
Free
33K ctx
nvidia/nv-embedqa-mistral-7b-v2
nvidia/nvidia/nv-embedqa-mistral-7b-v2
Free
33K ctx
nvidia/nvidia-nemotron-nano-9b-v2
nvidia/nvidia/nvidia-nemotron-nano-9b-v2
Free
33K ctx
qwen/qwen3-coder-480b-a35b-instruct
nvidia/qwen/qwen3-coder-480b-a35b-instruct
Free
33K ctx
qwen/qwen3-next-80b-a3b-instruct
nvidia/qwen/qwen3-next-80b-a3b-instruct
$0.09/M
262K ctx
qwen/qwen3-next-80b-a3b-thinking
nvidia/qwen/qwen3-next-80b-a3b-thinking
$0.10/M
131K ctx
qwen/qwen3.5-122b-a10b
nvidia/qwen/qwen3.5-122b-a10b
$0.26/M
262K ctx
qwen/qwen3.5-397b-a17b
nvidia/qwen/qwen3.5-397b-a17b
$0.39/M
262K ctx