{"data":[{"id":"nvidia-nemotron-super-3-120b-a12b","name":"nvidia-nemotron-super-3-120b-a12b","display_name":"Nemotron Super 3 120B A12B","description":"A 120B-parameter hybrid MoE Nemotron Super 3 model with 12B active parameters, optimized by NVIDIA for compute-efficient reasoning in specialized agentic systems.","creator":"nvidia","family":"nemotron_h","tier":"","version":"3","type":"language","size_in_bn":120,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":262144,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["nvidia-nemotron-super-3-120b-a12b","nvidia-nemotron-3-super-120b-a12b","amazon_sagemaker/huggingface-llm-nvidia-nemotron-3-super-120b-a12b-bf16","artificialanalysis/nvidia-nemotron-3-super-120b-a12b","deepinfra/nvidia/NVIDIA-Nemotron-3-Super-120B-A12B","fireworks/accounts/fireworks/models/nvidia-nemotron-3-super-120b-a12b-fp8","fireworks/accounts/fireworks/models/nvidia-nemotron-3-super-120b-a12b-nvfp4","openrouter/nvidia/nemotron-3-super-120b-a12b","openrouter/nvidia/nemotron-3-super-120b-a12b:free","vercel/nvidia/nemotron-3-super-120b-a12b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-07 08:02:45"},{"id":"nvidia-nemotron-nano-2-9b","name":"nemotron-nano-2-9b","display_name":"Nemotron Nano 2 9B","description":"A 9B-parameter hybrid LLM from NVIDIA's Nemotron Nano v2 series, trained from scratch as a unified model for both reasoning and non-reasoning workloads.","creator":"nvidia","family":"nemotron_h","tier":"","version":"2","type":"language","size_in_bn":9,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-05","earliest_deprecation_date":"2026-06-11","deprecated":false,"has_pricing":true,"provider_count":5,"ids":["nvidia-nemotron-nano-2-9b","deepinfra/nvidia/NVIDIA-Nemotron-Nano-9B-v2","fireworks_ai/accounts/fireworks/models/nvidia-nemotron-nano-9b-v2","nvidia.nemotron-nano-9b-v2","nvidia-nemotron-nano-9b-v2","nvidia-nemotron-nano-9b-v2-reasoning","amazon_bedrock/nvidia.nemotron-nano-9b-v2","amazon_bedrock_global/nvidia.nemotron-nano-9b-v2","amazon_sagemaker/nvidia-nemotron-nano-9b-v2","artificialanalysis/nvidia-nemotron-nano-9b-v2","artificialanalysis/nvidia-nemotron-nano-9b-v2-reasoning","fireworks/accounts/fireworks/models/nvidia-nemotron-nano-9b-v2","litellm/deepinfra/nvidia/NVIDIA-Nemotron-Nano-9B-v2","litellm/fireworks_ai/accounts/fireworks/models/nvidia-nemotron-nano-9b-v2","litellm/nvidia.nemotron-nano-9b-v2","openrouter/nvidia/nemotron-nano-9b-v2","openrouter/nvidia/nemotron-nano-9b-v2:free","vercel/nvidia/nemotron-nano-9b-v2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-07 08:02:45"},{"id":"nvidia-nemotron-nano-3-30b-a3b","name":"nvidia-nemotron-nano-3-30b-a3b","display_name":"Nemotron Nano 3 30B A3B","description":"A 30B-parameter hybrid MoE Nemotron Nano 3 model with 3B active parameters, combining Mamba-Transformer architecture for efficient reasoning and agentic tasks.","creator":"nvidia","family":"nemotron_h","tier":"","version":"3","type":"language","size_in_bn":30,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":228000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-12-14","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["nvidia-nemotron-nano-3-30b-a3b","nvidia-nemotron-3-nano-30b-a3b","nvidia-nemotron-3-nano-30b-a3b-reasoning","artificialanalysis/nvidia-nemotron-3-nano-30b-a3b","artificialanalysis/nvidia-nemotron-3-nano-30b-a3b-reasoning","deepinfra/nvidia/Nemotron-3-Nano-30B-A3B","fireworks/accounts/fireworks/models/nemotron-nano-3-30b-a3b","openrouter/nvidia/nemotron-3-nano-30b-a3b","openrouter/nvidia/nemotron-3-nano-30b-a3b:free","vercel/nvidia/nemotron-3-nano-30b-a3b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-07 08:02:45"},{"id":"nvidia-nemotron-3-ultra","name":"nemotron-3-ultra","display_name":"Nemotron 3 Ultra","description":"A frontier-scale Nemotron large language model from NVIDIA designed for strong agentic, reasoning, and conversational capabilities at extreme parameter counts.","creator":"nvidia","family":"nemotron_h","tier":"ultra","version":"3","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["nvidia-nemotron-3-ultra","fireworks/accounts/fireworks/models/nemotron-3-ultra-bf16","fireworks/accounts/fireworks/models/nemotron-3-ultra-nvfp4"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-07 08:02:45"},{"id":"nvidia-nemotron-nano-2-12b","name":"nemotron-nano-2-12b","display_name":"Nemotron Nano 2 12B","description":"A 12B-parameter hybrid LLM from NVIDIA's Nemotron Nano v2 series, trained from scratch as a unified model supporting both reasoning and non-reasoning modes.","creator":"nvidia","family":"nemotron_h","tier":"","version":"2","type":"language","size_in_bn":12,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-12-02","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["nvidia-nemotron-nano-2-12b","fireworks_ai/accounts/fireworks/models/nvidia-nemotron-nano-12b-v2","nvidia.nemotron-nano-12b-v2","amazon_bedrock/nvidia.nemotron-nano-12b-v2","amazon_bedrock_global/nvidia.nemotron-nano-12b-v2","fireworks/accounts/fireworks/models/nvidia-nemotron-nano-12b-v2","litellm/fireworks_ai/accounts/fireworks/models/nvidia-nemotron-nano-12b-v2","litellm/nvidia.nemotron-nano-12b-v2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-07 08:02:45"}],"pagination":{"page_size":50,"has_next":false,"next_token":null,"total_count":5},"meta":{"updated_at":"2026-06-07","request_id":"4d828108-0673-4b26-9179-629917065487","execution_ms":2}}