{"data":[{"id":"deepseek-v3-2-reasoning-925","name":"deepseek-v3-2-reasoning-925","display_name":"DeepSeek V3.2 Exp Reasoning","description":"A reasoning-mode experimental build of DeepSeek V3.2 (925 variant), combining sparse attention efficiency with chain-of-thought inference.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["deepseek-v3-2-reasoning-0925","deepseek-v3-2-reasoning-925"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-2","name":"v3-2","display_name":"DeepSeek V3.2","description":"DeepSeek's V3.2 MoE LLM featuring implicit caching support and improved tool-use capabilities over the V3.1 
generation.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["accounts/fireworks/models/deepseek-v3p2","azure_ai/deepseek-v3.2","bedrock/ap-northeast-1/deepseek.v3.2","bedrock/ap-south-1/deepseek.v3.2","bedrock/ap-southeast-3/deepseek.v3.2","bedrock/eu-north-1/deepseek.v3.2","bedrock/sa-east-1/deepseek.v3.2","bedrock/us-east-1/deepseek.v3.2","bedrock/us-east-2/deepseek.v3.2","bedrock/us-west-2/deepseek.v3.2","deepseek-ai/DeepSeek-V3.2","deepseek-llm-deepseek-v3-2","deepseek-v3-2","deepseek-v3-2-251201","deepseek-v3-2-reasoning","deepseek-v3.2-maas","deepseek-v3.2685","deepseek.v3.2","deepseek/deepseek-v3.2","eu.deepseek.v3.2","fireworks_ai/accounts/fireworks/models/deepseek-v3p2","gmi/deepseek-ai/DeepSeek-V3.2","novita/deepseek/deepseek-v3.2","openrouter/deepseek/deepseek-v3.2","publishers/google/models/deepseek-v3.2-maas","us.deepseek.v3.2","vertex_ai/deepseek-ai/deepseek-v3.2-maas"],"hf_likes":1413,"hf_downloads":10366446,"hf_downloads_all_time":11229842,"hf_trending_score":6,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-2-speciale","name":"deepseek-v3-2-speciale","display_name":"DeepSeek V3.2 Speciale","description":"A high-compute variant of DeepSeek V3.2 optimized 
for maximum reasoning and agentic performance using DeepSeek Sparse Attention for long-context tasks.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["azure_ai/deepseek-v3.2-speciale","deepseek-v3-2-speciale","deepseek/deepseek-v3.2-speciale"],"hf_likes":703,"hf_downloads":12474,"hf_downloads_all_time":252919,"hf_trending_score":1,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-1-terminus","name":"deepseek-v3-1-terminus","display_name":"DeepSeek V3.1 Terminus","description":"An update to DeepSeek V3.1 that addresses language consistency and agent capability issues while preserving the model's core 
performance.","creator":"deepseek","family":"deepseek-v3","tier":"terminus","version":"3.1","type":"language","size_in_bn":684.531,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-22","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["accounts/fireworks/models/deepseek-v3p1-terminus","deepinfra/deepseek-ai/DeepSeek-V3.1-Terminus","deepseek-ai/DeepSeek-V3.1-Terminus","deepseek-v3-1-terminus","deepseek-v3-1-terminus-reasoning","deepseek/deepseek-v3.1-terminus","fireworks_ai/accounts/fireworks/models/deepseek-v3p1-terminus","novita/deepseek/deepseek-v3.1-terminus"],"hf_likes":363,"hf_downloads":3879,"hf_downloads_all_time":180017,"hf_trending_score":0,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-2-925","name":"deepseek-v3-2-925","display_name":"DeepSeek V3.2 Exp","description":"An experimental build of DeepSeek V3.2 identified by the 925 variant code, offering early access to V3.2 generation 
capabilities.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["deepseek-v3-2-0925","deepseek-v3-2-925"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-324","name":"deepseek-v3-324","display_name":"DeepSeek V3 324","description":"The March 2025 update of DeepSeek V3 (V3-0324), a 671B MoE LLM representing an improved iteration over the original V3 
release.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.0","type":"language","size_in_bn":684.531,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":13,"ids":["accounts/fireworks/models/deepseek-v3-0324","azure_ai/deepseek-v3-0324","baseten/deepseek-ai/DeepSeek-V3-0324","crusoe/deepseek-ai/DeepSeek-V3-0324","deepinfra/deepseek-ai/DeepSeek-V3-0324","deepseek-ai/DeepSeek-V3-0324","deepseek-v3-0324","deepseek-v3-324","deepseek/deepseek-v3-0324","fireworks_ai/accounts/fireworks/models/deepseek-v3-0324","gmi/deepseek-ai/DeepSeek-V3-0324","hyperbolic/deepseek-ai/DeepSeek-V3-0324","lambda_ai/deepseek-v3-0324","nebius/deepseek-ai/DeepSeek-V3-0324","novita/deepseek/deepseek-v3-0324","sambanova/DeepSeek-V3-0324","wandb/deepseek-ai/DeepSeek-V3-0324"],"hf_likes":3101,"hf_downloads":617973,"hf_downloads_all_time":4563386,"hf_trending_score":0,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3","name":"v3","display_name":"DeepSeek V3","description":"DeepSeek's third-generation MoE LLM with 671B total parameters (37B activated per token), excelling at coding, reasoning, and tool 
use.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.0","type":"language","size_in_bn":684.531,"modalities":{"input":["image","text"],"output":["text"]},"context_window":163840,"max_output_tokens":81920,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-12-26","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":11,"ids":["accounts/fireworks/models/deepseek-v3","azure_ai/deepseek-v3","deepinfra/deepseek-ai/DeepSeek-V3","deepseek-ai/DeepSeek-V3","deepseek-chat","deepseek-v3","deepseek.v3-v1:0","deepseek/deepseek_v3","deepseek/deepseek-chat","deepseek/deepseek-v3","fireworks_ai/accounts/fireworks/models/deepseek-v3","hyperbolic/deepseek-ai/DeepSeek-V3","nebius/deepseek-ai/DeepSeek-V3","openrouter/deepseek/deepseek-chat","replicate/deepseek-ai/deepseek-v3","together_ai/deepseek-ai/DeepSeek-V3","vercel_ai_gateway/deepseek/deepseek-v3"],"hf_likes":4056,"hf_downloads":882009,"hf_downloads_all_time":15156328,"hf_trending_score":4,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-324b","name":"v3-324b","display_name":"DeepSeek V3 324B","description":"A 324B-parameter variant of DeepSeek V3, offering a mid-scale MoE LLM option within the V3 product 
line.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.0","type":"language","size_in_bn":324,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["deepseek-v3-324b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-turbo","name":"deepseek-v3-turbo","display_name":"DeepSeek V3 Turbo","description":"A turbo-speed variant of DeepSeek V3 optimized for faster inference, pre-trained on nearly 15 trillion tokens with strong coding and instruction-following 
abilities.","creator":"deepseek","family":"deepseek-v3","tier":"turbo","version":"3.0","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":64000,"max_output_tokens":16000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["deepseek-v3-turbo","deepseek/deepseek-v3-turbo","novita/deepseek/deepseek-v3-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-1-671b","name":"deepseek-v3-1-671b","display_name":"DeepSeek V3.1 671B","description":"The full 671B-parameter release of DeepSeek V3.1, a MoE LLM with enhanced reasoning and agentic capabilities over the original 
V3.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.1","type":"language","size_in_bn":671,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["deepseek-v3-1-671b","ollama/deepseek-v3.1:671b-cloud"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-2-exp","name":"deepseek-v3-2-exp","display_name":"DeepSeek V3.2 Exp","description":"An experimental DeepSeek V3.2 variant introducing the DeepSeek Sparse Attention mechanism for enhanced long-context processing 
efficiency.","creator":"deepseek","family":"deepseek-v3","tier":"exp","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["deepseek-v3-2-exp","deepseek-v3.2-exp685","deepseek/deepseek-v3.2-exp","novita/deepseek/deepseek-v3.2-exp","openrouter/deepseek/deepseek-v3.2-exp"],"hf_likes":988,"hf_downloads":218917,"hf_downloads_all_time":636879,"hf_trending_score":5,"updated_at":"2026-06-11 08:02:18"},{"id":"deepseek-v3-2-thinking","name":"deepseek-v3-2-thinking","display_name":"DeepSeek V3.2 Thinking","description":"The thinking-mode variant of DeepSeek V3.2, enabling extended internal reasoning traces for complex problem-solving 
scenarios.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":128000,"max_output_tokens":8000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-12-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["deepseek-v3-2-thinking","deepseek/deepseek-v3.2-thinking"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"}],"pagination":{"page_size":50,"has_next":false,"next_token":null,"total_count":12},"meta":{"updated_at":"2026-06-11","request_id":"9713cb67-eba1-4eb9-95c5-1827c1b19de9","execution_ms":9}}