{"data":[{"id":"alibaba-qwen3-4b-instruct","name":"qwen3-4b-instruct","display_name":"Qwen3 4B Instruct","description":"An instruction-tuned 4B Qwen3 model offering efficient text generation and reasoning in a small parameter footprint.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":4,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/qwen3-4b-instruct-2507","alibaba-qwen3-4b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-4b-instruct-2507","huggingface-reasoning-qwen3-4b-instruct-2507","lemonade/Qwen3-4B-Instruct-2507-GGUF","qwen3-4b-2507-instruct","qwen3-4b-2507-instruct-reasoning","qwen3-4b-instruct","qwen3-4b-instruct-reasoning"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"kwaipilot-kat-32b-dev","name":"kat-32b-dev","display_name":"KwaiPilot KAT 32B Dev","description":"An open-source 32B-parameter coding LLM based on the Qwen3 architecture, optimized for software engineering tasks through multi-stage training including SFT and reinforcement learning.","creator":"kwaipilot","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":32,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["accounts/fireworks/models/kat-dev-32b","fireworks_ai/accounts/fireworks/models/kat-dev-32b","kwaipilot-kat-32b-dev"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-0-6b","name":"qwen3-0-6b","display_name":"Qwen3 0.6B","description":"A 0.6-billion-parameter base LLM from Alibaba's Qwen3 series, designed for ultra-lightweight deployment and on-device language tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":0.6,"modalities":{"input":["text"],"output":["text"]},"context_window":40960,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/qwen3-0p6b","alibaba-qwen3-0-6b","fireworks_ai/accounts/fireworks/models/qwen3-0p6b","qwen3-0.6b","qwen3-0.6b-instruct","qwen3-0.6b-instruct-reasoning"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-1-7b","name":"qwen3-1-7b","display_name":"Qwen3 1.7B","description":"A 1.7-billion-parameter base LLM from Alibaba's Qwen3 series, balancing compact size with reasoning and language generation capabilities.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":1.7,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/qwen3-1p7b","alibaba-qwen3-1-7b","fireworks_ai/accounts/fireworks/models/qwen3-1p7b","huggingface-asr-qwen3-asr-1-7b","huggingface-reasoning-qwen3-1-7b","qwen3-1.7b","qwen3-1.7b-instruct","qwen3-1.7b-instruct-reasoning"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-14b","name":"qwen3-14b","display_name":"Qwen3 14B","description":"A 14-billion-parameter LLM from Alibaba's Qwen3 series with strong reasoning and tool-use capabilities for complex instruction-following tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":14,"modalities":{"input":["text"],"output":["text"]},"context_window":131702,"max_output_tokens":40960,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["accounts/fireworks/models/qwen3-14b","alibaba-qwen3-14b","alibaba/qwen-3-14b","deepinfra/Qwen/Qwen3-14B","fireworks_ai/accounts/fireworks/models/qwen3-14b","huggingface-reasoning-qwen3-14b","nebius/Qwen/Qwen3-14B","qwen/qwen3-14b","Qwen/Qwen3-14B","qwen3-14b","qwen3-14b-instruct","qwen3-14b-instruct-reasoning","vercel_ai_gateway/alibaba/qwen-3-14b"],"hf_likes":386,"hf_downloads":3005499,"hf_downloads_all_time":14478982,"hf_trending_score":3,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-32b","name":"qwen3-32b","display_name":"Qwen3 32B","description":"A dense 32B-parameter LLM from the Qwen3 series with strong reasoning and tool-use capabilities, suitable for a wide range of language tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":32,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":40960,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":15,"ids":["accounts/fireworks/models/qwen3-32b","alibaba-qwen3-32b","alibaba/qwen-3-32b","cerebras/qwen-3-32b","deepinfra/Qwen/Qwen3-32B","fireworks_ai/accounts/fireworks/models/qwen3-32b","gradient_ai/alibaba-qwen3-32b","groq/qwen/qwen3-32b","huggingface-reasoning-qwen3-32b","lambda_ai/qwen3-32b-fp8","nebius/Qwen/Qwen3-32B","novita/qwen/qwen3-32b-fp8","ovhcloud/Qwen3-32B","qwen.qwen3-32b-v1:0","qwen/qwen3-32b","Qwen/Qwen3-32B","qwen/qwen3-32b-fp8","qwen3-32b","qwen3-32b-instruct","qwen3-32b-instruct-reasoning","sambanova/Qwen3-32B","vercel_ai_gateway/alibaba/qwen-3-32b"],"hf_likes":685,"hf_downloads":2337650,"hf_downloads_all_time":26634596,"hf_trending_score":4,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-4b","name":"qwen3-4b","display_name":"Qwen3 4B","description":"A compact 4B-parameter dense LLM from the Qwen3 series supporting hybrid thinking and non-thinking modes for efficient on-device or low-latency deployment.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":4,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":20000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/qwen3-4b","alibaba-qwen3-4b","fireworks_ai/accounts/fireworks/models/qwen3-4b","huggingface-reasoning-qwen3-4b","nebius/Qwen/Qwen3-4B","novita/qwen/qwen3-4b-fp8","qwen/qwen3-4b-fp8","qwen3-4b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-8b","name":"qwen3-8b","display_name":"Qwen3 8B","description":"An 8B-parameter dense LLM from the Qwen3 series with strong reasoning capabilities and support for hybrid thinking and non-thinking inference modes.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"language","size_in_bn":8,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":20000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["accounts/fireworks/models/qwen3-8b","alibaba-qwen3-8b","fireworks_ai/accounts/fireworks/models/qwen3-8b","huggingface-reasoning-qwen3-8b","llamagate/qwen3-8b","novita/qwen/qwen3-8b-fp8","qwen/qwen3-8b","qwen/qwen3-8b-fp8","qwen3-8b","qwen3-8b-instruct","qwen3-8b-instruct-reasoning"],"hf_likes":1051,"hf_downloads":8692944,"hf_downloads_all_time":50107992,"hf_trending_score":9,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-embedding-0-6b","name":"qwen3-embedding-0-6b","display_name":"Qwen3 Embedding 0.6B","description":"A compact 0.6B-parameter text embedding model from the Qwen3 series, supporting retrieval, classification, clustering, and bitext mining tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"embedding","size_in_bn":0.6,"modalities":{"input":["text"],"output":["embedding"]},"context_window":32768,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-11-14","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["@cf/qwen/qwen3-embedding-0.6b","accounts/fireworks/models/qwen3-embedding-0p6b","alibaba-qwen3-embedding-0-6b","alibaba/qwen3-embedding-0.6b","fireworks_ai/accounts/fireworks/models/qwen3-embedding-0p6b","huggingface-textembedding-qwen3-embedding-0-6b","novita/qwen/qwen3-embedding-0.6b","Qwen/Qwen3-Embedding-0.6B"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-embedding-4b","name":"qwen3-embedding-4b","display_name":"Qwen3 Embedding 4B","description":"A 4B-parameter text embedding model from the Qwen3 series, delivering strong multilingual retrieval, classification, and clustering performance.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"embedding","size_in_bn":4,"modalities":{"input":["text"],"output":["embedding"]},"context_window":40960,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-06-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["accounts/fireworks/models/qwen3-embedding-4b","alibaba-qwen3-embedding-4b","alibaba/qwen3-embedding-4b","fireworks_ai/accounts/fireworks/models/qwen3-embedding-4b","Qwen/Qwen3-Embedding-4B"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-embedding-8b","name":"qwen3-embedding-8b","display_name":"Qwen3 Embedding 8B","description":"An 8B-parameter text embedding model from the Qwen3 series with strong multilingual capabilities and long-context support for retrieval and ranking tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"embedding","size_in_bn":8,"modalities":{"input":["text"],"output":["embedding"]},"context_window":40960,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-06-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/qwen3-embedding-8b","alibaba-qwen3-embedding-8b","alibaba/qwen3-embedding-8b","llamagate/qwen3-embedding-8b","novita/qwen/qwen3-embedding-8b","Qwen/Qwen3-Embedding-8B"],"hf_likes":656,"hf_downloads":1900241,"hf_downloads_all_time":10616532,"hf_trending_score":9,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-reranker-0-6b","name":"qwen3-reranker-0-6b","display_name":"Qwen3 Reranker 0.6B","description":"A compact 0.6B-parameter reranker from the Qwen3 series, supporting text retrieval, code retrieval, classification, and multilingual ranking tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"reranking","size_in_bn":0.6,"modalities":{"input":["text"],"output":[]},"context_window":40960,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["accounts/fireworks/models/qwen3-reranker-0p6b","alibaba-qwen3-reranker-0-6b","fireworks_ai/accounts/fireworks/models/qwen3-reranker-0p6b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-reranker-4b","name":"qwen3-reranker-4b","display_name":"Qwen3 Reranker 4B","description":"A 4B-parameter reranker from the Qwen3 series, delivering strong performance on text and code retrieval, classification, and bitext mining tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"reranking","size_in_bn":4,"modalities":{"input":["text"],"output":[]},"context_window":40960,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["accounts/fireworks/models/qwen3-reranker-4b","alibaba-qwen3-reranker-4b","fireworks_ai/accounts/fireworks/models/qwen3-reranker-4b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"alibaba-qwen3-reranker-8b","name":"qwen3-reranker-8b","display_name":"Qwen3 Reranker 8B","description":"An 8B-parameter reranker from the Qwen3 series, offering high-accuracy multilingual ranking for retrieval, classification, and clustering pipelines.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"reranking","size_in_bn":8,"modalities":{"input":["text"],"output":[]},"context_window":40960,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["accounts/fireworks/models/qwen3-reranker-8b","alibaba-qwen3-reranker-8b","fireworks_ai/accounts/fireworks/models/qwen3-reranker-8b","novita/qwen/qwen3-reranker-8b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"voyage-4-nano","name":"voyage-4-nano","display_name":"Voyage 4 Nano","description":"A compact text embedding model from Voyage AI built on a bidirectional Qwen3 backbone (~340M parameters, 32k context), optimized for high-performance semantic search and retrieval.","creator":"voyage","family":"qwen3","tier":"nano","version":"4","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["accounts/fireworks/models/voyage-4-nano","voyage-4-nano"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"}],"pagination":{"page_size":50,"has_next":false,"next_token":null,"total_count":15},"meta":{"updated_at":"2026-06-11","request_id":"23e7d96b-3f17-45c7-b2b3-afe350f4411d","execution_ms":10}}