{"data":[{"id":"zhipu-glm-5","name":"glm-5","display_name":"GLM-5","description":"An open-source MoE LLM from Z AI designed for long-context reasoning, multi-step tool orchestration, and complex agentic engineering tasks.","creator":"zhipu","family":"glm_moe_dsa","tier":"","version":"5","type":"language","size_in_bn":753.864,"modalities":{"input":["pdf","text"],"output":["text"]},"context_window":202800,"max_output_tokens":131100,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["accounts/fireworks/models/glm-5","baseten/zai-org/GLM-5","bedrock/us-east-1/zai.glm-5","bedrock/us-west-2/zai.glm-5","glm-5","glm-5-maas","glm-5-non-reasoning","openrouter/z-ai/glm-5","publishers/google/models/glm-5-maas","vertex_ai/zai-org/glm-5-maas","z-ai/glm-5","zai-org/glm-5","zai-org/GLM-5","zai.glm-5","zai/glm-5","zhipu-glm-5"],"hf_likes":2070,"hf_downloads":477667,"hf_downloads_all_time":777726,"hf_trending_score":5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.573,"max_input_per_1m":1,"min_output_per_1m":1.92,"max_output_per_1m":3.2,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":0.1,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"moonshot-kimi-k2-5","name":"kimi-k2-5","display_name":"Kimi K2.5","description":"An updated iteration of Kimi K2 with enhanced reasoning, vision, and tool-use capabilities, supporting implicit caching for efficient inference.","creator":"moonshot","family":"kimi_k25","tier":"","version":"k2-5","type":"language","size_in_bn":1058.589,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":98304,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-01-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["@cf/moonshotai/kimi-k2.5","accounts/fireworks/models/kimi-k2p5","azure_ai/kimi-k2.5","baseten/moonshotai/Kimi-K2.5","bedrock/ap-northeast-1/moonshotai.kimi-k2.5","bedrock/ap-south-1/moonshotai.kimi-k2.5","bedrock/ap-southeast-3/moonshotai.kimi-k2.5","bedrock/eu-north-1/moonshotai.kimi-k2.5","bedrock/moonshotai.kimi-k2.5","bedrock/sa-east-1/moonshotai.kimi-k2.5","bedrock/us-east-1/moonshotai.kimi-k2.5","bedrock/us-east-2/moonshotai.kimi-k2.5","bedrock/us-west-2/moonshotai.kimi-k2.5","fireworks_ai/accounts/fireworks/models/kimi-k2p5","fireworks_ai/kimi-k2p5","huggingface-llm-kimi-k2-5","kimi-k2-5","kimi-k2-5-non-reasoning","kimi-k2.5","moonshot-kimi-k2-5","moonshot/kimi-k2.5","moonshotai.kimi-k2.5","moonshotai/kimi-k2.5","moonshotai/Kimi-K2.5","openrouter/moonshotai/kimi-k2.5","together_ai/moonshotai/Kimi-K2.5","wandb/moonshotai/Kimi-K2.5"],"hf_likes":2753,"hf_downloads":5222216,"hf_downloads_all_time":9851195,"hf_trending_score":34,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"moonshot-kimi-k2-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.375,"max_input_per_1m":0.6,"min_output_per_1m":2.025,"max_output_per_1m":3.011,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":12},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-5-397b-a17b","name":"qwen3-5-397b-a17b","display_name":"Qwen3.5 397B A17B","description":"Alibaba's largest Qwen3.5 MoE model with 397B total parameters and 17B activated per token, targeting maximum capability for complex reasoning and generation.","creator":"alibaba","family":"qwen3_5_moe","tier":"","version":null,"type":"language","size_in_bn":397,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-16","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/qwen3p5-397b-a17b","alibaba-qwen3-5-397b-a17b","openrouter/qwen/qwen3.5-397b-a17b","qwen/qwen3.5-397b-a17b","Qwen/Qwen3.5-397B-A17B","qwen3-5-397b-a17b","qwen3-5-397b-a17b-non-reasoning","qwen3.5-397b-a17b","together_ai/Qwen/Qwen3.5-397B-A17B"],"hf_likes":1462,"hf_downloads":710153,"hf_downloads_all_time":2631436,"hf_trending_score":11,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-5-397b-a17b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.39,"max_input_per_1m":0.71,"min_output_per_1m":2.34,"max_output_per_1m":4.25,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-4-7","name":"glm-4-7","display_name":"GLM-4.7","description":"A multilingual MoE LLM from Z AI designed for complex reasoning, agentic coding, and tool use, building on the GLM-4.6 architecture.","creator":"zhipu","family":"glm4_moe","tier":"","version":"4-7","type":"language","size_in_bn":358.338,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":204800,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-22","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":13,"ids":["accounts/fireworks/models/glm-4p7","baseten/zai-org/GLM-4.7","cerebras/zai-glm-4.7","fireworks_ai/accounts/fireworks/models/glm-4p7","fireworks_ai/glm-4p7","glm-4-7","glm-4-7-251222","glm-4-7-non-reasoning","glm-4.7","glm-4.7-maas","novita/zai-org/glm-4.7","openrouter/z-ai/glm-4.7","publishers/google/models/glm-4.7-maas","together_ai/zai-org/GLM-4.7","vertex_ai/zai-org/glm-4.7-maas","z-ai/glm-4.7","zai-org/glm-4.7","zai-org/GLM-4.7","zai.glm-4.7","zai/glm-4.7","zhipu-glm-4-7"],"hf_likes":2026,"hf_downloads":117151,"hf_downloads_all_time":436300,"hf_trending_score":4,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-4-7","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.4,"max_input_per_1m":2.25,"min_output_per_1m":1.75,"max_output_per_1m":2.75,"min_cache_read_per_1m":0.08,"min_cache_write_per_1m":0.06,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":13},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-5-122b-a10b","name":"qwen3-5-122b-a10b","display_name":"Qwen3.5 122B A10B","description":"A large Qwen3.5 Mixture-of-Experts model with 122B total parameters and 10B activated per token, featuring a 262K token context window for complex reasoning tasks.","creator":"alibaba","family":"qwen3_5_moe","tier":"","version":null,"type":"language","size_in_bn":122,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-25","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/qwen3p5-122b-a10b","alibaba-qwen3-5-122b-a10b","openrouter/qwen/qwen3.5-122b-a10b","qwen/qwen3.5-122b-a10b","Qwen/Qwen3.5-122B-A10B","qwen3-5-122b-a10b","qwen3-5-122b-a10b-non-reasoning","qwen3.5-122b-a10b"],"hf_likes":523,"hf_downloads":906547,"hf_downloads_all_time":1516880,"hf_trending_score":8,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-5-122b-a10b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.26,"max_input_per_1m":0.4,"min_output_per_1m":2.08,"max_output_per_1m":3.2,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3-2","name":"v3-2","display_name":"DeepSeek V3.2","description":"DeepSeek's V3.2 MoE LLM featuring implicit caching support and improved tool-use capabilities over the V3.1 generation.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["accounts/fireworks/models/deepseek-v3p2","azure_ai/deepseek-v3.2","bedrock/ap-northeast-1/deepseek.v3.2","bedrock/ap-south-1/deepseek.v3.2","bedrock/ap-southeast-3/deepseek.v3.2","bedrock/eu-north-1/deepseek.v3.2","bedrock/sa-east-1/deepseek.v3.2","bedrock/us-east-1/deepseek.v3.2","bedrock/us-east-2/deepseek.v3.2","bedrock/us-west-2/deepseek.v3.2","deepseek-ai/DeepSeek-V3.2","deepseek-llm-deepseek-v3-2","deepseek-v3-2","deepseek-v3-2-251201","deepseek-v3-2-reasoning","deepseek-v3.2-maas","deepseek-v3.2685","deepseek.v3.2","deepseek/deepseek-v3.2","eu.deepseek.v3.2","fireworks_ai/accounts/fireworks/models/deepseek-v3p2","gmi/deepseek-ai/DeepSeek-V3.2","novita/deepseek/deepseek-v3.2","openrouter/deepseek/deepseek-v3.2","publishers/google/models/deepseek-v3.2-maas","us.deepseek.v3.2","vertex_ai/deepseek-ai/deepseek-v3.2-maas"],"hf_likes":1413,"hf_downloads":10366446,"hf_downloads_all_time":11229842,"hf_trending_score":6,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2288,"max_input_per_1m":0.62,"min_output_per_1m":0.3432,"max_output_per_1m":1.85,"min_cache_read_per_1m":0.028,"min_cache_write_per_1m":0.056,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":12},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-max","name":"qwen3-max","display_name":"Qwen3 Max","description":"Alibaba's top-tier flagship LLM in the Qwen3 series, delivering leading performance across knowledge, reasoning, coding, and instruction-following benchmarks.","creator":"alibaba","family":"qwen","tier":"max","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-06-30","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-09-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["alibaba-qwen3-max","alibaba/qwen3-max","dashscope/qwen3-max","dashscope/qwen3-max-2026-01-23","novita/qwen/qwen3-max","qwen/qwen3-max","Qwen/Qwen3-Max","qwen3-max","qwen3-max-2025-09-23","qwen3-max-2026-01-23"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-max","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.359,"max_input_per_1m":2.11,"min_output_per_1m":1.434,"max_output_per_1m":8.45,"min_cache_read_per_1m":0.156,"min_cache_write_per_1m":0.975,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-coder-next","name":"qwen3-coder-next","display_name":"Qwen3 Coder Next","description":"A next-generation Qwen3 coding model with enhanced reasoning and tool-use capabilities for advanced agentic programming tasks.","creator":"alibaba","family":"qwen3_next","tier":"","version":null,"type":"language","size_in_bn":79.674,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-04","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["alibaba-qwen3-coder-next","alibaba/qwen3-coder-next","bedrock/ap-northeast-1/qwen.qwen3-coder-next","bedrock/ap-south-1/qwen.qwen3-coder-next","bedrock/ap-southeast-3/qwen.qwen3-coder-next","bedrock/eu-central-1/qwen.qwen3-coder-next","bedrock/eu-south-1/qwen.qwen3-coder-next","bedrock/eu-west-1/qwen.qwen3-coder-next","bedrock/eu-west-2/qwen.qwen3-coder-next","bedrock/sa-east-1/qwen.qwen3-coder-next","bedrock/us-east-1/qwen.qwen3-coder-next","bedrock/us-east-2/qwen.qwen3-coder-next","bedrock/us-west-2/qwen.qwen3-coder-next","huggingface-reasoning-qwen3-coder-next","qwen.qwen3-coder-next","qwen/qwen3-coder-next","qwen3-coder-next"],"hf_likes":1313,"hf_downloads":646521,"hf_downloads_all_time":2269042,"hf_trending_score":28,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-coder-next","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.11,"max_input_per_1m":0.5,"min_output_per_1m":0.8,"max_output_per_1m":1.5,"min_cache_read_per_1m":0.07,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-max-preview","name":"qwen3-max-preview","display_name":"Qwen3 Max Preview","description":"A preview release of the Qwen3 Max flagship LLM, showcasing substantial gains in Chinese-English understanding and complex instruction following over the 2.5 series.","creator":"alibaba","family":"qwen","tier":"max","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-09-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["alibaba-qwen3-max-preview","alibaba/qwen3-max-preview","dashscope/qwen3-max-preview","qwen3-max-preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-max-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.2,"max_input_per_1m":1.2,"min_output_per_1m":6,"max_output_per_1m":6,"min_cache_read_per_1m":0.24,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-coder-480b-a35b-instruct","name":"qwen3-coder-480b-a35b-instruct","display_name":"Qwen3 Coder 480B A35B Instruct","description":"Qwen3's flagship agentic code model with 480B total and 35B activated parameters, excelling at autonomous programming, tool calling, and browser-use tasks.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":480,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["accounts/fireworks/models/qwen3-coder-480b-a35b-instruct","alibaba-qwen3-coder-480b-a35b-instruct","deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct","fireworks_ai/accounts/fireworks/models/qwen3-coder-480b-a35b-instruct","novita/qwen/qwen3-coder-480b-a35b-instruct","qwen/qwen3-coder-480b-a35b-instruct","Qwen/Qwen3-Coder-480B-A35B-Instruct","qwen3-coder-480b-a35b-instruct","wandb/Qwen/Qwen3-Coder-480B-A35B-Instruct"],"hf_likes":1325,"hf_downloads":57687,"hf_downloads_all_time":885858,"hf_trending_score":0.5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-coder-480b-a35b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.22,"max_input_per_1m":100,"min_output_per_1m":1.3,"max_output_per_1m":150,"min_cache_read_per_1m":null,"min_cache_write_per_1m":0.022,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-vl-235b-a22b-instruct","name":"qwen3-vl-235b-a22b-instruct","display_name":"Qwen3 VL 235B A22B Instruct","description":"The flagship instruction-tuned vision-language MoE model in the Qwen3 series, with 235B total and 22B activated parameters for superior visual perception and reasoning.","creator":"alibaba","family":"qwen3_vl_moe","tier":"","version":null,"type":"language","size_in_bn":235,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":262144,"max_output_tokens":129024,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["accounts/fireworks/models/qwen3-vl-235b-a22b-instruct","alibaba-qwen3-vl-235b-a22b-instruct","alibaba/qwen3-vl-235b-a22b-instruct","dashscope/qwen3-vl-235b-a22b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-vl-235b-a22b-instruct","gmi/Qwen/Qwen3-VL-235B-A22B-Instruct-FP8","novita/qwen/qwen3-vl-235b-a22b-instruct","qwen/qwen3-vl-235b-a22b-instruct","Qwen/Qwen3-VL-235B-A22B-Instruct","qwen3-vl-235b-a22b-instruct"],"hf_likes":383,"hf_downloads":947793,"hf_downloads_all_time":2172030,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-vl-235b-a22b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":0.4,"min_output_per_1m":0.88,"max_output_per_1m":1.6,"min_cache_read_per_1m":0.11,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-next-80b-a3b-instruct","name":"qwen3-next-80b-a3b-instruct","display_name":"Qwen3 Next 80B A3B Instruct","description":"An instruction-tuned Qwen3 Next MoE model with 80B total and 3B activated parameters, optimized for text generation and conversational tasks.","creator":"alibaba","family":"qwen3_next","tier":"","version":null,"type":"language","size_in_bn":80,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-09-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["accounts/fireworks/models/qwen3-next-80b-a3b-instruct","alibaba-qwen3-next-80b-a3b-instruct","alibaba/qwen3-next-80b-a3b-instruct","dashscope/qwen3-next-80b-a3b-instruct","deepinfra/Qwen/Qwen3-Next-80B-A3B-Instruct","fireworks_ai/accounts/fireworks/models/qwen3-next-80b-a3b-instruct","huggingface-reasoning-qwen3-next-80b-a3b-instruct","novita/qwen/qwen3-next-80b-a3b-instruct","qwen/qwen3-next-80b-a3b-instruct","Qwen/Qwen3-Next-80B-A3B-Instruct","qwen/qwen3-next-80b-a3b-instruct:free","qwen3-next-80b-a3b-instruct","together_ai/Qwen/Qwen3-Next-80B-A3B-Instruct"],"hf_likes":1012,"hf_downloads":292470,"hf_downloads_all_time":14864763,"hf_trending_score":4,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-next-80b-a3b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.09,"max_input_per_1m":0.9,"min_output_per_1m":0.9,"max_output_per_1m":1.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-coder-30b-a3b-instruct","name":"qwen3-coder-30b-a3b-instruct","display_name":"Qwen3 Coder 30B A3B Instruct","description":"An instruction-tuned Qwen3 MoE coding model with 30B total and 3B active parameters, designed for agentic programming tasks and tool-integrated workflows.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":30,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-06-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-07-31","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/qwen3-coder-30b-a3b-instruct","alibaba-qwen3-coder-30b-a3b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-coder-30b-a3b-instruct","huggingface-reasoning-qwen3-coder-30b-a3b-instruct","lemonade/Qwen3-Coder-30B-A3B-Instruct-GGUF","novita/qwen/qwen3-coder-30b-a3b-instruct","qwen/qwen3-coder-30b-a3b-instruct","qwen3-coder-30b-a3b-instruct"],"hf_likes":1018,"hf_downloads":2406663,"hf_downloads_all_time":7798034,"hf_trending_score":10,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-coder-30b-a3b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.07,"max_input_per_1m":0.45,"min_output_per_1m":0.26,"max_output_per_1m":2.25,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","novita","openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwq-32b","name":"qwq-32b","display_name":"QwQ 32B","description":"A 32B reasoning-focused LLM from Alibaba's Qwen team, designed to match frontier closed-model performance on complex reasoning and problem-solving tasks.","creator":"alibaba","family":"qwen2","tier":"","version":null,"type":"language","size_in_bn":32,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06-30","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-03-05","earliest_deprecation_date":"2026-04-29","deprecated":false,"has_pricing":true,"provider_count":9,"ids":["@cf/qwen/qwq-32b","accounts/fireworks/models/qwq-32b","alibaba-qwq-32b","deepinfra/Qwen/QwQ-32B","fireworks_ai/accounts/fireworks/models/qwq-32b","huggingface-llm-qwq-32b","hyperbolic/Qwen/QwQ-32B","nebius/Qwen/QwQ-32B","nscale/Qwen/QwQ-32B","qwen/qwq-32b","qwq-32b","sambanova/QwQ-32B"],"hf_likes":2906,"hf_downloads":73024,"hf_downloads_all_time":2875672,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwq-32b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":0.9,"min_output_per_1m":0.2,"max_output_per_1m":1,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["deepinfra","nebius"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1","name":"r1","display_name":"DeepSeek R1","description":"DeepSeek's flagship reasoning-focused LLM with strong performance in mathematics, coding, and logical inference, comparable to leading closed-source models.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":684.531,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-01-20","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":14,"ids":["accounts/fireworks/models/deepseek-r1","azure_ai/deepseek-r1","deepinfra/deepseek-ai/DeepSeek-R1","deepseek-llm-r1","deepseek-r1","deepseek-r1-0120","deepseek-r1-qwen3-8b","deepseek-r1685","deepseek-reasoner","deepseek.r1-v1:0","deepseek/deepseek-r1","deepseek/deepseek-reasoner","fireworks_ai/accounts/fireworks/models/deepseek-r1","hyperbolic/deepseek-ai/DeepSeek-R1","nebius/deepseek-ai/DeepSeek-R1","openrouter/deepseek/deepseek-r1","replicate/deepseek-ai/deepseek-r1","sambanova/DeepSeek-R1","snowflake/deepseek-r1","together_ai/deepseek-ai/DeepSeek-R1","us.deepseek.r1-v1:0","vercel_ai_gateway/deepseek/deepseek-r1"],"hf_likes":13288,"hf_downloads":4020320,"hf_downloads_all_time":20204112,"hf_trending_score":20,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.28,"max_input_per_1m":5,"min_output_per_1m":0.4,"max_output_per_1m":10,"min_cache_read_per_1m":0.028,"min_cache_write_per_1m":null,"min_reasoning_per_1m":10,"cheapest_providers":["deepseek"],"provider_count":14},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-vl-32b-instruct","name":"qwen3-vl-32b-instruct","display_name":"Qwen3 VL 32B Instruct","description":"A 32B dense vision-language model from the Qwen3 series with significantly enhanced text understanding, visual perception, and multimodal reasoning capabilities.","creator":"alibaba","family":"qwen3_vl","tier":"","version":null,"type":"language","size_in_bn":32,"modalities":{"input":["image","text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-10-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/qwen3-vl-32b-instruct","alibaba-qwen3-vl-32b-instruct","dashscope/qwen3-vl-32b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-vl-32b-instruct","qwen/qwen3-vl-32b-instruct","qwen3-vl-32b-instruct"],"hf_likes":202,"hf_downloads":2356383,"hf_downloads_all_time":8776345,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-vl-32b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.104,"max_input_per_1m":0.9,"min_output_per_1m":0.416,"max_output_per_1m":0.9,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1-distill-qwen-32b","name":"deepseek-r1-distill-qwen-32b","display_name":"DeepSeek R1 Distill Qwen 32B","description":"A 32B Qwen-based model distilled from DeepSeek R1's reasoning capabilities, offering high-quality chain-of-thought performance at a mid-scale parameter count.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":32,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-01-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["@cf/deepseek-ai/deepseek-r1-distill-qwen-32b","accounts/fireworks/models/deepseek-r1-distill-qwen-32b","deepinfra/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B","deepseek-llm-r1-distill-qwen-32b","deepseek-r1-distill-qwen-32b","deepseek/deepseek-r1-distill-qwen-32b","fireworks_ai/accounts/fireworks/models/deepseek-r1-distill-qwen-32b","novita/deepseek/deepseek-r1-distill-qwen-32b","nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-32B"],"hf_likes":1545,"hf_downloads":1046750,"hf_downloads_all_time":23929632,"hf_trending_score":3,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1-distill-qwen-32b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":0.9,"min_output_per_1m":0.15,"max_output_per_1m":4.881,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["nscale"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-235b-a22b-instruct","name":"qwen3-235b-a22b-instruct","display_name":"Qwen3 235B A22B Instruct","description":"An instruction-tuned update of the Qwen3 235B A22B MoE model with significant improvements in instruction following, logical reasoning, and general capabilities.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":235,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["accounts/fireworks/models/qwen3-235b-a22b-instruct-2507","alibaba-qwen3-235b-a22b-instruct","crusoe/Qwen/Qwen3-235B-A22B-Instruct-2507","deepinfra/Qwen/Qwen3-235B-A22B-Instruct-2507","fireworks_ai/accounts/fireworks/models/qwen3-235b-a22b-instruct-2507","novita/qwen/qwen3-235b-a22b-instruct-2507","qwen/qwen3-235b-a22b-instruct-2507","Qwen/Qwen3-235B-A22B-Instruct-2507","qwen3-235b-a22b-instruct","qwen3-235b-a22b-instruct-2507","replicate/qwen/qwen3-235b-a22b-instruct-2507","wandb/Qwen/Qwen3-235B-A22B-Instruct-2507"],"hf_likes":773,"hf_downloads":150781,"hf_downloads_all_time":1182969,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-235b-a22b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.09,"max_input_per_1m":10,"min_output_per_1m":0.58,"max_output_per_1m":10,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["deepinfra","huggingface","novita"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-vl-30b-a3b-instruct","name":"qwen3-vl-30b-a3b-instruct","display_name":"Qwen3 VL 30B A3B Instruct","description":"An instruction-tuned vision-language MoE model with 30B total and 3B activated parameters, offering strong multimodal understanding and generation capabilities.","creator":"alibaba","family":"qwen3_vl_moe","tier":"","version":null,"type":"language","size_in_bn":30,"modalities":{"input":["image","text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-06","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/qwen3-vl-30b-a3b-instruct","alibaba-qwen3-vl-30b-a3b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-vl-30b-a3b-instruct","novita/qwen/qwen3-vl-30b-a3b-instruct","qwen/qwen3-vl-30b-a3b-instruct","Qwen/Qwen3-VL-30B-A3B-Instruct","qwen3-vl-30b-a3b-instruct"],"hf_likes":562,"hf_downloads":2219395,"hf_downloads_all_time":14070852,"hf_trending_score":2,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-vl-30b-a3b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.13,"max_input_per_1m":0.2,"min_output_per_1m":0.52,"max_output_per_1m":0.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1-distill-qwen-14b","name":"deepseek-r1-distill-qwen-14b","display_name":"DeepSeek R1 Distill Qwen 14B","description":"A 14B Qwen-based model distilled from DeepSeek R1, balancing strong reasoning performance with moderate computational requirements.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":14,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/deepseek-r1-distill-qwen-14b","deepseek-llm-r1-distill-qwen-14b","deepseek-r1-distill-qwen-14b","deepseek/deepseek-r1-distill-qwen-14b","fireworks_ai/accounts/fireworks/models/deepseek-r1-distill-qwen-14b","novita/deepseek/deepseek-r1-distill-qwen-14b","nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-14B"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1-distill-qwen-14b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.07,"max_input_per_1m":0.2,"min_output_per_1m":0.07,"max_output_per_1m":0.431,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["nscale"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen2-5-72b-instruct","name":"qwen2-5-72b-instruct","display_name":"Qwen2.5 72B Instruct","description":"A 72-billion-parameter instruction-tuned LLM from Alibaba's Qwen2.5 series, excelling at natural language understanding, summarization, and dialogue.","creator":"alibaba","family":"qwen2","tier":"","version":null,"type":"language","size_in_bn":72,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-09-19","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["accounts/fireworks/models/qwen2p5-72b-instruct","alibaba-qwen2-5-72b-instruct","deepinfra/Qwen/Qwen2.5-72B-Instruct","fireworks_ai/accounts/fireworks/models/qwen2p5-72b-instruct","huggingface-llm-qwen2-5-72b-instruct","hyperbolic/Qwen/Qwen2.5-72B-Instruct","nebius/Qwen/Qwen2.5-72B-Instruct","novita/qwen/qwen-2.5-72b-instruct","qwen/qwen-2.5-72b-instruct","Qwen/Qwen2.5-72B-Instruct","qwen2-5-72b-instruct","qwen2.5-72b-instruct"],"hf_likes":927,"hf_downloads":457915,"hf_downloads_all_time":5817981,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen2-5-72b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":1.4,"min_output_per_1m":0.3,"max_output_per_1m":5.6,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["deepinfra","hyperbolic"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwq-32b-preview","name":"qwq-32b-preview","display_name":"QwQ 32B Preview","description":"An experimental 32B reasoning LLM from Alibaba's Qwen team, showcasing open-model capabilities comparable to leading closed frontier models on reasoning benchmarks.","creator":"alibaba","family":"qwen2","tier":"","version":null,"type":"language","size_in_bn":32,"modalities":{"input":["text"],"output":["text"]},"context_window":32768,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/qwen-qwq-32b-preview","alibaba-qwq-32b-preview","fireworks_ai/accounts/fireworks/models/qwen-qwq-32b-preview","qwq-32b-preview","QwQ-32B-Preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwq-32b-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.287,"max_input_per_1m":0.9,"min_output_per_1m":0.861,"max_output_per_1m":0.9,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-vl-8b-instruct","name":"qwen3-vl-8b-instruct","display_name":"Qwen3 VL 8B Instruct","description":"An instruction-tuned 8B vision-language model from the Qwen3 series, optimized for conversational multimodal tasks involving text and image inputs.","creator":"alibaba","family":"qwen3_vl","tier":"","version":null,"type":"language","size_in_bn":8,"modalities":{"input":["image","text"],"output":["text"]},"context_window":256000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-14","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/qwen3-vl-8b-instruct","alibaba-qwen3-vl-8b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-vl-8b-instruct","huggingface-vlm-qwen3-vl-8b-instruct","novita/qwen/qwen3-vl-8b-instruct","qwen/qwen3-vl-8b-instruct","qwen3-vl-8b-instruct"],"hf_likes":874,"hf_downloads":3765920,"hf_downloads_all_time":23111974,"hf_trending_score":15,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-vl-8b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.08,"max_input_per_1m":0.2,"min_output_per_1m":0.2,"max_output_per_1m":0.7,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","novita","openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen2-5-32b-instruct","name":"qwen2-5-32b-instruct","display_name":"Qwen2.5 32B Instruct","description":"A 32-billion-parameter instruction-tuned LLM from Alibaba's Qwen2.5 series, optimized for following complex instructions and text generation tasks.","creator":"alibaba","family":"qwen2","tier":"","version":null,"type":"language","size_in_bn":32,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/qwen2p5-32b-instruct","alibaba-qwen2-5-32b-instruct","fireworks_ai/accounts/fireworks/models/qwen2p5-32b-instruct","huggingface-llm-qwen2-5-32b-instruct","nebius/Qwen/Qwen2.5-32B-Instruct","qwen2.5-32b-instruct"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen2-5-32b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.06,"max_input_per_1m":0.9,"min_output_per_1m":0.2,"max_output_per_1m":2.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["nebius"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen2-5-coder-32b-instruct","name":"qwen2-5-coder-32b-instruct","display_name":"Qwen2.5 Coder 32B Instruct","description":"A 32-billion-parameter instruction-tuned code LLM from Alibaba's Qwen2.5-Coder series, excelling at code generation, debugging, and explanation across many programming languages.","creator":"alibaba","family":"qwen2","tier":"","version":null,"type":"language","size_in_bn":32,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-11-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["@cf/qwen/qwen2.5-coder-32b-instruct","accounts/fireworks/models/qwen2p5-coder-32b-instruct","accounts/fireworks/models/qwen2p5-coder-32b-instruct-128k","accounts/fireworks/models/qwen2p5-coder-32b-instruct-32k-rope","accounts/fireworks/models/qwen2p5-coder-32b-instruct-64k","alibaba-qwen2-5-coder-32b-instruct","fireworks_ai/accounts/fireworks/models/qwen2p5-coder-32b-instruct","fireworks_ai/accounts/fireworks/models/qwen2p5-coder-32b-instruct-128k","fireworks_ai/accounts/fireworks/models/qwen2p5-coder-32b-instruct-32k-rope","fireworks_ai/accounts/fireworks/models/qwen2p5-coder-32b-instruct-64k","huggingface-llm-qwen2-5-coder-32b-instruct","hyperbolic/Qwen/Qwen2.5-Coder-32B-Instruct","lambda_ai/qwen25-coder-32b-instruct","nscale/Qwen/Qwen2.5-Coder-32B-Instruct","openrouter/qwen/qwen-2.5-coder-32b-instruct","ovhcloud/Qwen2.5-Coder-32B-Instruct","qwen/qwen-2.5-coder-32b-instruct","qwen2-5-coder-32b-instruct","qwen2.5-coder-32b-instruct"],"hf_likes":2008,"hf_downloads":1257495,"hf_downloads_all_time":5998607,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen2-5-coder-32b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.05,"max_input_per_1m":0.9,"min_output_per_1m":0.1,"max_output_per_1m":1,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["lambda"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-30b-a3b-instruct","name":"qwen3-30b-a3b-instruct","display_name":"Qwen3 30B A3B Instruct","description":"An instruction-tuned Qwen3 MoE model with 30B total and 3B active parameters, optimized for text generation and instruction-following tasks.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":30,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-06-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-07-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/qwen3-30b-a3b-instruct-2507","alibaba-qwen3-30b-a3b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-30b-a3b-instruct-2507","huggingface-reasoning-qwen3-30b-a3b-instruct-2507","qwen/qwen3-30b-a3b-instruct-2507","qwen3-30b-a3b-instruct","qwen3-30b-a3b-instruct-2507"],"hf_likes":801,"hf_downloads":983022,"hf_downloads_all_time":10380022,"hf_trending_score":2,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-30b-a3b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.04815,"max_input_per_1m":0.5,"min_output_per_1m":0.19305,"max_output_per_1m":0.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen-turbo","name":"qwen-turbo","display_name":"Qwen Turbo","description":"A fast, cost-efficient Qwen LLM from Alibaba with a 1M context window suited for high-throughput simple tasks.","creator":"alibaba","family":"qwen","tier":"turbo","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-02-01","earliest_deprecation_date":"2026-05-13","deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-qwen-turbo","dashscope/qwen-turbo","dashscope/qwen-turbo-2024-11-01","dashscope/qwen-turbo-2025-04-28","dashscope/qwen-turbo-latest","qwen-turbo","qwen-turbo-2024-09-19","qwen/qwen-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.044,"max_input_per_1m":0.05,"min_output_per_1m":0.087,"max_output_per_1m":0.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":0.5,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen2-5-coder-7b-instruct","name":"qwen2-5-coder-7b-instruct","display_name":"Qwen2.5 Coder 7B Instruct","description":"A 7-billion-parameter instruction-tuned code LLM from Alibaba's Qwen2.5-Coder series, designed for responsive code generation and developer assistance.","creator":"alibaba","family":"qwen2","tier":"","version":null,"type":"language","size_in_bn":7,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/qwen2p5-coder-7b-instruct","alibaba-qwen2-5-coder-7b-instruct","fireworks_ai/accounts/fireworks/models/qwen2p5-coder-7b-instruct","huggingface-llm-qwen2-5-coder-7b-instruct","nscale/Qwen/Qwen2.5-Coder-7B-Instruct","qwen2-5-coder-7b-instruct","qwen2.5-coder-7b-instruct"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen2-5-coder-7b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.01,"max_input_per_1m":0.2,"min_output_per_1m":0.03,"max_output_per_1m":0.287,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","nscale"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-coder","name":"coder","display_name":"Coder","description":"Alibaba's code-focused LLM designed for programming assistance, code generation, and software development tasks.","creator":"alibaba","family":"alibaba","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-coder","dashscope/qwen-coder"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-coder","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.3,"max_input_per_1m":0.3,"min_output_per_1m":1.5,"max_output_per_1m":1.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-coder-plus","name":"coder-plus","display_name":"Coder Plus","description":"An enhanced tier of Alibaba's Coder model offering improved code generation quality and broader programming language support.","creator":"alibaba","family":"alibaba","tier":"plus","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-coder-plus","qwen-coder-plus"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-coder-plus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.502,"max_input_per_1m":0.502,"min_output_per_1m":1.004,"max_output_per_1m":1.004,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-coder-turbo","name":"coder-turbo","display_name":"Coder Turbo","description":"A fast, cost-efficient LLM variant from Alibaba's Qwen ecosystem optimized for code generation and programming assistance tasks.","creator":"alibaba","family":"alibaba","tier":"turbo","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-coder-turbo","qwen-coder-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-coder-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.287,"max_input_per_1m":0.287,"min_output_per_1m":0.861,"max_output_per_1m":0.861,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-deep-research","name":"deep-research","display_name":"Deep Research","description":"An Alibaba LLM designed for in-depth, multi-step research tasks requiring extended reasoning and information synthesis.","creator":"alibaba","family":"alibaba","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-deep-research","qwen-deep-research"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-deep-research","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":7.742,"max_input_per_1m":7.742,"min_output_per_1m":23.367,"max_output_per_1m":23.367,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1-528b","name":"deepseek-r1-528b","display_name":"DeepSeek R1 528B","description":"A 528B-parameter variant of the DeepSeek R1 reasoning model, offering large-scale chain-of-thought reasoning capabilities.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":528,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["deepseek-r1-0528685","deepseek-r1-528b","together_ai/deepseek-ai/DeepSeek-R1-0528-tput"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1-528b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.55,"max_input_per_1m":0.574,"min_output_per_1m":2.19,"max_output_per_1m":2.294,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["together_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1-distill-qwen-7b","name":"deepseek-r1-distill-qwen-7b","display_name":"DeepSeek R1 Distill Qwen 7B","description":"A 7B Qwen-based model distilled from DeepSeek R1, providing efficient reasoning capabilities suitable for resource-constrained deployments.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":7,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/deepseek-r1-distill-qwen-7b","deepseek-llm-r1-distill-qwen-7b","deepseek-r1-distill-qwen-7b","fireworks_ai/accounts/fireworks/models/deepseek-r1-distill-qwen-7b","nscale/deepseek-ai/DeepSeek-R1-Distill-Qwen-7B"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1-distill-qwen-7b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.072,"max_input_per_1m":0.2,"min_output_per_1m":0.144,"max_output_per_1m":0.2,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3-671b","name":"deepseek-v3-671b","display_name":"DeepSeek V3 671B","description":"The full 671B-parameter release of DeepSeek V3, a MoE LLM with 37B activated parameters per token for efficient large-scale inference.","creator":"deepseek","family":"v3","tier":"","version":null,"type":"language","size_in_bn":671,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["deepseek-v3-671b","deepseek-v3671"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3-671b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.287,"max_input_per_1m":0.287,"min_output_per_1m":1.147,"max_output_per_1m":1.147,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3-2-exp","name":"deepseek-v3-2-exp","display_name":"DeepSeek V3.2 Exp","description":"An experimental DeepSeek V3.2 variant introducing the DeepSeek Sparse Attention mechanism for enhanced long-context processing efficiency.","creator":"deepseek","family":"deepseek-v3","tier":"exp","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["deepseek-v3-2-exp","deepseek-v3.2-exp685","deepseek/deepseek-v3.2-exp","novita/deepseek/deepseek-v3.2-exp","openrouter/deepseek/deepseek-v3.2-exp"],"hf_likes":988,"hf_downloads":218917,"hf_downloads_all_time":636879,"hf_trending_score":5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3-2-exp","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.27,"max_input_per_1m":0.287,"min_output_per_1m":0.41,"max_output_per_1m":0.431,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","novita","openrouter"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-doc-turbo","name":"doc-turbo","display_name":"Doc Turbo","description":"A fast Alibaba LLM variant optimized for document understanding and processing tasks.","creator":"alibaba","family":"alibaba","tier":"turbo","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-doc-turbo","qwen-doc-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-doc-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.087,"max_input_per_1m":0.087,"min_output_per_1m":0.144,"max_output_per_1m":0.144,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-flash","name":"flash","display_name":"Flash","description":"A lightweight, high-speed Alibaba LLM tier designed for low-latency inference on everyday tasks.","creator":"alibaba","family":"alibaba","tier":"flash","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-flash","dashscope/qwen-flash","dashscope/qwen-flash-2025-07-28","qwen-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.05,"max_input_per_1m":0.05,"min_output_per_1m":0.4,"max_output_per_1m":0.4,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-flash-us","name":"flash-us","display_name":"Flash US","description":"A US-region-routed variant of Alibaba's Flash-tier LLM for low-latency inference.","creator":"alibaba","family":"alibaba","tier":"flash","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-flash-us","qwen-flash-us"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-flash-us","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.05,"max_input_per_1m":0.05,"min_output_per_1m":0.4,"max_output_per_1m":0.4,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-long","name":"long","display_name":"Long","description":"An Alibaba LLM variant optimized for processing and generating content over extended context windows.","creator":"alibaba","family":"alibaba","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":10000000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-long","qwen-long-latest"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-long","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.072,"max_input_per_1m":0.072,"min_output_per_1m":0.287,"max_output_per_1m":0.287,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-math-plus","name":"math-plus","display_name":"Math Plus","description":"An Alibaba LLM variant specialized for mathematical reasoning and problem-solving with enhanced accuracy.","creator":"alibaba","family":"alibaba","tier":"plus","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":3072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-math-plus","qwen-math-plus"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-math-plus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.574,"max_input_per_1m":0.574,"min_output_per_1m":1.721,"max_output_per_1m":1.721,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-math-turbo","name":"math-turbo","display_name":"Math Turbo","description":"A fast Alibaba LLM variant tuned for mathematical reasoning tasks with a focus on speed and efficiency.","creator":"alibaba","family":"alibaba","tier":"turbo","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":3072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-math-turbo","qwen-math-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-math-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.287,"max_input_per_1m":0.287,"min_output_per_1m":0.861,"max_output_per_1m":0.861,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-mt-flash","name":"mt-flash","display_name":"MT Flash","description":"A fast-tier Alibaba machine translation model supporting multilingual translation with low latency.","creator":"alibaba","family":"alibaba","tier":"flash","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-mt-flash","qwen-mt-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-mt-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.16,"max_input_per_1m":0.16,"min_output_per_1m":0.49,"max_output_per_1m":0.49,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-mt-lite","name":"mt-lite","display_name":"MT Lite","description":"A lightweight Alibaba machine translation model designed for efficient multilingual translation at reduced cost.","creator":"alibaba","family":"alibaba","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-mt-lite","qwen-mt-lite"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-mt-lite","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":0.12,"min_output_per_1m":0.36,"max_output_per_1m":0.36,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-mt-plus","name":"mt-plus","display_name":"MT Plus","description":"An enhanced Alibaba machine translation model built on Qwen foundations, supporting translation across 92 languages with strong quality.","creator":"alibaba","family":"alibaba","tier":"plus","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["alibaba-mt-plus","novita/qwen/qwen-mt-plus","qwen-mt-plus","qwen/qwen-mt-plus"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-mt-plus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.25,"max_input_per_1m":2.46,"min_output_per_1m":0.75,"max_output_per_1m":7.37,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["novita"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-mt-turbo","name":"mt-turbo","display_name":"MT Turbo","description":"A high-speed Alibaba machine translation model optimized for throughput across a wide range of language pairs.","creator":"alibaba","family":"alibaba","tier":"turbo","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-mt-turbo","qwen-mt-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-mt-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.16,"max_input_per_1m":0.16,"min_output_per_1m":0.49,"max_output_per_1m":0.49,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-plus-character","name":"plus-character","display_name":"Plus Character","description":"An Alibaba LLM variant from the Plus tier with enhanced character-level or persona-driven conversational capabilities.","creator":"alibaba","family":"alibaba","tier":"plus","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":32768,"max_output_tokens":4000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-plus-character","qwen-plus-character"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-plus-character","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":0.5,"min_output_per_1m":1.4,"max_output_per_1m":1.4,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-plus-character-ja","name":"plus-character-ja","display_name":"Plus Character JA","description":"A Japanese-language variant of Alibaba's Plus Character LLM, optimized for persona-driven Japanese conversation.","creator":"alibaba","family":"alibaba","tier":"plus","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":512,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-plus-character-ja","qwen-plus-character-ja"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-plus-character-ja","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":0.5,"min_output_per_1m":1.4,"max_output_per_1m":1.4,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qvq-72b-preview","name":"qvq-72b-preview","display_name":"QVQ 72B Preview","description":"A 72B multimodal reasoning model from Alibaba's QvQ series designed for complex image-text-to-text understanding tasks.","creator":"alibaba","family":"qvq","tier":"","version":null,"type":"language","size_in_bn":72,"modalities":{"input":["text"],"output":["text"]},"context_window":32768,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-qvq-72b-preview","huggingface-vlm-qvq-72b-preview","qvq-72b-preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qvq-72b-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.721,"max_input_per_1m":1.721,"min_output_per_1m":5.161,"max_output_per_1m":5.161,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qvq-max","name":"qvq-max","display_name":"QVQ Max","description":"The top-tier variant of Alibaba's QvQ multimodal reasoning model for demanding visual question answering and analysis.","creator":"alibaba","family":"qvq","tier":"max","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["alibaba-qvq-max","qvq-max"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qvq-max","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.2,"max_input_per_1m":1.2,"min_output_per_1m":4.8,"max_output_per_1m":4.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}}],"pagination":{"page_size":50,"has_next":true,"next_token":"NTA","total_count":93},"meta":{"updated_at":"2026-06-13","request_id":"5355a172-eaf3-4819-82b5-eb0d751efb55","execution_ms":11}}