{"data":[{"id":"alibaba-qwen3-5-397b-a17b","name":"qwen3-5-397b-a17b","display_name":"Qwen3.5 397B A17B","description":"Alibaba's largest Qwen3.5 MoE model with 397B total parameters and 17B activated per token, targeting maximum capability for complex reasoning and generation.","creator":"alibaba","family":"qwen3_5_moe","tier":"","version":null,"type":"language","size_in_bn":397,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-16","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/qwen3p5-397b-a17b","alibaba-qwen3-5-397b-a17b","openrouter/qwen/qwen3.5-397b-a17b","qwen/qwen3.5-397b-a17b","Qwen/Qwen3.5-397B-A17B","qwen3-5-397b-a17b","qwen3-5-397b-a17b-non-reasoning","qwen3.5-397b-a17b","scaleway/qwen/qwen3.5-397b-a17b","together_ai/Qwen/Qwen3.5-397B-A17B"],"hf_likes":1462,"hf_downloads":710153,"hf_downloads_all_time":2631436,"hf_trending_score":11,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"alibaba-qwen3-5-397b-a17b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.385,"max_input_per_1m":0.71,"min_output_per_1m":2.45,"max_output_per_1m":4.25,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-6-35b-a3b","name":"qwen3-6-35b-a3b","display_name":"Qwen3.6 35B A3B","description":"Alibaba's flagship Qwen3.6 MoE model with 35B total parameters and 3B activated per token, built with 256 experts and direct community feedback integration.","creator":"alibaba","family":"qwen","tier":"","version":null,"type":"language","size_in_bn":35,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/qwen3p6-35b-a3b","alibaba-qwen3-6-35b-a3b","huggingface-vlm-qwen3-6-35b-a3b","libertai/qwen3.6-35b-a3b","pinstripes/ps/qwen3.6-35b-a3b","qwen/qwen3.6-35b-a3b","Qwen/Qwen3.6-35B-A3B","qwen3-6-35b-a3b","qwen3-6-35b-a3b-non-reasoning","qwen3.6-35b-a3b","scaleway/qwen/qwen3.6-35b-a3b"],"hf_likes":1495,"hf_downloads":1510129,"hf_downloads_all_time":1510129,"hf_trending_score":292,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"alibaba-qwen3-6-35b-a3b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.14,"max_input_per_1m":0.375,"min_output_per_1m":0.45,"max_output_per_1m":2.25,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","other/pinstripes"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-oss-120b","name":"gpt-oss-120b","display_name":"GPT OSS 120B","description":"A 120-billion-parameter open-weights GPT model from OpenAI designed for reasoning-intensive tasks with implicit caching support.","creator":"openai","family":"gpt_oss","tier":"","version":null,"type":"language","size_in_bn":120,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":23,"ids":["@cf/openai/gpt-oss-120b","accounts/fireworks/models/gpt-oss-120b","azure_ai/gpt-oss-120b","baseten/openai/gpt-oss-120b","bedrock_mantle/openai.gpt-oss-120b","cerebras/gpt-oss-120b","cloudflare/@cf/openai/gpt-oss-120b","crusoe/openai/gpt-oss-120b","databricks/databricks-gpt-oss-120b","deepinfra/openai/gpt-oss-120b","fireworks_ai/accounts/fireworks/models/gpt-oss-120b","fireworks_ai/gpt-oss-120b","gpt-oss-120b","gpt-oss-120b-low","gpt-oss-120b-maas","groq/openai/gpt-oss-120b","lemonade/gpt-oss-120b-mxfp-GGUF","novita/openai/gpt-oss-120b","ollama/gpt-oss:120b-cloud","openai-gpt-oss-120b","openai-reasoning-gpt-oss-120b","openai.gpt-oss-120b-1:0","openai/gpt-oss-120b","openai/gpt-oss-120b:free","openrouter/openai/gpt-oss-120b","ovhcloud/gpt-oss-120b","publishers/google/models/gpt-oss-120b-maas","replicate/openai/gpt-oss-120b","sambanova/gpt-oss-120b","scaleway/openai/gpt-oss-120b","tensormesh/openai/gpt-oss-120b","together_ai/openai/gpt-oss-120b","vertex_ai/openai/gpt-oss-120b-maas","wandb/openai/gpt-oss-120b","watsonx/openai/gpt-oss-120b"],"hf_likes":4719,"hf_downloads":3524674,"hf_downloads_all_time":32348365,"hf_trending_score":25,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"openai-gpt-oss-120b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.03,"max_input_per_1m":15,"min_output_per_1m":0.15,"max_output_per_1m":60,"min_cache_read_per_1m":0.015,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":23},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-coder-30b-a3b-instruct","name":"qwen3-coder-30b-a3b-instruct","display_name":"Qwen3 Coder 30B A3B Instruct","description":"An instruction-tuned Qwen3 MoE coding model with 30B total and 3B active parameters, designed for agentic programming tasks and tool-integrated workflows.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":30,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-06-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-07-31","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["accounts/fireworks/models/qwen3-coder-30b-a3b-instruct","alibaba-qwen3-coder-30b-a3b-instruct","fireworks_ai/accounts/fireworks/models/qwen3-coder-30b-a3b-instruct","huggingface-reasoning-qwen3-coder-30b-a3b-instruct","lemonade/Qwen3-Coder-30B-A3B-Instruct-GGUF","novita/qwen/qwen3-coder-30b-a3b-instruct","qwen/qwen3-coder-30b-a3b-instruct","qwen3-coder-30b-a3b-instruct","scaleway/qwen/qwen3-coder-30b-a3b-instruct"],"hf_likes":1018,"hf_downloads":2406663,"hf_downloads_all_time":7798034,"hf_trending_score":10,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"alibaba-qwen3-coder-30b-a3b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.07,"max_input_per_1m":0.45,"min_output_per_1m":0.26,"max_output_per_1m":2.25,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","novita","openrouter"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-235b-a22b-instruct","name":"qwen3-235b-a22b-instruct","display_name":"Qwen3 235B A22B Instruct","description":"An instruction-tuned update of the Qwen3 235B A22B MoE model with significant improvements in instruction following, logical reasoning, and general capabilities.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":235,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":11,"ids":["accounts/fireworks/models/qwen3-235b-a22b-instruct-2507","alibaba-qwen3-235b-a22b-instruct","crusoe/Qwen/Qwen3-235B-A22B-Instruct-2507","deepinfra/Qwen/Qwen3-235B-A22B-Instruct-2507","fireworks_ai/accounts/fireworks/models/qwen3-235b-a22b-instruct-2507","novita/qwen/qwen3-235b-a22b-instruct-2507","qwen/qwen3-235b-a22b-instruct-2507","Qwen/Qwen3-235B-A22B-Instruct-2507","qwen3-235b-a22b-instruct","qwen3-235b-a22b-instruct-2507","replicate/qwen/qwen3-235b-a22b-instruct-2507","scaleway/qwen/qwen3-235b-a22b-instruct-2507","wandb/Qwen/Qwen3-235B-A22B-Instruct-2507"],"hf_likes":773,"hf_downloads":150781,"hf_downloads_all_time":1182969,"hf_trending_score":1,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"alibaba-qwen3-235b-a22b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.09,"max_input_per_1m":10,"min_output_per_1m":0.58,"max_output_per_1m":10,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["deepinfra","huggingface","novita"],"provider_count":11},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-3-70b-instruct","name":"llama-3-3-70b-instruct","display_name":"Llama 3.3 70B Instruct","description":"Meta's 70B instruction-tuned LLM from Llama 3.3, optimized for complex instruction-following and deployed across multiple cloud regions.","creator":"meta","family":"llama","tier":"","version":"3-3","type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":120000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-12","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-12-06","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":21,"ids":["accounts/fireworks/models/llama-v3p3-70b-instruct","azure_ai/Llama-3.3-70B-Instruct","crusoe/meta-llama/Llama-3.3-70B-Instruct","databricks/databricks-meta-llama-3-3-70b-instruct","deepinfra/meta-llama/Llama-3.3-70B-Instruct","fireworks_ai/accounts/fireworks/models/llama-v3p3-70b-instruct","gradient_ai/llama3.3-70b-instruct","groq/llama-3.3-70b-versatile","hyperbolic/meta-llama/Llama-3.3-70B-Instruct","lambda_ai/llama3.3-70b-instruct-fp8","llama-3-3-instruct-70b","llama-3.3-70b-instruct-maas","meta_llama/Llama-3.3-70B-Instruct","meta-llama-3-3-70b-instruct","meta-llama/llama-3.3-70b-instruct","meta-llama/llama-3.3-70b-instruct:free","meta-textgeneration-llama-3-3-70b-instruct","meta.llama3-3-70b-instruct-v1:0","meta.llama3-3-70b-instruct-v1:0:128k","nebius/meta-llama/Llama-3.3-70B-Instruct","novita/meta-llama/llama-3.3-70b-instruct","nscale/meta-llama/Llama-3.3-70B-Instruct","oci/meta.llama-3.3-70b-instruct","oci/meta.llama-3.3-70b-instruct-fp8-dynamic","ovhcloud/Meta-Llama-3_3-70B-Instruct","publishers/google/models/llama-3.3-70b-instruct-maas","publishers/meta/models/llama-3.3-70b-instruct-maas","sambanova/Meta-Llama-3.3-70B-Instruct","scaleway/meta/llama-3.3-70b-instruct","together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo-Free","us.meta.llama3-3-70b-instruct-v1:0","wandb/meta-llama/Llama-3.3-70B-Instruct","watsonx/meta-llama/llama-3-3-70b-instruct"],"hf_likes":2731,"hf_downloads":496024,"hf_downloads_all_time":10779619,"hf_trending_score":1.5,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"meta-llama-3-3-70b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":71,"min_output_per_1m":0.2,"max_output_per_1m":71,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":21},"providers":[],"regions":[],"region_info":{}}},{"id":"baai-bge-multilingual-gemma2","name":"bge-multilingual-gemma2","display_name":"BGE Multilingual Gemma2","description":"A multilingual text embedding model built on the Gemma 2 architecture, enabling high-quality cross-lingual semantic representations.","creator":"baai","family":"embed","tier":"","version":null,"type":"embedding","size_in_bn":null,"modalities":{"input":["text"],"output":["embedding"]},"context_window":8192,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["baai-bge-multilingual-gemma2","nebius/BAAI/bge-multilingual-gemma2","scaleway/BAAI/bge-multilingual-gemma2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"baai-bge-multilingual-gemma2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.01,"max_input_per_1m":0.1,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["nebius"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-devstral-2-123b-instruct","name":"devstral-2-123b-instruct","display_name":"Devstral 2 123B Instruct","description":"A 123B-parameter instruction-tuned LLM in Mistral's Devstral series, purpose-built for software engineering and agentic coding tasks.","creator":"mistral","family":"devstral","tier":"","version":"2","type":"language","size_in_bn":123,"modalities":{"input":["text"],"output":["text"]},"context_window":200000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["mistral-devstral-2-123b-instruct","scaleway/mistralai/devstral-2-123b-instruct-2512"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"mistral-devstral-2-123b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.4,"max_input_per_1m":0.4,"min_output_per_1m":2,"max_output_per_1m":2,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["scaleway"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemma-3-27b-instruct","name":"gemma-3-27b-instruct","display_name":"Gemma 3 27B Instruct","description":"An instruction-tuned 27B Gemma 3 LLM with multimodal vision-language input and 128k context window.","creator":"google","family":"gemma3","tier":"","version":"3","type":"language","size_in_bn":27,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-08-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-03-12","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["accounts/fireworks/models/gemma-3-27b-it","deepinfra/google/gemma-3-27b-it","fireworks_ai/accounts/fireworks/models/gemma-3-27b-it","gemini/gemma-3-27b-it","google-gemma-3-27b-instruct","google.gemma-3-27b-it","google/gemma-3-27b-it","google/gemma-3-27b-it:free","huggingface-vlm-gemma-3-27b-instruct","nebius/google/gemma-3-27b-it","novita/google/gemma-3-27b-it","scaleway/google/gemma-3-27b-it"],"hf_likes":1956,"hf_downloads":567671,"hf_downloads_all_time":12733530,"hf_trending_score":2,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"google-gemma-3-27b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.06,"max_input_per_1m":0.9,"min_output_per_1m":0.16,"max_output_per_1m":0.9,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["nebius"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemma-4-26b-a4b-instruct","name":"gemma-4-26b-a4b-instruct","display_name":"Gemma 4 26B A4B IT","description":"Instruction-tuned MoE variant of Gemma 4 with 26B total and 4B active parameters, supporting vision, tool use, and file input.","creator":"google","family":"gemma4","tier":"","version":"4","type":"language","size_in_bn":26,"modalities":{"input":["image","pdf","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemma","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-03","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["@cf/google/gemma-4-26b-a4b-it","accounts/fireworks/models/gemma-4-26b-a4b-it","cloudflare/@cf/google/gemma-4-26b-a4b-it","gemma-4-26b-a4b-it-maas","google-gemma-4-26b-a4b-instruct","google/gemma-4-26b-a4b-it","google/gemma-4-26B-A4B-it","google/gemma-4-26b-a4b-it:free","huggingface-vlm-gemma-4-26b-a4b-it","publishers/google/models/gemma-4-26b-a4b-it-maas","scaleway/google/gemma-4-26b-a4b-it","vertex_ai/google/gemma-4-26b-a4b-it-maas"],"hf_likes":751,"hf_downloads":3113602,"hf_downloads_all_time":3115675,"hf_trending_score":92,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"google-gemma-4-26b-a4b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.06,"max_input_per_1m":0.25,"min_output_per_1m":0.3,"max_output_per_1m":0.6,"min_cache_read_per_1m":0.015,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"hcompany-holo-2-30b-a3b","name":"holo-2-30b-a3b","display_name":"Holo 2 30B A3B","description":"A 30B-parameter MoE LLM from H Company with 3B active parameters, representing the second generation of the Holo model series.","creator":"hcompany","family":"holo","tier":"","version":"2","type":"language","size_in_bn":30,"modalities":{"input":["image"],"output":["text"]},"context_window":22000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["hcompany-holo-2-30b-a3b","scaleway/hcompany/holo2-30b-a3b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"hcompany-holo-2-30b-a3b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.3,"max_input_per_1m":0.3,"min_output_per_1m":0.7,"max_output_per_1m":0.7,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["scaleway"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-medium-3-5-128b","name":"mistral-medium-3-5-128b","display_name":"Mistral Medium 3.5 128B","description":"A 128B-parameter mid-tier LLM from Mistral at version 3.5, balancing strong reasoning capability with practical deployment scale.","creator":"mistral","family":"mistral","tier":"","version":"3-5-128b","type":"language","size_in_bn":null,"modalities":{"input":["image"],"output":["text"]},"context_window":256000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["mistral-medium-3-5-128b","scaleway/mistralai/mistral-medium-3.5-128b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"mistral-medium-3-5-128b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":1.5,"max_input_per_1m":1.5,"min_output_per_1m":7.5,"max_output_per_1m":7.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["scaleway"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-small-3-2-24b-instruct","name":"mistral-small-3-2-24b-instruct","display_name":"Mistral Small 3.2 24B Instruct","description":"A 24B-parameter instruction-tuned multimodal LLM representing the 3.2 update of Mistral's Small series with enhanced vision and text capabilities.","creator":"mistral","family":"mistral","tier":"","version":"3-2","type":"language","size_in_bn":24,"modalities":{"input":["image","text"],"output":["text"]},"context_window":128000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-10-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-06-20","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["deepinfra/mistralai/Mistral-Small-3.2-24B-Instruct-2506","huggingface-vlm-mistral-small-3-2-24b-instruct-2506","mistral-small-3-2-24b-instruct","mistralai/mistral-small-3.2-24b-instruct","mistralai/Mistral-Small-3.2-24B-Instruct-2506","openrouter/mistralai/mistral-small-3.2-24b-instruct","ovhcloud/Mistral-Small-3.2-24B-Instruct-2506","scaleway/mistralai/mistral-small-3.2-24b-instruct-2506"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"mistral-small-3-2-24b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.075,"max_input_per_1m":0.15,"min_output_per_1m":0.2,"max_output_per_1m":0.35,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["deepinfra","openrouter"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-pixtral-12b","name":"mistral-pixtral-12b","display_name":"Pixtral 12B","description":"A 12B-parameter multimodal LLM from Mistral supporting vision and tool-use, capable of processing both images and text for image-text-to-text tasks.","creator":"mistral","family":"pixtral","tier":"","version":null,"type":"language","size_in_bn":12,"modalities":{"input":["image"],"output":["text"]},"context_window":128000,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-09-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["huggingface-vlm-mistral-pixtral-12b-2409","mistral-pixtral-12b","mistral/pixtral-12b","mistral/pixtral-12b-2409","scaleway/mistralai/pixtral-12b-2409","vercel_ai_gateway/mistral/pixtral-12b","watsonx/mistralai/pixtral-12b-2409"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"mistral-pixtral-12b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":0.35,"min_output_per_1m":0.15,"max_output_per_1m":0.35,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["mistral","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-embedding-8b","name":"qwen3-embedding-8b","display_name":"Qwen3 Embedding 8B","description":"An 8B-parameter text embedding model from the Qwen3 series with strong multilingual capabilities and long-context support for retrieval and ranking tasks.","creator":"alibaba","family":"qwen3","tier":"","version":null,"type":"embedding","size_in_bn":8,"modalities":{"input":["text"],"output":["embedding"]},"context_window":40960,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-06-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/qwen3-embedding-8b","alibaba-qwen3-embedding-8b","alibaba/qwen3-embedding-8b","llamagate/qwen3-embedding-8b","novita/qwen/qwen3-embedding-8b","Qwen/Qwen3-Embedding-8B","scaleway/qwen/qwen3-embedding-8b"],"hf_likes":656,"hf_downloads":1900241,"hf_downloads_all_time":10616532,"hf_trending_score":9,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"alibaba-qwen3-embedding-8b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.02,"max_input_per_1m":0.1,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["other/llamagate"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-voxtral-small","name":"voxtral-small","display_name":"Voxtral Small 24B","description":"A 24B-parameter audio-language model from Mistral built on Mistral Small 3, excelling at speech transcription, translation, and audio understanding.","creator":"mistral","family":"voxtral","tier":"small","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["audio","text"],"output":["text"]},"context_window":128000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-30","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["mistral-voxtral-small","mistral.voxtral-small-24b-2507","mistralai/voxtral-small-24b-2507","mistralai/Voxtral-Small-24B-2507","scaleway/mistralai/voxtral-small-24b-2507"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-26 08:02:07","pricing":{"model_id":"mistral-voxtral-small","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-27","ingestion_date":"2026-06-26","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":0.15,"min_output_per_1m":0.3,"max_output_per_1m":0.35,"min_cache_read_per_1m":0.01,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","openrouter"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}}],"pagination":{"page_size":50,"has_next":false,"next_token":null,"total_count":16},"meta":{"updated_at":"2026-06-26","request_id":"5ff481cc-98a9-49a0-a94a-423844e392df","execution_ms":10}}