{"data":[{"id":"anthropic-claude-5-fable","name":"claude-5-fable","display_name":"Claude Fable 5","description":"A highly capable Claude LLM optimized for demanding reasoning and long-horizon agentic tasks, with vision, tool-use, and explicit-caching support.","creator":"anthropic","family":"claude","tier":"fable","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-06-09","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["anthropic-claude-5-fable","anthropic.claude-fable-5","anthropic/claude-fable-5","au.anthropic.claude-fable-5","azure_ai/claude-fable-5","claude-fable-5","eu.anthropic.claude-fable-5","global.anthropic.claude-fable-5","publishers/anthropic/models/claude-fable-5","publishers/google/models/claude-fable-5","us.anthropic.claude-fable-5","vertex_ai/claude-fable-5","vertex_ai/claude-fable-5@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-5-fable","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":10,"max_input_per_1m":12,"min_output_per_1m":50,"max_output_per_1m":60,"min_cache_read_per_1m":1,"min_cache_write_per_1m":12.5,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-8-opus","name":"claude-4-8-opus","display_name":"Claude Opus 4.8","description":"A flagship Anthropic LLM in the Claude Opus tier at version 4.8, supporting adaptive reasoning, vision, tool use, file input, and web search across multiple geographic regions.","creator":"anthropic","family":"claude","tier":"opus","version":"4-8","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-05-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-8-opus","anthropic.claude-opus-4-8","anthropic/claude-opus-4-8","anthropic/claude-opus-4.8","au.anthropic.claude-opus-4-8","azure_ai/claude-opus-4-8","claude-opus-4-8","eu.anthropic.claude-opus-4-8","global.anthropic.claude-opus-4-8","jp.anthropic.claude-opus-4-8","publishers/anthropic/models/claude-opus-4-8","publishers/google/models/claude-opus-4-8","us.anthropic.claude-opus-4-8","vertex_ai/claude-opus-4-8","vertex_ai/claude-opus-4-8@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-8-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-7-opus","name":"claude-4-7-opus","display_name":"Claude Opus 4.7","description":"Anthropic's Claude 4.7 Opus model with adaptive reasoning at maximum effort, vision, and tool-use for complex enterprise tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-7","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-04-16","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-7-opus","anthropic.claude-opus-4-7","anthropic/claude-opus-4-7","anthropic/claude-opus-4.7","au.anthropic.claude-opus-4-7","azure_ai/claude-opus-4-7","claude-opus-4-7","claude-opus-4-7-20260416","claude-opus-4-7-non-reasoning","eu.anthropic.claude-opus-4-7","global.anthropic.claude-opus-4-7","jp.anthropic.claude-opus-4-7","openrouter/anthropic/claude-opus-4.7","perplexity/anthropic/claude-opus-4-7","publishers/anthropic/models/claude-opus-4-7","publishers/google/models/claude-opus-4-7","us.anthropic.claude-opus-4-7","vertex_ai/claude-opus-4-7","vertex_ai/claude-opus-4-7@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-7-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-1-pro-preview","name":"gemini-3-1-pro-preview","display_name":"Gemini 3.1 Pro Preview","description":"A preview release of Gemini 3.1 Pro providing early access to its frontier reasoning, vision, and tool-use capabilities.","creator":"google","family":"gemini","tier":"pro","version":"3-1","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-19","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["gemini-3-1-pro-preview","gemini-3.1-pro-preview","gemini/gemini-3.1-pro-preview","google-gemini-3-1-pro-preview","google/gemini-3.1-pro-preview","openrouter/google/gemini-3.1-pro-preview","publishers/google/models/gemini-3.1-pro-preview","vertex_ai/gemini-3.1-pro-preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-1-pro-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2,"min_output_per_1m":12,"max_output_per_1m":12,"min_cache_read_per_1m":0.2,"min_cache_write_per_1m":0.375,"min_reasoning_per_1m":12,"cheapest_providers":["google_gemini","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-5-flash","name":"gemini-3-5-flash","display_name":"Gemini 3.5 Flash","description":"A fast, efficient Gemini 3.5 model optimized for high-throughput tasks with support for reasoning, vision, tool use, and web search.","creator":"google","family":"gemini","tier":"flash","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-05-19","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["gemini-3-5-flash","gemini-3-5-flash-medium","gemini-3-5-flash-minimal","gemini-3.5-flash","gemini/gemini-3.5-flash","google-gemini-3-5-flash","google/gemini-3.5-flash","publishers/google/models/gemini-3.5-flash","vertex_ai/gemini-3.5-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-5-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.5,"max_input_per_1m":1.8,"min_output_per_1m":9,"max_output_per_1m":10.8,"min_cache_read_per_1m":0.15,"min_cache_write_per_1m":0.0833333333,"min_reasoning_per_1m":9,"cheapest_providers":["google_gemini","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-5","name":"glm-5","display_name":"GLM-5","description":"An open-source MoE LLM from Z AI designed for long-context reasoning, multi-step tool orchestration, and complex agentic engineering tasks.","creator":"zhipu","family":"glm_moe_dsa","tier":"","version":"5","type":"language","size_in_bn":753.864,"modalities":{"input":["pdf","text"],"output":["text"]},"context_window":202800,"max_output_tokens":131100,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["accounts/fireworks/models/glm-5","baseten/zai-org/GLM-5","bedrock/us-east-1/zai.glm-5","bedrock/us-west-2/zai.glm-5","glm-5","glm-5-maas","glm-5-non-reasoning","openrouter/z-ai/glm-5","publishers/google/models/glm-5-maas","vertex_ai/zai-org/glm-5-maas","z-ai/glm-5","zai-org/glm-5","zai-org/GLM-5","zai.glm-5","zai/glm-5","zhipu-glm-5"],"hf_likes":2070,"hf_downloads":477667,"hf_downloads_all_time":777726,"hf_trending_score":5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.573,"max_input_per_1m":1,"min_output_per_1m":1.92,"max_output_per_1m":3.2,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":0.1,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-pro","name":"gemini-3-pro","display_name":"Gemini 3 Pro","description":"Google's pro-tier LLM in the Gemini 3 generation offering frontier multimodal reasoning, coding, and tool-use capabilities.","creator":"google","family":"gemini","tier":"pro","version":"3","type":"language","size_in_bn":null,"modalities":{"input":["image"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["gemini-3-pro","gemini-3-pro-low","google-gemini-3-pro","replicate/google/gemini-3-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":4,"min_output_per_1m":12,"max_output_per_1m":18,"min_cache_read_per_1m":null,"min_cache_write_per_1m":0.2,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai","replicate"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-opus","name":"claude-4-6-opus","display_name":"Claude Opus 4.6","description":"Anthropic's high-capability Claude 4.6 Opus model with advanced reasoning, vision, and tool-use for demanding workloads.","creator":"anthropic","family":"claude","tier":"opus","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-05","earliest_deprecation_date":"2026-06-29","deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-opus","anthropic.claude-opus-4-6-v1","anthropic/claude-opus-4.6","anthropic/claude-opus-4.6-fast","au.anthropic.claude-opus-4-6-v1","azure_ai/claude-opus-4-6","claude-opus-4-6","claude-opus-4-6-20260205","claude-opus-4-6-adaptive","eu.anthropic.claude-opus-4-6-v1","github_copilot/claude-opus-4.6-fast","global.anthropic.claude-opus-4-6-v1","openrouter/anthropic/claude-opus-4.6","perplexity/anthropic/claude-opus-4-6","publishers/anthropic/models/claude-opus-4-6","publishers/google/models/claude-opus-4-6","us.anthropic.claude-opus-4-6-v1","vercel_ai_gateway/anthropic/claude-opus-4.6","vertex_ai/claude-opus-4-6","vertex_ai/claude-opus-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":30,"min_output_per_1m":25,"max_output_per_1m":150,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-sonnet","name":"claude-4-6-sonnet","display_name":"Claude Sonnet 4.6","description":"A capable Claude 4.6 Sonnet model with reasoning, vision, and tool-use support for a wide range of applications.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-sonnet","anthropic.claude-sonnet-4-6","anthropic/claude-sonnet-4-6","anthropic/claude-sonnet-4.6","au.anthropic.claude-sonnet-4-6","azure_ai/claude-sonnet-4-6","claude-sonnet-4-6","claude-sonnet-4-6-adaptive","claude-sonnet-4-6-non-reasoning-low-effort","eu.anthropic.claude-sonnet-4-6","global.anthropic.claude-sonnet-4-6","jp.anthropic.claude-sonnet-4-6","openrouter/anthropic/claude-sonnet-4.6","publishers/anthropic/models/claude-sonnet-4-6","publishers/google/models/claude-sonnet-4-6","snowflake/claude-sonnet-4-6","us.anthropic.claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":3,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-opus","name":"claude-4-5-opus","display_name":"Claude Opus 4.5","description":"Anthropic's flagship Claude 4.5 model with top-tier reasoning, vision, and tool-use capabilities for complex tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":64000,"tool_use_system_prompt_tokens":159,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["anthropic-claude-4-5-opus","anthropic.claude-opus-4-5-20251101-v1:0","anthropic/claude-opus-4.5","azure_ai/claude-opus-4-5","claude-opus-4-5","claude-opus-4-5-20251101","claude-opus-4-5-thinking","claude-opus-4-5@20251101","databricks/databricks-claude-opus-4-5","eu.anthropic.claude-opus-4-5-20251101-v1:0","github_copilot/claude-opus-4.5","global.anthropic.claude-opus-4-5-20251101-v1:0","gmi/anthropic/claude-opus-4.5","openrouter/anthropic/claude-opus-4.5","perplexity/anthropic/claude-opus-4-5","publishers/anthropic/models/claude-opus-4-5","publishers/google/models/claude-opus-4-5","us.anthropic.claude-opus-4-5-20251101-v1:0","vercel_ai_gateway/anthropic/claude-opus-4.5","vertex_ai/claude-opus-4-5","vertex_ai/claude-opus-4-5@20251101"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","gmi","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-4-7","name":"glm-4-7","display_name":"GLM-4.7","description":"A multilingual MoE LLM from Z AI designed for complex reasoning, agentic coding, and tool use, building on the GLM-4.6 architecture.","creator":"zhipu","family":"glm4_moe","tier":"","version":"4-7","type":"language","size_in_bn":358.338,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":204800,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-22","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":13,"ids":["accounts/fireworks/models/glm-4p7","baseten/zai-org/GLM-4.7","cerebras/zai-glm-4.7","fireworks_ai/accounts/fireworks/models/glm-4p7","fireworks_ai/glm-4p7","glm-4-7","glm-4-7-251222","glm-4-7-non-reasoning","glm-4.7","glm-4.7-maas","novita/zai-org/glm-4.7","openrouter/z-ai/glm-4.7","publishers/google/models/glm-4.7-maas","together_ai/zai-org/GLM-4.7","vertex_ai/zai-org/glm-4.7-maas","z-ai/glm-4.7","zai-org/glm-4.7","zai-org/GLM-4.7","zai.glm-4.7","zai/glm-4.7","zhipu-glm-4-7"],"hf_likes":2026,"hf_downloads":117151,"hf_downloads_all_time":436300,"hf_trending_score":4,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-4-7","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.4,"max_input_per_1m":2.25,"min_output_per_1m":1.75,"max_output_per_1m":2.75,"min_cache_read_per_1m":0.08,"min_cache_write_per_1m":0.06,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":13},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-sonnet","name":"claude-4-5-sonnet","display_name":"Claude Sonnet 4.5","description":"A versatile Claude 4.5 model with strong reasoning, vision, and tool-use capabilities suited for a broad range of tasks.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":64000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":"2025-07","supported_reasoning_efforts":["default"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["anthropic-claude-4-5-sonnet","anthropic.claude-sonnet-4-5-20250929-v1:0","anthropic/claude-sonnet-4.5","au.anthropic.claude-sonnet-4-5-20250929-v1:0","azure_ai/claude-sonnet-4-5","bedrock/us-gov-east-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-east-1/claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/claude-sonnet-4-5-20250929-v1:0","claude-4-5-sonnet","claude-4-5-sonnet-thinking","claude-sonnet-4-5","claude-sonnet-4-5-20250929","claude-sonnet-4-5-20250929-v1:0","claude-sonnet-4-5@20250929","databricks/databricks-claude-sonnet-4-5","eu.anthropic.claude-sonnet-4-5-20250929-v1:0","github_copilot/claude-sonnet-4.5","global.anthropic.claude-sonnet-4-5-20250929-v1:0","gmi/anthropic/claude-sonnet-4.5","jp.anthropic.claude-sonnet-4-5-20250929-v1:0","openrouter/anthropic/claude-sonnet-4.5","perplexity/anthropic/claude-sonnet-4-5","publishers/anthropic/models/claude-sonnet-4-5","publishers/google/models/claude-sonnet-4-5","replicate/anthropic/claude-4.5-sonnet","snowflake/claude-sonnet-4-5","us-gov.anthropic.claude-sonnet-4-5-20250929-v1:0","us.anthropic.claude-sonnet-4-5-20250929-v1:0","vercel_ai_gateway/anthropic/claude-sonnet-4.5","vertex_ai/claude-sonnet-4-5","vertex_ai/claude-sonnet-4-5@20250929"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.99999,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"minimax-m2","name":"minimax-m2","display_name":"MiniMax M2","description":"MiniMax's second-generation MoE language model with reasoning and tool-use capabilities, built for complex agentic and productivity workflows.","creator":"minimax","family":"mixtral","tier":"","version":null,"type":"language","size_in_bn":228.704,"modalities":{"input":["text"],"output":["text"]},"context_window":205000,"max_output_tokens":196608,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["accounts/fireworks/models/minimax-m2","fireworks_ai/accounts/fireworks/models/minimax-m2","huggingface-llm-minimax-m2","minimax-m2","minimax.minimax-m2","minimax/minimax-m2","minimax/MiniMax-M2","novita/minimax/minimax-m2","openrouter/minimax/minimax-m2"],"hf_likes":1491,"hf_downloads":69357,"hf_downloads_all_time":1925616,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"minimax-m2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.255,"max_input_per_1m":0.3,"min_output_per_1m":1,"max_output_per_1m":1.2,"min_cache_read_per_1m":0.03,"min_cache_write_per_1m":0.03,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-flash","name":"gemini-3-flash","display_name":"Gemini 3 Flash","description":"Google's fast, frontier-intelligence LLM in the Gemini 3 generation combining speed with strong reasoning, search grounding, and multimodal capabilities.","creator":"google","family":"gemini","tier":"flash","version":"3","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf"],"output":["text"]},"context_window":1000000,"max_output_tokens":65000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-12-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["gemini-3-flash","gemini-3-flash-reasoning","google-gemini-3-flash","google/gemini-3-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":0.5,"min_output_per_1m":3,"max_output_per_1m":3,"min_cache_read_per_1m":0.05,"min_cache_write_per_1m":0.05,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai","vercel_ai_gateway"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-1-flash-lite-preview","name":"gemini-3-1-flash-lite-preview","display_name":"Gemini 3.1 Flash Lite Preview","description":"A preview release of Gemini 3.1 Flash Lite offering early evaluation of its lightweight reasoning, vision, and tool-use capabilities.","creator":"google","family":"gemini","tier":"flash-lite","version":"3-1","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-03","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["gemini-3-1-flash-lite-preview","gemini-3.1-flash-lite-preview","gemini/gemini-3.1-flash-lite-preview","google-gemini-3-1-flash-lite-preview","google/gemini-3.1-flash-lite-preview","openrouter/google/gemini-3.1-flash-lite-preview","publishers/google/models/gemini-3.1-flash-lite-preview","vertex_ai/gemini-3.1-flash-lite-preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-1-flash-lite-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.25,"max_input_per_1m":0.25,"min_output_per_1m":1.5,"max_output_per_1m":1.5,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":0.025,"min_reasoning_per_1m":1.5,"cheapest_providers":["google_gemini","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-oss-120b","name":"gpt-oss-120b","display_name":"GPT OSS 120B","description":"A 120-billion-parameter open-weights GPT model from OpenAI designed for reasoning-intensive tasks with implicit caching support.","creator":"openai","family":"gpt_oss","tier":"","version":null,"type":"language","size_in_bn":120,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":21,"ids":["@cf/openai/gpt-oss-120b","accounts/fireworks/models/gpt-oss-120b","azure_ai/gpt-oss-120b","baseten/openai/gpt-oss-120b","bedrock_mantle/openai.gpt-oss-120b","cerebras/gpt-oss-120b","crusoe/openai/gpt-oss-120b","databricks/databricks-gpt-oss-120b","deepinfra/openai/gpt-oss-120b","fireworks_ai/accounts/fireworks/models/gpt-oss-120b","gpt-oss-120b","gpt-oss-120b-low","gpt-oss-120b-maas","groq/openai/gpt-oss-120b","lemonade/gpt-oss-120b-mxfp-GGUF","novita/openai/gpt-oss-120b","ollama/gpt-oss:120b-cloud","openai-gpt-oss-120b","openai-reasoning-gpt-oss-120b","openai.gpt-oss-120b-1:0","openai/gpt-oss-120b","openai/gpt-oss-120b:free","openrouter/openai/gpt-oss-120b","ovhcloud/gpt-oss-120b","publishers/google/models/gpt-oss-120b-maas","replicate/openai/gpt-oss-120b","sambanova/gpt-oss-120b","together_ai/openai/gpt-oss-120b","vertex_ai/openai/gpt-oss-120b-maas","wandb/openai/gpt-oss-120b","watsonx/openai/gpt-oss-120b"],"hf_likes":4719,"hf_downloads":3524674,"hf_downloads_all_time":32348365,"hf_trending_score":25,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-oss-120b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.039,"max_input_per_1m":15,"min_output_per_1m":0.18,"max_output_per_1m":60,"min_cache_read_per_1m":0.075,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":21},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3-2","name":"v3-2","display_name":"DeepSeek V3.2","description":"DeepSeek's V3.2 MoE LLM featuring implicit caching support and improved tool-use capabilities over the V3.1 generation.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["accounts/fireworks/models/deepseek-v3p2","azure_ai/deepseek-v3.2","bedrock/ap-northeast-1/deepseek.v3.2","bedrock/ap-south-1/deepseek.v3.2","bedrock/ap-southeast-3/deepseek.v3.2","bedrock/eu-north-1/deepseek.v3.2","bedrock/sa-east-1/deepseek.v3.2","bedrock/us-east-1/deepseek.v3.2","bedrock/us-east-2/deepseek.v3.2","bedrock/us-west-2/deepseek.v3.2","deepseek-ai/DeepSeek-V3.2","deepseek-llm-deepseek-v3-2","deepseek-v3-2","deepseek-v3-2-251201","deepseek-v3-2-reasoning","deepseek-v3.2-maas","deepseek-v3.2685","deepseek.v3.2","deepseek/deepseek-v3.2","eu.deepseek.v3.2","fireworks_ai/accounts/fireworks/models/deepseek-v3p2","gmi/deepseek-ai/DeepSeek-V3.2","novita/deepseek/deepseek-v3.2","openrouter/deepseek/deepseek-v3.2","publishers/google/models/deepseek-v3.2-maas","us.deepseek.v3.2","vertex_ai/deepseek-ai/deepseek-v3.2-maas"],"hf_likes":1413,"hf_downloads":10366446,"hf_downloads_all_time":11229842,"hf_trending_score":6,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2288,"max_input_per_1m":0.62,"min_output_per_1m":0.3432,"max_output_per_1m":1.85,"min_cache_read_per_1m":0.028,"min_cache_write_per_1m":0.056,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":12},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-haiku","name":"claude-4-5-haiku","display_name":"Claude Haiku 4.5","description":"A fast, lightweight Claude 4.5 model with vision, file input, and tool-use support optimized for low-latency applications.","creator":"anthropic","family":"claude","tier":"haiku","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":64000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-02","training_data_cutoff":"2025-07","supported_reasoning_efforts":["default"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-15","earliest_deprecation_date":"2026-10-15","deprecated":false,"has_pricing":true,"provider_count":9,"ids":["anthropic-claude-4-5-haiku","anthropic.claude-haiku-4-5-20251001-v1:0","anthropic.claude-haiku-4-5@20251001","anthropic/claude-haiku-4-5","anthropic/claude-haiku-4.5","apac.anthropic.claude-haiku-4-5-20251001-v1:0","au.anthropic.claude-haiku-4-5-20251001-v1:0","azure_ai/claude-haiku-4-5","bedrock/us-gov-east-1/anthropic.claude-haiku-4-5-20251001-v1:0","bedrock/us-gov-west-1/anthropic.claude-haiku-4-5-20251001-v1:0","claude-4-5-haiku","claude-4-5-haiku-reasoning","claude-haiku-4-5","claude-haiku-4-5-20251001","claude-haiku-4-5@20251001","databricks/databricks-claude-haiku-4-5","eu.anthropic.claude-haiku-4-5-20251001-v1:0","github_copilot/claude-haiku-4.5","global.anthropic.claude-haiku-4-5-20251001-v1:0","jp.anthropic.claude-haiku-4-5-20251001-v1:0","openrouter/anthropic/claude-haiku-4.5","perplexity/anthropic/claude-haiku-4-5","publishers/anthropic/models/claude-haiku-4-5","publishers/google/models/claude-haiku-4-5","replicate/anthropic/claude-4.5-haiku","snowflake/claude-haiku-4-5","us.anthropic.claude-haiku-4-5-20251001-v1:0","vercel_ai_gateway/anthropic/claude-haiku-4.5","vertex_ai/claude-haiku-4-5","vertex_ai/claude-haiku-4-5@20251001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-haiku","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1,"max_input_per_1m":1.2,"min_output_per_1m":5,"max_output_per_1m":6,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":1.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","replicate","vercel_ai_gateway"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-2-5-pro","name":"gemini-2-5-pro","display_name":"Gemini 2.5 Pro","description":"Google's most capable thinking model in the Gemini 2.5 family, excelling at complex reasoning, coding, and multimodal tasks with leading benchmark performance.","creator":"google","family":"gemini","tier":"pro","version":"2-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["audio","text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-06-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["databricks/databricks-gemini-2-5-pro","deepinfra/google/gemini-2.5-pro","gemini-2-5-pro","gemini-2-5-pro-03-25","gemini-2-5-pro-05-06","gemini-2-5-pro-dec-2025","gemini-2.5-pro","gemini/gemini-2.5-pro","github_copilot/gemini-2.5-pro","google-gemini-2-5-pro","google/gemini-2.5-pro","oci/google.gemini-2.5-pro","openrouter/google/gemini-2.5-pro","perplexity/google/gemini-2.5-pro","publishers/google/models/gemini-2.5-pro","vercel_ai_gateway/google/gemini-2.5-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-2-5-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.24999,"max_input_per_1m":1.25,"min_output_per_1m":9.99999,"max_output_per_1m":10,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":0.125,"min_reasoning_per_1m":10,"cheapest_providers":["databricks"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"xai-grok-4-20-non-reasoning","name":"grok-4-20-non-reasoning","display_name":"Grok 4.20 Non-Reasoning","description":"The non-reasoning variant of xAI's Grok 4.20 flagship LLM, optimized for fast agentic tool calling and low hallucination rates without chain-of-thought overhead.","creator":"xai","family":"grok","tier":"","version":"4-20","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":2000000,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2026-03-09","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["grok-4-20-0309-non-reasoning","grok-4-20-non-reasoning","grok-4.20-0309-non-reasoning","grok-4.20-non-reasoning","publishers/google/models/grok-4.20-non-reasoning","vertex_ai/xai/grok-4.20-non-reasoning","xai-grok-4-20-non-reasoning","xai/grok-4.20-beta-0309-non-reasoning","xai/grok-4.20-non-reasoning","xai/grok-4.20-non-reasoning-beta"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"xai-grok-4-20-non-reasoning","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":2,"min_output_per_1m":2.5,"max_output_per_1m":6,"min_cache_read_per_1m":0.2,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["vercel_ai_gateway","xai"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-2-5-flash-preview","name":"gemini-2-5-flash-preview","display_name":"Gemini 2.5 Flash Preview","description":"A preview release of Gemini 2.5 Flash, offering early access to its fast reasoning and multimodal capabilities before stable release.","creator":"google","family":"gemini","tier":"flash","version":"2-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65535,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":false,"url_context":true,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["gemini-2-5-flash-preview-09-2025","gemini-2-5-flash-preview-09-2025-reasoning","gemini-2.5-flash-preview-09-2025","gemini/gemini-2.5-flash-preview-09-2025","google-gemini-2-5-flash-preview","publishers/google/models/gemini-2.5-flash-preview-09-2025"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-2-5-flash-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.3,"max_input_per_1m":0.3,"min_output_per_1m":2.5,"max_output_per_1m":2.5,"min_cache_read_per_1m":0.075,"min_cache_write_per_1m":null,"min_reasoning_per_1m":2.5,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-coder-480b-a35b-instruct","name":"qwen3-coder-480b-a35b-instruct","display_name":"Qwen3 Coder 480B A35B Instruct","description":"Qwen3's flagship agentic code model with 480B total and 35B activated parameters, excelling at autonomous programming, tool calling, and browser-use tasks.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":480,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["accounts/fireworks/models/qwen3-coder-480b-a35b-instruct","alibaba-qwen3-coder-480b-a35b-instruct","deepinfra/Qwen/Qwen3-Coder-480B-A35B-Instruct","fireworks_ai/accounts/fireworks/models/qwen3-coder-480b-a35b-instruct","novita/qwen/qwen3-coder-480b-a35b-instruct","qwen/qwen3-coder-480b-a35b-instruct","Qwen/Qwen3-Coder-480B-A35B-Instruct","qwen3-coder-480b-a35b-instruct","wandb/Qwen/Qwen3-Coder-480B-A35B-Instruct"],"hf_likes":1325,"hf_downloads":57687,"hf_downloads_all_time":885858,"hf_trending_score":0.5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-coder-480b-a35b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.22,"max_input_per_1m":100,"min_output_per_1m":1.3,"max_output_per_1m":150,"min_cache_read_per_1m":null,"min_cache_write_per_1m":0.022,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-oss-20b","name":"gpt-oss-20b","display_name":"GPT OSS 20B","description":"A 20-billion-parameter open-weights GPT model from OpenAI suited for reasoning and tool-use tasks at a smaller, more efficient scale.","creator":"openai","family":"gpt_oss","tier":"","version":null,"type":"language","size_in_bn":20,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":16,"ids":["@cf/openai/gpt-oss-20b","accounts/fireworks/models/gpt-oss-20b","bedrock_mantle/openai.gpt-oss-20b","databricks/databricks-gpt-oss-20b","deepinfra/openai/gpt-oss-20b","fireworks_ai/accounts/fireworks/models/gpt-oss-20b","gpt-oss-20b","gpt-oss-20b-low","gpt-oss-20b-maas","groq/openai/gpt-oss-20b","lemonade/gpt-oss-20b-mxfp4-GGUF","novita/openai/gpt-oss-20b","ollama/gpt-oss:20b-cloud","openai-gpt-oss-20b","openai-reasoning-gpt-oss-20b","openai.gpt-oss-20b-1:0","openai/gpt-oss-20b","openai/gpt-oss-20b:free","openrouter/openai/gpt-oss-20b","ovhcloud/gpt-oss-20b","publishers/google/models/gpt-oss-20b-maas","replicateopenai/gpt-oss-20b","together_ai/openai/gpt-oss-20b","vertex_ai/openai/gpt-oss-20b-maas","wandb/openai/gpt-oss-20b"],"hf_likes":4552,"hf_downloads":6455272,"hf_downloads_all_time":59707566,"hf_trending_score":12,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-oss-20b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.029,"max_input_per_1m":5,"min_output_per_1m":0.14,"max_output_per_1m":20,"min_cache_read_per_1m":0.0375,"min_cache_write_per_1m":0.007,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":16},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-next-80b-a3b-instruct","name":"qwen3-next-80b-a3b-instruct","display_name":"Qwen3 Next 80B A3B Instruct","description":"An instruction-tuned Qwen3 Next MoE model with 80B total and 3B activated parameters, optimized for text generation and conversational tasks.","creator":"alibaba","family":"qwen3_next","tier":"","version":null,"type":"language","size_in_bn":80,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-09-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["accounts/fireworks/models/qwen3-next-80b-a3b-instruct","alibaba-qwen3-next-80b-a3b-instruct","alibaba/qwen3-next-80b-a3b-instruct","dashscope/qwen3-next-80b-a3b-instruct","deepinfra/Qwen/Qwen3-Next-80B-A3B-Instruct","fireworks_ai/accounts/fireworks/models/qwen3-next-80b-a3b-instruct","huggingface-reasoning-qwen3-next-80b-a3b-instruct","novita/qwen/qwen3-next-80b-a3b-instruct","qwen/qwen3-next-80b-a3b-instruct","Qwen/Qwen3-Next-80B-A3B-Instruct","qwen/qwen3-next-80b-a3b-instruct:free","qwen3-next-80b-a3b-instruct","together_ai/Qwen/Qwen3-Next-80B-A3B-Instruct"],"hf_likes":1012,"hf_downloads":292470,"hf_downloads_all_time":14864763,"hf_trending_score":4,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-next-80b-a3b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.09,"max_input_per_1m":0.9,"min_output_per_1m":0.9,"max_output_per_1m":1.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-medium-3","name":"mistral-medium-3","display_name":"Mistral Medium 3","description":"Mistral AI's third-generation medium-tier enterprise model balancing frontier reasoning capabilities with significantly lower operational cost.","creator":"mistral","family":"mistral","tier":"","version":"3","type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":8191,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-05-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["mistral-medium-3","mistralai/mistral-medium-3","publishers/google/models/mistral-medium-3","vertex_ai/mistral-medium-3","vertex_ai/mistral-medium-3@001","vertex_ai/mistralai/mistral-medium-3","vertex_ai/mistralai/mistral-medium-3@001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-medium-3","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.4,"max_input_per_1m":1.5,"min_output_per_1m":2,"max_output_per_1m":7.5,"min_cache_read_per_1m":0.04,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_vertex_ai","openrouter"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-3-5-haiku","name":"claude-3-5-haiku","display_name":"Claude Haiku 3.5","description":"A fast, compact Claude model balancing speed and capability with support for vision, file input, and tool use.","creator":"anthropic","family":"claude","tier":"haiku","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-11-04","earliest_deprecation_date":"2026-06","deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-3-5-haiku","anthropic.claude-3-5-haiku-20241022-v1:0","anthropic/claude-3.5-haiku","bedrock/us.anthropic.claude-3-5-haiku-20241022-v1:0","claude-3-5-haiku","eu.anthropic.claude-3-5-haiku-20241022-v1:0","gradient_ai/anthropic-claude-3.5-haiku","heroku/claude-3-5-haiku","replicate/anthropic/claude-3.5-haiku","us.anthropic.claude-3-5-haiku-20241022-v1:0","vercel_ai_gateway/anthropic/claude-3.5-haiku","vertex_ai/claude-3-5-haiku","vertex_ai/claude-3-5-haiku@20241022"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-3-5-haiku","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.8,"max_input_per_1m":1,"min_output_per_1m":4,"max_output_per_1m":5,"min_cache_read_per_1m":0.08,"min_cache_write_per_1m":1,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","gradient_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-4-maverick","name":"llama-4-maverick","display_name":"Llama 4 Maverick","description":"Meta's Llama 4 Maverick MoE LLM with 128 experts and 17B active parameters, delivering high-capacity multimodal language and vision understanding.","creator":"meta","family":"llama4","tier":"","version":"4","type":"language","size_in_bn":401.584,"modalities":{"input":["image","text"],"output":["text"]},"context_window":1048576,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-08-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama4","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["databricks/databricks-llama-4-maverick","llama-4-maverick","meta-llama-4-maverick","meta-llama/llama-4-maverick","meta/llama-4-maverick","snowflake/llama4-maverick","vercel_ai_gateway/meta/llama-4-maverick"],"hf_likes":478,"hf_downloads":30421,"hf_downloads_all_time":554732,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-4-maverick","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":0.50001,"min_output_per_1m":0.485,"max_output_per_1m":1.50003,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-2-5-flash","name":"gemini-2-5-flash","display_name":"Gemini 2.5 Flash","description":"A fast, cost-efficient Gemini 2.5 thinking model with strong reasoning, vision, and tool-use capabilities designed for high-throughput applications.","creator":"google","family":"gemini","tier":"flash","version":"2-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["audio","text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-06-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["databricks/databricks-gemini-2-5-flash","deepinfra/google/gemini-2.5-flash","gemini-2-5-flash","gemini-2-5-flash-04-2025","gemini-2-5-flash-dec-2025","gemini-2-5-flash-reasoning","gemini-2-5-flash-reasoning-04-2025","gemini-2.5-flash","gemini/gemini-2.5-flash","google_gemini-2-5-flash","google-gemini-2-5-flash","google/gemini-2.5-flash","oci/google.gemini-2.5-flash","openrouter/google/gemini-2.5-flash","perplexity/google/gemini-2.5-flash","publishers/google/models/gemini-2.5-flash","replicate/google/gemini-2.5-flash","vercel_ai_gateway/google/gemini-2.5-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-2-5-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":2.5,"min_output_per_1m":0.6,"max_output_per_1m":3,"min_cache_read_per_1m":0.03,"min_cache_write_per_1m":0.03,"min_reasoning_per_1m":2.5,"cheapest_providers":["google_gemini","google_vertex_ai","oracle_oci"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-405b-instruct","name":"llama-3-1-405b-instruct","display_name":"Llama 3.1 405B Instruct","description":"Meta's 405B instruction-tuned LLM optimized for following complex instructions, with FP8 quantization for efficient large-scale inference.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":405,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":"2026-07","deprecated":false,"has_pricing":true,"provider_count":11,"ids":["accounts/fireworks/models/llama-v3p1-405b-instruct","azure_ai/Meta-Llama-3.1-405B-Instruct","databricks/databricks-meta-llama-3-1-405b-instruct","fireworks_ai/accounts/fireworks/models/llama-v3p1-405b-instruct","hyperbolic/meta-llama/Meta-Llama-3.1-405B-Instruct","lambda_ai/llama3.1-405b-instruct-fp8","llama-3-1-instruct-405b","meta-llama-3-1-405b-instruct","meta-textgeneration-llama-3-1-405b-instruct-fp8","meta.llama3-1-405b-instruct-v1:0","nebius/meta-llama/Meta-Llama-3.1-405B-Instruct","oci/meta.llama-3.1-405b-instruct","sambanova/Meta-Llama-3.1-405B-Instruct","together_ai/meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo","us.meta.llama3-1-405b-instruct-v1:0","vertex_ai/meta/llama-3.1-405b-instruct-maas"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-405b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":10.68,"min_output_per_1m":0.3,"max_output_per_1m":16,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["hyperbolic"],"provider_count":11},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-235b-a22b-instruct","name":"qwen3-235b-a22b-instruct","display_name":"Qwen3 235B A22B Instruct","description":"An instruction-tuned update of the Qwen3 235B A22B MoE model with significant improvements in instruction following, logical reasoning, and general capabilities.","creator":"alibaba","family":"qwen3_moe","tier":"","version":null,"type":"language","size_in_bn":235,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["accounts/fireworks/models/qwen3-235b-a22b-instruct-2507","alibaba-qwen3-235b-a22b-instruct","crusoe/Qwen/Qwen3-235B-A22B-Instruct-2507","deepinfra/Qwen/Qwen3-235B-A22B-Instruct-2507","fireworks_ai/accounts/fireworks/models/qwen3-235b-a22b-instruct-2507","novita/qwen/qwen3-235b-a22b-instruct-2507","qwen/qwen3-235b-a22b-instruct-2507","Qwen/Qwen3-235B-A22B-Instruct-2507","qwen3-235b-a22b-instruct","qwen3-235b-a22b-instruct-2507","replicate/qwen/qwen3-235b-a22b-instruct-2507","wandb/Qwen/Qwen3-235B-A22B-Instruct-2507"],"hf_likes":773,"hf_downloads":150781,"hf_downloads_all_time":1182969,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-235b-a22b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.09,"max_input_per_1m":10,"min_output_per_1m":0.58,"max_output_per_1m":10,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["deepinfra","huggingface","novita"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-3-5-sonnet","name":"claude-3-5-sonnet","display_name":"Claude Sonnet 3.5","description":"A mid-tier Claude model offering strong reasoning and instruction-following across text and multimodal tasks.","creator":"anthropic","family":"claude","tier":"sonnet","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":159,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-06-20","earliest_deprecation_date":"2026-07","deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-3-5-sonnet","anthropic.claude-3-5-sonnet-20240620-v1:0","anthropic.claude-3-5-sonnet-20241022-v2:0","apac.anthropic.claude-3-5-sonnet-20240620-v1:0","apac.anthropic.claude-3-5-sonnet-20241022-v2:0","bedrock/invoke/anthropic.claude-3-5-sonnet-20240620-v1:0","bedrock/us-gov-east-1/anthropic.claude-3-5-sonnet-20240620-v1:0","bedrock/us-gov-west-1/anthropic.claude-3-5-sonnet-20240620-v1:0","claude-35-sonnet","claude-35-sonnet-june-24","eu.anthropic.claude-3-5-sonnet-20240620-v1:0","eu.anthropic.claude-3-5-sonnet-20241022-v2:0","gradient_ai/anthropic-claude-3.5-sonnet","heroku/claude-3-5-sonnet-latest","openrouter/anthropic/claude-3.5-sonnet","replicate/anthropic/claude-3.5-sonnet","snowflake/claude-3-5-sonnet","us.anthropic.claude-3-5-sonnet-20240620-v1:0","vercel_ai_gateway/anthropic/claude-3-5-sonnet","vercel_ai_gateway/anthropic/claude-3-5-sonnet-20241022","vercel_ai_gateway/anthropic/claude-3.5-sonnet","vertex_ai/claude-3-5-sonnet","vertex_ai/claude-3-5-sonnet@20240620"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-3-5-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":3,"max_input_per_1m":3.75,"min_output_per_1m":15,"max_output_per_1m":18.75,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","google_vertex_ai","gradient_ai","openrouter","snowflake","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-4-scout","name":"llama-4-scout","display_name":"Llama 4 Scout","description":"Meta's Llama 4 Scout MoE LLM with 17B active parameters and 16 experts, offering efficient multimodal inference with native image and text support.","creator":"meta","family":"llama4","tier":"","version":"4","type":"language","size_in_bn":108.642,"modalities":{"input":["image","text"],"output":["text"]},"context_window":10000000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-08-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama4","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["llama-4-scout","meta-llama-4-scout","meta-llama/llama-4-scout","meta/llama-4-scout","vercel_ai_gateway/meta/llama-4-scout"],"hf_likes":1274,"hf_downloads":399353,"hf_downloads_all_time":5433902,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-4-scout","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":0.25,"min_output_per_1m":0.3,"max_output_per_1m":0.792,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-2-5-flash-lite","name":"gemini-2-5-flash-lite","display_name":"Gemini 2.5 Flash Lite","description":"A lightweight Gemini 2.5 Flash variant optimized for ultra-low latency and cost efficiency while retaining reasoning capabilities.","creator":"google","family":"gemini","tier":"flash-lite","version":"2-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-07-22","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["gemini-2-5-flash-lite","gemini-2-5-flash-lite-reasoning","gemini-2.5-flash-lite","gemini/gemini-2.5-flash-lite","google-gemini-2-5-flash-lite","google/gemini-2.5-flash-lite","oci/google.gemini-2.5-flash-lite","publishers/google/models/gemini-2.5-flash-lite"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-2-5-flash-lite","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.075,"max_input_per_1m":0.12,"min_output_per_1m":0.3,"max_output_per_1m":0.48,"min_cache_read_per_1m":0.01,"min_cache_write_per_1m":0.01,"min_reasoning_per_1m":0.4,"cheapest_providers":["oracle_oci"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-1-5-pro","name":"gemini-1-5-pro","display_name":"Gemini 1.5 Pro","description":"Google's high-capability multimodal model with a long context window, designed for complex reasoning, document analysis, and rich media understanding.","creator":"google","family":"gemini","tier":"pro","version":"1-5","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["gemini-1-5-pro","gemini-1-5-pro-may-2024","google-gemini-1-5-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-1-5-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":1.25,"min_output_per_1m":5,"max_output_per_1m":5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":0.312,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-1-5-flash-8b","name":"gemini-1-5-flash-8b","display_name":"Gemini 1.5 Flash 8B","description":"A lightweight 8B-parameter variant of Gemini 1.5 Flash, balancing speed and multimodal capability for cost-efficient deployments.","creator":"google","family":"gemini","tier":"flash","version":"1-5","type":"language","size_in_bn":8,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["gemini-1-5-flash-8b","google-gemini-1-5-flash-8b","google/gemini-1.5-flash-8b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-1-5-flash-8b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.037,"max_input_per_1m":0.037,"min_output_per_1m":0.3,"max_output_per_1m":0.3,"min_cache_read_per_1m":0.02,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"ai21-jamba-1-5-large","name":"jamba-1-5-large","display_name":"Jamba 1.5 Large","description":"The large-tier variant of AI21's Jamba 1.5 hybrid SSM-Transformer model, delivering high-quality output for complex enterprise language tasks.","creator":"ai21","family":"jamba","tier":"large","version":"1-5","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":256000,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-09-23","earliest_deprecation_date":"2026-11","deprecated":false,"has_pricing":true,"provider_count":3,"ids":["ai21-jamba-1-5-large","ai21.jamba-1-5-large-v1:0","jamba-1-5-large","jamba-1.5-large","jamba-1.5-large@001","snowflake/jamba-1.5-large","vertex_ai/jamba-1.5-large","vertex_ai/jamba-1.5-large@001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"ai21-jamba-1-5-large","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2,"min_output_per_1m":8,"max_output_per_1m":8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["ai21_labs","amazon_bedrock","google_vertex_ai"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-large","name":"mistral-large","display_name":"Mistral Large","description":"Mistral AI's flagship large language model excelling at reasoning, code generation, JSON output, and multilingual tasks.","creator":"mistral","family":"mistral","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":262144,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-11-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-02-26","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["azure_ai/mistral-large","azure_ai/mistral-large-2407","azure_ai/mistral-large-latest","azure/mistral-large-2402","azure/mistral-large-latest","bedrock/eu-west-3/mistral.mistral-large-2402-v1:0","bedrock/us-east-1/mistral.mistral-large-2402-v1:0","bedrock/us-west-2/mistral.mistral-large-2402-v1:0","mistral-large","mistral-large-2407","mistral-large-2512","mistral-large-latest","mistral.mistral-large-2402-v1:0","mistral.mistral-large-2407-v1:0","mistral/mistral-large-2402","mistral/mistral-large-2407","mistral/mistral-large-2411","mistral/mistral-large-2512","mistral/mistral-large-latest","mistralai/mistral-large","mistralai/mistral-large-2407","mistralai/mistral-large-2411","mistralai/mistral-large-2512","openrouter/mistralai/mistral-large","openrouter/mistralai/mistral-large-2512","snowflake/mistral-large","vercel_ai_gateway/mistral/mistral-large","vertex_ai/mistral-large-2411","vertex_ai/mistral-large@2407","vertex_ai/mistral-large@2411-001","vertex_ai/mistral-large@latest","watsonx/mistralai/mistral-large"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-large","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":8,"min_output_per_1m":1.5,"max_output_per_1m":24,"min_cache_read_per_1m":0.05,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-small","name":"mistral-small","display_name":"Mistral Small","description":"A compact yet capable LLM from Mistral balancing efficiency and performance across reasoning, vision, and instruction-following tasks.","creator":"mistral","family":"mistral","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":262144,"max_output_tokens":8191,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-05-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["azure_ai/mistral-small","azure_ai/mistral-small-2503","mistral-small","mistral-small-2402","mistral-small-2503","mistral-small-2603","mistral-small-latest","mistral.mistral-small-2402-v1:0","mistral/mistral-small","mistral/mistral-small-latest","mistralai/mistral-small-2603","publishers/google/models/mistral-small-2503","vercel_ai_gateway/mistral/mistral-small","vertex_ai/mistral-small-2503","vertex_ai/mistral-small-2503@001","watsonx/mistralai/mistral-small-2503"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-small","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":1,"min_output_per_1m":0.3,"max_output_per_1m":3,"min_cache_read_per_1m":0.015,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["ibm_watsonx","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-1-pro","name":"gemini-1-pro","display_name":"Gemini 1.0 Pro","description":"Google's first-generation Pro-tier multimodal model, capable of understanding text, images, and code for a broad range of reasoning tasks.","creator":"google","family":"gemini","tier":"pro","version":"1","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["gemini-1-0-pro","google-gemini-1-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-1-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":0.5,"min_output_per_1m":1.5,"max_output_per_1m":1.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"ai21-jamba-1-5-mini","name":"jamba-1-5-mini","display_name":"Jamba 1.5 Mini","description":"A compact mini-tier variant of AI21's Jamba 1.5 hybrid SSM-Transformer model, optimized for speed and cost efficiency.","creator":"ai21","family":"jamba","tier":"mini","version":"1-5","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":256000,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-09-23","earliest_deprecation_date":"2026-11","deprecated":false,"has_pricing":true,"provider_count":3,"ids":["ai21-jamba-1-5-mini","ai21.jamba-1-5-mini-v1:0","jamba-1-5-mini","jamba-1.5-mini","jamba-1.5-mini@001","snowflake/jamba-1.5-mini","vertex_ai/jamba-1.5-mini","vertex_ai/jamba-1.5-mini@001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"ai21-jamba-1-5-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":0.2,"min_output_per_1m":0.4,"max_output_per_1m":0.4,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["ai21_labs","amazon_bedrock","google_vertex_ai"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"google-chirp","name":"chirp","display_name":"Chirp","description":"Google's large-scale automatic speech recognition model supporting a wide range of languages with high transcription accuracy.","creator":"google","family":"chirp","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["google-chirp","vertex_ai/chirp"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30"},{"id":"mistral-codestral","name":"codestral","display_name":"Codestral","description":"Mistral AI's dedicated code generation model supporting fill-in-the-middle, code correction, and agentic software engineering tasks.","creator":"mistral","family":"codestral","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":256000,"max_output_tokens":8191,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["codestral-2508","codestral-latest","codestral/codestral-2405","codestral/codestral-latest","mistral-codestral","mistral/codestral","mistral/codestral-2405","mistral/codestral-2508","mistral/codestral-latest","mistralai/codestral-2508","text-completion-codestral/codestral-2405","text-completion-codestral/codestral-latest","vercel_ai_gateway/mistral/codestral","vertex_ai/codestral-2501","vertex_ai/codestral@2405","vertex_ai/codestral@latest"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-codestral","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":0.3,"min_output_per_1m":0.6,"max_output_per_1m":0.9,"min_cache_read_per_1m":0.03,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_vertex_ai"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-codestral-2","name":"codestral-2","display_name":"Codestral 2","description":"The second generation of Mistral AI's Codestral code-focused language model, designed for low-latency coding assistance.","creator":"mistral","family":"codestral","tier":"","version":"2","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["codestral-2","mistral-codestral-2","publishers/google/models/codestral-2","vertex_ai/codestral-2","vertex_ai/codestral-2@001","vertex_ai/mistralai/codestral-2","vertex_ai/mistralai/codestral-2@001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-codestral-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.3,"max_input_per_1m":0.3,"min_output_per_1m":0.9,"max_output_per_1m":0.9,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_vertex_ai"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1-528","name":"deepseek-r1-528","display_name":"DeepSeek R1 528","description":"The DeepSeek R1 0528 update, a reasoning-focused MoE LLM with improved chain-of-thought capabilities over the original R1 release.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":684.531,"modalities":{"input":["pdf","text"],"output":["text"]},"context_window":164000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-03-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-05-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["accounts/fireworks/models/deepseek-r1-0528","crusoe/deepseek-ai/DeepSeek-R1-0528","deepinfra/deepseek-ai/DeepSeek-R1-0528","deepseek-ai/DeepSeek-R1-0528","deepseek-llm-r1-0528","deepseek-r1-0528-maas","deepseek-r1-528","deepseek/deepseek-r1-0528","fireworks_ai/accounts/fireworks/models/deepseek-r1-0528","hyperbolic/deepseek-ai/DeepSeek-R1-0528","lambda_ai/deepseek-r1-0528","nebius/deepseek-ai/DeepSeek-R1-0528","novita/deepseek/deepseek-r1-0528","openrouter/deepseek/deepseek-r1-0528","publishers/google/models/deepseek-r1-0528-maas","vertex_ai/deepseek-ai/deepseek-r1-0528-maas","wandb/deepseek-ai/DeepSeek-R1-0528"],"hf_likes":2445,"hf_downloads":707890,"hf_downloads_all_time":6472632,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1-528","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":135,"min_output_per_1m":0.25,"max_output_per_1m":540,"min_cache_read_per_1m":0.35,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["lambda"],"provider_count":12},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-ocr","name":"deepseek-ocr","display_name":"DeepSeek-OCR","description":"A multimodal OCR model that compresses long document contexts via optical 2D mapping, combining a DeepEncoder with a compact MoE language model.","creator":"deepseek","family":"deepseek-ocr","tier":"","version":null,"type":"image-to-text","size_in_bn":3.336,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["deepseek-ai/DeepSeek-OCR","deepseek-ocr","deepseek-ocr-maas","deepseek/deepseek-ocr","novita/deepseek/deepseek-ocr","publishers/google/models/deepseek-ocr-maas","vertex_ai/deepseek-ai/deepseek-ocr-maas"],"hf_likes":3218,"hf_downloads":2082348,"hf_downloads_all_time":22155059,"hf_trending_score":3,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-ocr","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.03,"max_input_per_1m":0.3,"min_output_per_1m":0.03,"max_output_per_1m":1.2,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","novita"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini","name":"gemini","display_name":"Gemini","description":"Google's flagship multimodal LLM family supporting text, vision, and code across a range of capability tiers.","creator":"google","family":"gemini","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["google-gemini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.25,"max_input_per_1m":2.25,"min_output_per_1m":13.5,"max_output_per_1m":13.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":0.15,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-1-embedding","name":"gemini-1-embedding","display_name":"Gemini 1 Embedding","description":"A Gemini-based text embedding model that produces distributed vector representations for semantic search and similarity tasks.","creator":"google","family":"embed","tier":"","version":"1","type":"embedding","size_in_bn":null,"modalities":{"input":["text"],"output":["embedding"]},"context_window":2048,"max_output_tokens":128,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[3072],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-05-20","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["gemini-embedding-001","gemini/gemini-embedding-001","google-gemini-1-embedding","google/gemini-embedding-001","publishers/google/models/gemini-embedding-001","vercel_ai_gateway/google/gemini-embedding-001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-1-embedding","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":0.15,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai","vercel_ai_gateway"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-1-live-embedding","name":"gemini-1-live-embedding","display_name":"Gemini 1 Live Embedding","description":"A real-time streaming embedding variant of Gemini 1, enabling live generation of text representations for dynamic retrieval applications.","creator":"google","family":"gemini","tier":"","version":"1","type":"embedding","size_in_bn":null,"modalities":{"input":["text"],"output":["embedding"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["google-gemini-1-live-embedding"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-1-live-embedding","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":0.15,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-1-pro-live","name":"gemini-1-pro-live","display_name":"Gemini 1.0 Pro Live","description":"A real-time streaming variant of Gemini 1.0 Pro, supporting live multimodal dialogue and interaction.","creator":"google","family":"gemini","tier":"pro","version":"1","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["google-gemini-1-pro-live"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-1-pro-live","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":0.5,"min_output_per_1m":1.5,"max_output_per_1m":1.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-1-5-flash-8b-live","name":"gemini-1-5-flash-8b-live","display_name":"Gemini 1.5 Flash 8B Live","description":"A real-time streaming variant of Gemini 1.5 Flash 8B, enabling low-latency live multimodal interactions.","creator":"google","family":"gemini","tier":"flash","version":"1-5","type":"language","size_in_bn":8,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["google-gemini-1-5-flash-8b-live"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-1-5-flash-8b-live","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.037,"max_input_per_1m":0.037,"min_output_per_1m":0.3,"max_output_per_1m":0.3,"min_cache_read_per_1m":0.02,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["google_gemini","google_vertex_ai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}}],"pagination":{"page_size":50,"has_next":true,"next_token":"NTA","total_count":158},"meta":{"updated_at":"2026-06-13","request_id":"24ea6874-8d61-4edf-814a-a9cfddd223c2","execution_ms":18}}