{"data":[{"id":"anthropic-claude-4-8-opus","name":"claude-4-8-opus","display_name":"Claude Opus 4.8","description":"A flagship Anthropic LLM in the Claude Opus tier at version 4.8, supporting adaptive reasoning, vision, tool use, file input, and web search across multiple geographic regions.","creator":"anthropic","family":"claude","tier":"opus","version":"4-8","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-05-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-8-opus","anthropic.claude-opus-4-8","anthropic/claude-opus-4-8","anthropic/claude-opus-4.8","au.anthropic.claude-opus-4-8","azure_ai/claude-opus-4-8","claude-opus-4-8","eu.anthropic.claude-opus-4-8","global.anthropic.claude-opus-4-8","jp.anthropic.claude-opus-4-8","publishers/anthropic/models/claude-opus-4-8","publishers/google/models/claude-opus-4-8","us.anthropic.claude-opus-4-8","vertex_ai/claude-opus-4-8","vertex_ai/claude-opus-4-8@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-8-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-5","name":"gpt-5-5","display_name":"GPT-5.5","description":"A GPT-5 series large language model from OpenAI targeting high-capability reasoning and generation tasks at the xhigh performance tier.","creator":"openai","family":"gpt","tier":"","version":"5-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-12","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-5.5","azure/gpt-5.5-2026-04-23","bedrock_mantle/openai.gpt-5.5","gpt-5-5","gpt-5-5-high","gpt-5-5-instant-05-26","gpt-5-5-low","gpt-5-5-medium","gpt-5-5-non-reasoning","gpt-5.5","gpt-5.5-2026-04-23","openai-gpt-5-5","openai/gpt-5.5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":30,"max_output_per_1m":36,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-7-opus","name":"claude-4-7-opus","display_name":"Claude Opus 4.7","description":"Anthropic's Claude 4.7 Opus model with adaptive reasoning at maximum effort, vision, and tool-use for complex enterprise tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-7","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-04-16","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-7-opus","anthropic.claude-opus-4-7","anthropic/claude-opus-4-7","anthropic/claude-opus-4.7","au.anthropic.claude-opus-4-7","azure_ai/claude-opus-4-7","claude-opus-4-7","claude-opus-4-7-20260416","claude-opus-4-7-non-reasoning","eu.anthropic.claude-opus-4-7","global.anthropic.claude-opus-4-7","jp.anthropic.claude-opus-4-7","openrouter/anthropic/claude-opus-4.7","perplexity/anthropic/claude-opus-4-7","publishers/anthropic/models/claude-opus-4-7","publishers/google/models/claude-opus-4-7","us.anthropic.claude-opus-4-7","vertex_ai/claude-opus-4-7","vertex_ai/claude-opus-4-7@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-7-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-1-pro-preview","name":"gemini-3-1-pro-preview","display_name":"Gemini 3.1 Pro Preview","description":"A preview release of Gemini 3.1 Pro providing early access to its frontier reasoning, vision, and tool-use capabilities.","creator":"google","family":"gemini","tier":"pro","version":"3-1","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-19","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["gemini-3-1-pro-preview","gemini-3.1-pro-preview","gemini/gemini-3.1-pro-preview","google-gemini-3-1-pro-preview","google/gemini-3.1-pro-preview","openrouter/google/gemini-3.1-pro-preview","publishers/google/models/gemini-3.1-pro-preview","vertex_ai/gemini-3.1-pro-preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-1-pro-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2,"min_output_per_1m":12,"max_output_per_1m":12,"min_cache_read_per_1m":0.2,"min_cache_write_per_1m":0.375,"min_reasoning_per_1m":12,"cheapest_providers":["google_gemini","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4","name":"gpt-5-4","display_name":"GPT-5.4","description":"OpenAI's frontier reasoning model for complex professional work, supporting vision, file input, tool use, and configurable reasoning effort from none to xhigh.","creator":"openai","family":"gpt","tier":"","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure_ai/gpt-5.4","azure_ai/gpt-5.4-2026-03-05","azure/gpt-5.4","azure/gpt-5.4-2026-03-05","bedrock_mantle/openai.gpt-5.4","chatgpt/gpt-5.4","gpt-5-4","gpt-5-4-low","gpt-5-4-non-reasoning","gpt-5.4","gpt-5.4-2026-03-05","openai-gpt-5-4","openai/gpt-5.4"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.5,"max_input_per_1m":3,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.25,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-7-max","name":"qwen3-7-max","display_name":"Qwen3.7 Max","description":"A Mixture-of-Experts Qwen3 variant tuned for maximum capability, combining reasoning, vision, and multilingual performance in a high-throughput configuration.","creator":"alibaba","family":"qwen","tier":"max","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-05-21","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["alibaba-qwen3-7-max","alibaba/qwen3.7-max","qwen/qwen3.7-max","Qwen/Qwen3.7-Max","qwen3-7-max"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-7-max","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":1.25,"min_output_per_1m":3.75,"max_output_per_1m":3.75,"min_cache_read_per_1m":0.25,"min_cache_write_per_1m":1.5625,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-5-flash","name":"gemini-3-5-flash","display_name":"Gemini 3.5 Flash","description":"A fast, efficient Gemini 3.5 model optimized for high-throughput tasks with support for reasoning, vision, tool use, and web search.","creator":"google","family":"gemini","tier":"flash","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-05-19","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["gemini-3-5-flash","gemini-3-5-flash-medium","gemini-3-5-flash-minimal","gemini-3.5-flash","gemini/gemini-3.5-flash","google-gemini-3-5-flash","google/gemini-3.5-flash","publishers/google/models/gemini-3.5-flash","vertex_ai/gemini-3.5-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-5-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.5,"max_input_per_1m":1.8,"min_output_per_1m":9,"max_output_per_1m":10.8,"min_cache_read_per_1m":0.15,"min_cache_write_per_1m":0.0833333333,"min_reasoning_per_1m":9,"cheapest_providers":["google_gemini","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"minimax-m3","name":"minimax-m3","display_name":"MiniMax M3","description":"A multimodal foundation model supporting text, image, and video inputs with a 1M-token context window, designed for long-horizon agentic tasks, coding, and reasoning.","creator":"minimax","family":"m3","tier":"","version":null,"type":"language","size_in_bn":427.04,"modalities":{"input":["image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":512000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-05-31","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/minimax-m3","minimax-m3","minimax/minimax-m3","minimax/MiniMax-M3"],"hf_likes":320,"hf_downloads":442,"hf_downloads_all_time":442,"hf_trending_score":314,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"minimax-m3","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.3,"max_input_per_1m":0.6,"min_output_per_1m":1.2,"max_output_per_1m":2.4,"min_cache_read_per_1m":0.06,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"moonshot-kimi-k2-6","name":"kimi-k2-6","display_name":"Kimi K2.6","description":"An open-source native multimodal agentic LLM specializing in long-horizon coding, coding-driven design, autonomous execution, and swarm-based task orchestration.","creator":"moonshot","family":"kimi_k25","tier":"","version":"k2-6","type":"language","size_in_bn":1058.589,"modalities":{"input":["image","pdf","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":262142,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-20","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/kimi-k2p6","azure_ai/kimi-k2.6","kimi-k2-6","kimi-k2-6-non-reasoning","moonshot-kimi-k2-6","moonshot/kimi-k2.6","moonshotai/kimi-k2.6","moonshotai/Kimi-K2.6","moonshotai/kimi-k2.6:free"],"hf_likes":568,"hf_downloads":8241,"hf_downloads_all_time":8241,"hf_trending_score":560,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"moonshot-kimi-k2-6","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.68,"max_input_per_1m":1.2,"min_output_per_1m":3.4,"max_output_per_1m":4.5,"min_cache_read_per_1m":0.16,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"xiaomi-mimo-2-5-pro","name":"mimo-2-5-pro","display_name":"MiMo V2.5 Pro","description":"Xiaomi's flagship omnimodal LLM excelling in general agentic tasks, complex software engineering, and long-horizon reasoning benchmarks.","creator":"xiaomi","family":"mimo","tier":"","version":"2-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-22","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["mimo-v2-5-pro","mimo-v2-5-pro-non-reasoning","openrouter/xiaomi/mimo-v2.5-pro","xiaomi-mimo-2-5-pro","xiaomi/mimo-v2.5-pro","xiaomimimo/mimo-v2.5-pro","XiaomiMiMo/MiMo-V2.5-Pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"xiaomi-mimo-2-5-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.435,"max_input_per_1m":0.435,"min_output_per_1m":0.87,"max_output_per_1m":0.87,"min_cache_read_per_1m":0.0036,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-3-codex","name":"gpt-5-3-codex","display_name":"GPT-5.3 Codex","description":"A GPT-5.3 variant optimized for agentic coding tasks in Codex environments, supporting multiple reasoning effort levels from low to xhigh.","creator":"openai","family":"gpt","tier":"","version":"5-3","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/gpt-5.3-codex","chatgpt/gpt-5.3-codex","github_copilot/gpt-5.3-codex","gpt-5-3-codex","gpt-5.3-codex","openai-gpt-5-3-codex","openai/gpt-5.3-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-3-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.75,"max_input_per_1m":1.75,"min_output_per_1m":14,"max_output_per_1m":14,"min_cache_read_per_1m":0.175,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-7-plus","name":"qwen3-7-plus","display_name":"Qwen3.7 Plus","description":"A cost-effective Qwen3.7-series LLM with strong vision-language, reasoning, and tool-use capabilities, optimized for balanced performance and efficiency.","creator":"alibaba","family":"qwen","tier":"plus","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-06-03","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/qwen3p7-plus","alibaba-qwen3-7-plus","alibaba/qwen3.7-plus","qwen/qwen3.7-plus","qwen3-7-plus"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-7-plus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.32,"max_input_per_1m":0.4,"min_output_per_1m":1.28,"max_output_per_1m":1.6,"min_cache_read_per_1m":0.064,"min_cache_write_per_1m":0.4,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"xai-grok-4-3","name":"grok-4-3","display_name":"Grok 4.3","description":"A multimodal reasoning LLM from xAI that accepts text and image inputs, designed for agentic workflows, instruction-following, and tool-use tasks requiring high factual accuracy.","creator":"xai","family":"grok","tier":"","version":"4-3","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Grok","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-30","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["grok-4-3","grok-4-3-low","grok-4-3-medium","grok-4-3-non-reasoning","grok-4.3","publishers/google/models/grok-4.3","x-ai/grok-4.3","xai-grok-4-3","xai/grok-4.3","xai/grok-4.3-latest"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"xai-grok-4-3","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":1.5,"min_output_per_1m":2.5,"max_output_per_1m":3,"min_cache_read_per_1m":0.2,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway","xai"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-6-max-preview","name":"qwen3-6-max-preview","display_name":"Qwen3.6 Max Preview","description":"A large-scale reasoning and vision-capable LLM with enhanced vibe coding abilities, more efficient coding agent execution, and improved front-end development performance.","creator":"alibaba","family":"qwen","tier":"max","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["alibaba-qwen3-6-max-preview","alibaba/qwen-3.6-max-preview","qwen/qwen3.6-max-preview","qwen3-6-max"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-6-max-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.04,"max_input_per_1m":1.3,"min_output_per_1m":6.24,"max_output_per_1m":7.8,"min_cache_read_per_1m":0.26,"min_cache_write_per_1m":1.3,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v4-pro","name":"deepseek-v4-pro","display_name":"DeepSeek V4 Pro","description":"A large-scale Mixture-of-Experts LLM from DeepSeek with 1.6T total and 49B activated parameters, supporting a 1M-token context window for advanced reasoning and tool-use tasks.","creator":"deepseek","family":"v4","tier":"pro","version":null,"type":"language","size_in_bn":861.608,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1048576,"max_output_tokens":384000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/deepseek-v4-pro","deepseek-ai/DeepSeek-V4-Pro","deepseek-v4-pro","deepseek-v4-pro-high","deepseek-v4-pro-non-reasoning","deepseek/deepseek-v4-pro"],"hf_likes":2540,"hf_downloads":78864,"hf_downloads_all_time":78864,"hf_trending_score":2449,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v4-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.435,"max_input_per_1m":1.74,"min_output_per_1m":0.87,"max_output_per_1m":3.48,"min_cache_read_per_1m":0.0036,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["deepseek","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-5-1","name":"glm-5-1","display_name":"GLM-5.1","description":"Z AI's next-generation flagship agentic LLM with significantly stronger coding capabilities, vision support, and file input, achieving top performance on SWE-Bench.","creator":"zhipu","family":"glm_moe_dsa","tier":"","version":"5-1","type":"language","size_in_bn":753.864,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":202800,"max_output_tokens":64000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/glm-5p1","fireworks_ai/accounts/fireworks/models/glm-5p1","fireworks_ai/glm-5p1","glm-5-1","glm-5-1-non-reasoning","huggingface-llm-glm-5-1-fp8","z-ai/glm-5.1","zai-org/glm-5.1","zai-org/GLM-5.1","zai/glm-5.1","zhipu-glm-5-1"],"hf_likes":1449,"hf_downloads":147738,"hf_downloads_all_time":147738,"hf_trending_score":214,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-5-1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.98,"max_input_per_1m":1.4,"min_output_per_1m":3.08,"max_output_per_1m":4.4,"min_cache_read_per_1m":0.182,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-2","name":"gpt-5-2","display_name":"GPT-5.2","description":"A frontier GPT-5 generation LLM for complex professional work with configurable reasoning effort, available via the Responses API.","creator":"openai","family":"gpt","tier":"","version":"5-2","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-5.2","azure/gpt-5.2-2025-12-11","chatgpt/gpt-5.2","github_copilot/gpt-5.2","gmi/openai/gpt-5.2","gpt-5-2","gpt-5-2-medium","gpt-5-2-non-reasoning","gpt-5.2","gpt-5.2-2025-12-11","openai-gpt-5-2","openai/gpt-5.2","openrouter/openai/gpt-5.2","perplexity/openai/gpt-5.2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.75,"max_input_per_1m":2.1,"min_output_per_1m":14,"max_output_per_1m":16.8,"min_cache_read_per_1m":0.175,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","gmi","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-6-plus","name":"qwen3-6-plus","display_name":"Qwen3.6 Plus","description":"A Plus-tier Qwen3.6 closed model with reasoning, tool use, and vision capabilities, available exclusively through select infrastructure partners.","creator":"alibaba","family":"qwen","tier":"plus","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text","video"],"output":["text"]},"context_window":1000000,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-02","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/qwen3p6-plus","alibaba-qwen3-6-plus","alibaba/qwen3.6-plus","openrouter/qwen/qwen3.6-plus","qwen/qwen3.6-plus","qwen3-6-plus"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-6-plus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.325,"max_input_per_1m":0.5,"min_output_per_1m":1.95,"max_output_per_1m":3,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":0.40625,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-5","name":"glm-5","display_name":"GLM-5","description":"An open-source MoE LLM from Z AI designed for long-context reasoning, multi-step tool orchestration, and complex agentic engineering tasks.","creator":"zhipu","family":"glm_moe_dsa","tier":"","version":"5","type":"language","size_in_bn":753.864,"modalities":{"input":["pdf","text"],"output":["text"]},"context_window":202800,"max_output_tokens":131100,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["accounts/fireworks/models/glm-5","baseten/zai-org/GLM-5","bedrock/us-east-1/zai.glm-5","bedrock/us-west-2/zai.glm-5","glm-5","glm-5-maas","glm-5-non-reasoning","openrouter/z-ai/glm-5","publishers/google/models/glm-5-maas","vertex_ai/zai-org/glm-5-maas","z-ai/glm-5","zai-org/glm-5","zai-org/GLM-5","zai.glm-5","zai/glm-5","zhipu-glm-5"],"hf_likes":2070,"hf_downloads":477667,"hf_downloads_all_time":777726,"hf_trending_score":5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.573,"max_input_per_1m":1,"min_output_per_1m":1.92,"max_output_per_1m":3.2,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":0.1,"min_reasoning_per_1m":null,"cheapest_providers":["alibaba_qwen"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"minimax-m2-7","name":"minimax-m2-7","display_name":"MiniMax M2.7","description":"MiniMax's M2.7 MoE language model with vision support and advanced agent capabilities, designed for complex multi-step productivity tasks and dynamic tool use.","creator":"minimax","family":"minimax_m2","tier":"","version":"7","type":"language","size_in_bn":228.704,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":204800,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-18","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/minimax-m2p7","huggingface-llm-minimax-m2-7","minimax-m2-7","minimax/minimax-m2.7","MiniMaxAI/MiniMax-M2.7","sambanova/MiniMax-M2.7"],"hf_likes":1015,"hf_downloads":358255,"hf_downloads_all_time":358255,"hf_trending_score":295,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"minimax-m2-7","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.25,"max_input_per_1m":0.3,"min_output_per_1m":1,"max_output_per_1m":1.2,"min_cache_read_per_1m":0.05,"min_cache_write_per_1m":0.375,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-2-codex","name":"gpt-5-2-codex","display_name":"GPT-5.2 Codex","description":"A GPT-5.2 variant optimized for agentic coding in Codex environments, supporting low through xhigh reasoning effort settings.","creator":"openai","family":"gpt","tier":"","version":"5-2","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-01-14","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/gpt-5.2-codex","chatgpt/gpt-5.2-codex","gpt-5-2-codex","gpt-5.2-codex","openai-gpt-5-2-codex","openai/gpt-5.2-codex","openrouter/openai/gpt-5.2-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-2-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.75,"max_input_per_1m":1.75,"min_output_per_1m":14,"max_output_per_1m":14,"min_cache_read_per_1m":0.175,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4-mini","name":"gpt-5-4-mini","display_name":"GPT-5.4 Mini","description":"A faster, cost-efficient variant of GPT-5.4 designed for high-volume workloads while retaining strong reasoning, vision, and tool-use capabilities.","creator":"openai","family":"gpt","tier":"mini","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure_ai/gpt-5.4-mini","azure_ai/gpt-5.4-mini-2026-03-17","azure/gpt-5.4-mini","azure/gpt-5.4-mini-2026-03-17","gpt-5-4-mini","gpt-5-4-mini-medium","gpt-5-4-mini-non-reasoning","gpt-5.4-mini","gpt-5.4-mini-2026-03-17","openai-gpt-5-4-mini","openai/gpt-5.4-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.75,"max_input_per_1m":0.9,"min_output_per_1m":4.5,"max_output_per_1m":5.4,"min_cache_read_per_1m":0.075,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"nvidia-nemotron-3-ultra-550b-a55b","name":"nemotron-3-ultra-550b-a55b","display_name":"Nemotron 3 Ultra 550B A55B","description":"A 550B-parameter mixture-of-experts Nemotron model with 55B active parameters, built for frontier-scale reasoning, tool use, and agentic tasks.","creator":"nvidia","family":"nemotron","tier":"ultra","version":"3","type":"language","size_in_bn":550,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-06-04","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["huggingface-reasoning-nvidia-nemotron-3-ultra-550b-a55b-nvfp4","nvidia-nemotron-3-ultra-550b-a55b","nvidia/nemotron-3-ultra-550b-a55b","nvidia/nemotron-3-ultra-550b-a55b:free","nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B","nvidia/NVIDIA-Nemotron-3-Ultra-550B-A55B-BF16"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"nvidia-nemotron-3-ultra-550b-a55b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":0.6,"min_output_per_1m":2.4,"max_output_per_1m":3.6,"min_cache_read_per_1m":0.12,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"moonshot-kimi-k2-5","name":"kimi-k2-5","display_name":"Kimi K2.5","description":"An updated iteration of Kimi K2 with enhanced reasoning, vision, and tool-use capabilities, supporting implicit caching for efficient inference.","creator":"moonshot","family":"kimi_k25","tier":"","version":"k2-5","type":"language","size_in_bn":1058.589,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":98304,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-01-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["@cf/moonshotai/kimi-k2.5","accounts/fireworks/models/kimi-k2p5","azure_ai/kimi-k2.5","baseten/moonshotai/Kimi-K2.5","bedrock/ap-northeast-1/moonshotai.kimi-k2.5","bedrock/ap-south-1/moonshotai.kimi-k2.5","bedrock/ap-southeast-3/moonshotai.kimi-k2.5","bedrock/eu-north-1/moonshotai.kimi-k2.5","bedrock/moonshotai.kimi-k2.5","bedrock/sa-east-1/moonshotai.kimi-k2.5","bedrock/us-east-1/moonshotai.kimi-k2.5","bedrock/us-east-2/moonshotai.kimi-k2.5","bedrock/us-west-2/moonshotai.kimi-k2.5","fireworks_ai/accounts/fireworks/models/kimi-k2p5","fireworks_ai/kimi-k2p5","huggingface-llm-kimi-k2-5","kimi-k2-5","kimi-k2-5-non-reasoning","kimi-k2.5","moonshot-kimi-k2-5","moonshot/kimi-k2.5","moonshotai.kimi-k2.5","moonshotai/kimi-k2.5","moonshotai/Kimi-K2.5","openrouter/moonshotai/kimi-k2.5","together_ai/moonshotai/Kimi-K2.5","wandb/moonshotai/Kimi-K2.5"],"hf_likes":2753,"hf_downloads":5222216,"hf_downloads_all_time":9851195,"hf_trending_score":34,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"moonshot-kimi-k2-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.375,"max_input_per_1m":0.6,"min_output_per_1m":2.025,"max_output_per_1m":3.011,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":12},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-5-turbo","name":"glm-5-turbo","display_name":"GLM-5 Turbo","description":"A fast-inference variant of Z AI's GLM-5 model, deeply optimized for real-world agent workflows and OpenClaw-style agentic scenarios.","creator":"zhipu","family":"glm","tier":"","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":131100,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2026-03-15","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["glm-5-turbo","z-ai/glm-5-turbo","zai-org/glm-5-turbo","zai/glm-5-turbo","zhipu-glm-5-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-5-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.2,"max_input_per_1m":1.2,"min_output_per_1m":4,"max_output_per_1m":4,"min_cache_read_per_1m":0.24,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-opus","name":"claude-4-6-opus","display_name":"Claude Opus 4.6","description":"Anthropic's high-capability Claude 4.6 Opus model with advanced reasoning, vision, and tool-use for demanding workloads.","creator":"anthropic","family":"claude","tier":"opus","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-05","earliest_deprecation_date":"2026-06-29","deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-opus","anthropic.claude-opus-4-6-v1","anthropic/claude-opus-4.6","anthropic/claude-opus-4.6-fast","au.anthropic.claude-opus-4-6-v1","azure_ai/claude-opus-4-6","claude-opus-4-6","claude-opus-4-6-20260205","claude-opus-4-6-adaptive","eu.anthropic.claude-opus-4-6-v1","github_copilot/claude-opus-4.6-fast","global.anthropic.claude-opus-4-6-v1","openrouter/anthropic/claude-opus-4.6","perplexity/anthropic/claude-opus-4-6","publishers/anthropic/models/claude-opus-4-6","publishers/google/models/claude-opus-4-6","us.anthropic.claude-opus-4-6-v1","vercel_ai_gateway/anthropic/claude-opus-4.6","vertex_ai/claude-opus-4-6","vertex_ai/claude-opus-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":30,"min_output_per_1m":25,"max_output_per_1m":150,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v4-flash","name":"deepseek-v4-flash","display_name":"DeepSeek V4 Flash","description":"An efficiency-optimized Mixture-of-Experts LLM from DeepSeek with 284B total and 13B activated parameters, supporting a 1M-token context window with reasoning and tool-use capabilities.","creator":"deepseek","family":"v4","tier":"flash","version":null,"type":"language","size_in_bn":158.069,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1048576,"max_output_tokens":384000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/deepseek-v4-flash","deepseek-ai/DeepSeek-V4-Flash","deepseek-v4-flash","deepseek-v4-flash-high","deepseek-v4-flash-non-reasoning","deepseek-v4-flash(1)","deepseek-v4-flash*","deepseek/deepseek-v4-flash","deepseek/deepseek-v4-flash:free"],"hf_likes":649,"hf_downloads":25391,"hf_downloads_all_time":25391,"hf_trending_score":639,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v4-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.098,"max_input_per_1m":0.14,"min_output_per_1m":0.196,"max_output_per_1m":0.28,"min_cache_read_per_1m":0.0028,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-6-27b","name":"qwen3-6-27b","display_name":"Qwen3.6 27B","description":"A dense vision-language model in the Qwen3 series with 27B parameters, offering improvements in agentic coding, STEM reasoning, and multimodal inference over its predecessor.","creator":"alibaba","family":"qwen","tier":"","version":null,"type":"language","size_in_bn":27,"modalities":{"input":["image","pdf","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":262140,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen3","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/qwen3p6-27b","alibaba-qwen3-6-27b","alibaba/qwen3.6-27b","huggingface-vlm-qwen3-6-27b","qwen/qwen3.6-27b","Qwen/Qwen3.6-27B","qwen3-6-27b","qwen3-6-27b-non-reasoning"],"hf_likes":1262,"hf_downloads":2772193,"hf_downloads_all_time":2772193,"hf_trending_score":117,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-6-27b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2885,"max_input_per_1m":0.6,"min_output_per_1m":3.17,"max_output_per_1m":3.6,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5","name":"gpt-5","display_name":"GPT-5","description":"OpenAI's frontier LLM with integrated reasoning, vision, image generation, and tool-use capabilities designed for complex coding and agentic tasks.","creator":"openai","family":"gpt","tier":"","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["azure/eu/gpt-5-2025-08-07","azure/gpt-5","azure/gpt-5-2025-08-07","azure/us/gpt-5-2025-08-07","databricks/databricks-gpt-5","github_copilot/gpt-5","gmi/openai/gpt-5","gpt-5","gpt-5-2025-08-07","gpt-5-chatgpt","gpt-5-low","gpt-5-medium","gpt-5-minimal","oci/openai.gpt-5","openai-gpt-5","openai/gpt-5","openrouter/openai/gpt-5","replicate/openai/gpt-5","snowflake/openai-gpt-5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.24999,"max_input_per_1m":1.5,"min_output_per_1m":9.99999,"max_output_per_1m":12,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-codex","name":"gpt-5-codex","display_name":"GPT-5 Codex","description":"A GPT-5 variant optimized for agentic coding tasks in Codex environments, available via the Responses API with regularly updated snapshots.","creator":"openai","family":"gpt","tier":"","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/gpt-5-codex","gpt-5-codex","openai-gpt-5-codex","openai/gpt-5-codex","openrouter/openai/gpt-5-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.125,"max_input_per_1m":1.25,"min_output_per_1m":10,"max_output_per_1m":10,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-sonnet","name":"claude-4-6-sonnet","display_name":"Claude Sonnet 4.6","description":"A capable Claude 4.6 Sonnet model with reasoning, vision, and tool-use support for a wide range of applications.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-sonnet","anthropic.claude-sonnet-4-6","anthropic/claude-sonnet-4-6","anthropic/claude-sonnet-4.6","au.anthropic.claude-sonnet-4-6","azure_ai/claude-sonnet-4-6","claude-sonnet-4-6","claude-sonnet-4-6-adaptive","claude-sonnet-4-6-non-reasoning-low-effort","eu.anthropic.claude-sonnet-4-6","global.anthropic.claude-sonnet-4-6","jp.anthropic.claude-sonnet-4-6","openrouter/anthropic/claude-sonnet-4.6","publishers/anthropic/models/claude-sonnet-4-6","publishers/google/models/claude-sonnet-4-6","snowflake/claude-sonnet-4-6","us.anthropic.claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":3,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4-nano","name":"gpt-5-4-nano","display_name":"GPT-5.4 Nano","description":"The smallest and fastest GPT-5.4 tier, optimized for speed- and cost-sensitive tasks such as classification, data extraction, ranking, and sub-agent orchestration.","creator":"openai","family":"gpt","tier":"nano","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure_ai/gpt-5.4-nano","azure_ai/gpt-5.4-nano-2026-03-17","azure/gpt-5.4-nano","azure/gpt-5.4-nano-2026-03-17","gpt-5-4-nano","gpt-5-4-nano-medium","gpt-5-4-nano-non-reasoning","gpt-5.4-nano","gpt-5.4-nano-2026-03-17","openai-gpt-5-4-nano","openai/gpt-5.4-nano"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4-nano","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":0.24,"min_output_per_1m":1.25,"max_output_per_1m":1.5,"min_cache_read_per_1m":0.02,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"kwaipilot-kat-2-pro-coder","name":"kat-2-pro-coder","display_name":"KwaiPilot KAT 2 Pro Coder","description":"A high-performance agentic coding LLM from KwaiKAT's KAT series, targeting complex enterprise-grade software engineering and SaaS integration with implicit caching support.","creator":"kwaipilot","family":"kat","tier":"pro","version":"2","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":256000,"max_output_tokens":80000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["kat-coder-pro-v2","kwaipilot-kat-2-pro-coder","kwaipilot/kat-coder-pro-v2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"kwaipilot-kat-2-pro-coder","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.3,"max_input_per_1m":0.3,"min_output_per_1m":1.2,"max_output_per_1m":1.2,"min_cache_read_per_1m":0.06,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-opus","name":"claude-4-5-opus","display_name":"Claude Opus 4.5","description":"Anthropic's flagship Claude 4.5 model with top-tier reasoning, vision, and tool-use capabilities for complex tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":64000,"tool_use_system_prompt_tokens":159,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["anthropic-claude-4-5-opus","anthropic.claude-opus-4-5-20251101-v1:0","anthropic/claude-opus-4.5","azure_ai/claude-opus-4-5","claude-opus-4-5","claude-opus-4-5-20251101","claude-opus-4-5-thinking","claude-opus-4-5@20251101","databricks/databricks-claude-opus-4-5","eu.anthropic.claude-opus-4-5-20251101-v1:0","github_copilot/claude-opus-4.5","global.anthropic.claude-opus-4-5-20251101-v1:0","gmi/anthropic/claude-opus-4.5","openrouter/anthropic/claude-opus-4.5","perplexity/anthropic/claude-opus-4-5","publishers/anthropic/models/claude-opus-4-5","publishers/google/models/claude-opus-4-5","us.anthropic.claude-opus-4-5-20251101-v1:0","vercel_ai_gateway/anthropic/claude-opus-4.5","vertex_ai/claude-opus-4-5","vertex_ai/claude-opus-4-5@20251101"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","gmi","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-1-codex","name":"gpt-5-1-codex","display_name":"GPT-5.1 Codex","description":"A GPT-5.1 variant purpose-built for agentic coding tasks in Codex environments, available exclusively via the Responses API.","creator":"openai","family":"gpt","tier":"","version":"5-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-13","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/eu/gpt-5.1-codex","azure/global/gpt-5.1-codex","azure/gpt-5.1-codex","azure/gpt-5.1-codex-2025-11-13","azure/us/gpt-5.1-codex","gpt-5-1-codex","gpt-5.1-codex","openai-gpt-5-1-codex","openai/gpt-5.1-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-1-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":1.25,"min_output_per_1m":10,"max_output_per_1m":10,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-5v-turbo","name":"glm-5v-turbo","display_name":"GLM-5V Turbo","description":"Z AI's first native multimodal agent foundation model, handling image, video, and text inputs for vision-based coding and long-horizon agentic tasks.","creator":"zhipu","family":"glm","tier":"","version":"5v","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text","video"],"output":["text"]},"context_window":200000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2026-04-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["glm-5v-turbo","z-ai/glm-5v-turbo","zai-org/glm-5v-turbo","zai/glm-5v-turbo","zhipu-glm-5v-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-5v-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.2,"max_input_per_1m":1.2,"min_output_per_1m":4,"max_output_per_1m":4,"min_cache_read_per_1m":0.24,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["vercel_ai_gateway"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"step-3-7-flash","name":"step-3-7-flash","display_name":"Step 3.7 Flash","description":"A high-efficiency multimodal Mixture-of-Experts LLM combining a large language backbone with a vision encoder for native image and video understanding.","creator":"step","family":"step","tier":"flash","version":"3-7","type":"language","size_in_bn":201.365,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":256000,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-05-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["step-3-7-flash","stepfun-ai/Step-3.7-Flash","stepfun/step-3.7-flash"],"hf_likes":370,"hf_downloads":50187,"hf_downloads_all_time":50187,"hf_trending_score":51,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"step-3-7-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":0.2,"min_output_per_1m":1.15,"max_output_per_1m":1.15,"min_cache_read_per_1m":0.04,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"zhipu-glm-4-7","name":"glm-4-7","display_name":"GLM-4.7","description":"A multilingual MoE LLM from Z AI designed for complex reasoning, agentic coding, and tool use, building on the GLM-4.6 architecture.","creator":"zhipu","family":"glm4_moe","tier":"","version":"4-7","type":"language","size_in_bn":358.338,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":204800,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-22","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":13,"ids":["accounts/fireworks/models/glm-4p7","baseten/zai-org/GLM-4.7","cerebras/zai-glm-4.7","fireworks_ai/accounts/fireworks/models/glm-4p7","fireworks_ai/glm-4p7","glm-4-7","glm-4-7-251222","glm-4-7-non-reasoning","glm-4.7","glm-4.7-maas","novita/zai-org/glm-4.7","openrouter/z-ai/glm-4.7","publishers/google/models/glm-4.7-maas","together_ai/zai-org/GLM-4.7","vertex_ai/zai-org/glm-4.7-maas","z-ai/glm-4.7","zai-org/glm-4.7","zai-org/GLM-4.7","zai.glm-4.7","zai/glm-4.7","zhipu-glm-4-7"],"hf_likes":2026,"hf_downloads":117151,"hf_downloads_all_time":436300,"hf_trending_score":4,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"zhipu-glm-4-7","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.4,"max_input_per_1m":2.25,"min_output_per_1m":1.75,"max_output_per_1m":2.75,"min_cache_read_per_1m":0.08,"min_cache_write_per_1m":0.06,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":13},"providers":[],"regions":[],"region_info":{}}},{"id":"minimax-m2-5","name":"minimax-m2-5","display_name":"MiniMax M2.5","description":"MiniMax's M2.5 generation MoE language model offering strong reasoning and tool-use performance for complex productivity and agent tasks.","creator":"minimax","family":"minimax_m2","tier":"","version":"5","type":"language","size_in_bn":228.704,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":196608,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-12","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["accounts/fireworks/models/minimax-m2p5","baseten/MiniMaxAI/MiniMax-M2.5","bedrock/ap-northeast-1/minimax.minimax-m2.5","bedrock/ap-south-1/minimax.minimax-m2.5","bedrock/ap-southeast-2/minimax.minimax-m2.5","bedrock/ap-southeast-3/minimax.minimax-m2.5","bedrock/eu-central-1/minimax.minimax-m2.5","bedrock/eu-north-1/minimax.minimax-m2.5","bedrock/eu-south-1/minimax.minimax-m2.5","bedrock/eu-west-1/minimax.minimax-m2.5","bedrock/eu-west-2/minimax.minimax-m2.5","bedrock/sa-east-1/minimax.minimax-m2.5","bedrock/us-east-1/minimax.minimax-m2.5","bedrock/us-east-2/minimax.minimax-m2.5","bedrock/us-west-2/minimax.minimax-m2.5","huggingface-llm-minimax-m2-5","minimax-m2-5","minimax.minimax-m2.5","minimax/minimax-m2.5","minimax/MiniMax-M2.5","minimax/minimax-m2.5:free","MiniMaxAI/MiniMax-M2.5","openrouter/minimax/minimax-m2.5","wandb/MiniMaxAI/MiniMax-M2.5"],"hf_likes":1461,"hf_downloads":928266,"hf_downloads_all_time":1586202,"hf_trending_score":13,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"minimax-m2-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":0.3,"min_output_per_1m":0.9,"max_output_per_1m":1.2,"min_cache_read_per_1m":0.03,"min_cache_write_per_1m":0.375,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-mini","name":"gpt-5-mini","display_name":"GPT-5 Mini","description":"A faster, cost-efficient variant of GPT-5 suited for well-defined tasks and high-volume, low-latency workloads with vision and tool-use support.","creator":"openai","family":"gpt","tier":"mini","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-05","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["azure/eu/gpt-5-mini-2025-08-07","azure/gpt-5-mini","azure/gpt-5-mini-2025-08-07","azure/us/gpt-5-mini-2025-08-07","databricks/databricks-gpt-5-mini","github_copilot/gpt-5-mini","gpt-5-mini","gpt-5-mini-2025-08-07","gpt-5-mini-medium","gpt-5-mini-minimal","oci/openai.gpt-5-mini","openai-gpt-5-mini","openai/gpt-5-mini","openrouter/openai/gpt-5-mini","perplexity/openai/gpt-5-mini","replicate/openai/gpt-5-mini","snowflake/openai-gpt-5-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.24997,"max_input_per_1m":0.3,"min_output_per_1m":1.99997,"max_output_per_1m":2.4,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o3-pro","name":"o3-pro","display_name":"o3 Pro","description":"A high-compute variant of the o3 reasoning series that uses more compute to think harder, providing consistently reliable answers on the most challenging reasoning tasks.","creator":"openai","family":"o","tier":"pro","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":100000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-06-10","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/o3-pro","azure/o3-pro-2025-06-10","o3-pro","o3-pro-2025-06-10","openai-o3-pro","openai/o3-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o3-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":20,"max_input_per_1m":20,"min_output_per_1m":80,"max_output_per_1m":80,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"alibaba-qwen3-max-thinking","name":"qwen3-max-thinking","display_name":"Qwen3 Max Thinking","description":"Alibaba's flagship reasoning-focused LLM in the Qwen3 series, featuring adaptive tool-use and advanced test-time scaling for complex problem solving.","creator":"alibaba","family":"qwen","tier":"max","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Qwen","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-09","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["alibaba-qwen3-max-thinking","alibaba/qwen3-max-thinking","qwen/qwen3-max-thinking","Qwen/Qwen3-Max-Thinking","qwen3-max-thinking","qwen3-max-thinking-preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"alibaba-qwen3-max-thinking","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.78,"max_input_per_1m":1.2,"min_output_per_1m":3.9,"max_output_per_1m":6,"min_cache_read_per_1m":0.24,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"minimax-m2-1","name":"minimax-m2-1","display_name":"MiniMax M2.1","description":"A refined M2.1 sub-version of MiniMax's MoE language model with improved reasoning, tool-use, and implicit caching for agentic tasks.","creator":"minimax","family":"minimax_m2","tier":"","version":"1","type":"language","size_in_bn":228.704,"modalities":{"input":["image","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":196608,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["accounts/fireworks/models/minimax-m2p1","bedrock/ap-northeast-1/minimax.minimax-m2.1","bedrock/ap-south-1/minimax.minimax-m2.1","bedrock/ap-southeast-3/minimax.minimax-m2.1","bedrock/eu-central-1/minimax.minimax-m2.1","bedrock/eu-north-1/minimax.minimax-m2.1","bedrock/eu-south-1/minimax.minimax-m2.1","bedrock/eu-west-1/minimax.minimax-m2.1","bedrock/eu-west-2/minimax.minimax-m2.1","bedrock/sa-east-1/minimax.minimax-m2.1","bedrock/us-east-1/minimax.minimax-m2.1","bedrock/us-east-2/minimax.minimax-m2.1","bedrock/us-west-2/minimax.minimax-m2.1","fireworks_ai/accounts/fireworks/models/minimax-m2p1","fireworks_ai/minimax-m2p1","gmi/MiniMaxAI/MiniMax-M2.1","huggingface-llm-minimax-m2-1","minimax-m2-1","minimax.minimax-m2.1","minimax/minimax-m2.1","minimax/MiniMax-M2.1","novita/minimax/minimax-m2.1","openrouter/minimax/minimax-m2.1"],"hf_likes":1351,"hf_downloads":35651,"hf_downloads_all_time":408444,"hf_trending_score":3,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"minimax-m2-1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.29,"max_input_per_1m":0.3,"min_output_per_1m":0.95,"max_output_per_1m":1.2,"min_cache_read_per_1m":0.03,"min_cache_write_per_1m":0.375,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-medium-3-5","name":"mistral-medium-3-5","display_name":"Mistral Medium 3.5","description":"A mid-tier general-purpose LLM from Mistral offering a balance of performance and efficiency, positioned between the small and large tiers of the Mistral model family.","creator":"mistral","family":"mistral","tier":"","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":262144,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-30","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["mistral-medium-3-5","mistral-medium-3.5","mistral/mistral-medium-3.5","mistralai/mistral-medium-3-5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-medium-3-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.5,"max_input_per_1m":1.5,"min_output_per_1m":7.5,"max_output_per_1m":7.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","mistral","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-1-codex-mini","name":"gpt-5-1-codex-mini","display_name":"GPT-5.1 Codex Mini","description":"A smaller, cost-effective variant of GPT-5.1 Codex optimized for agentic coding tasks with reduced capability and cost.","creator":"openai","family":"gpt","tier":"","version":"5-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-13","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/eu/gpt-5.1-codex-mini","azure/global/gpt-5.1-codex-mini","azure/gpt-5.1-codex-mini","azure/gpt-5.1-codex-mini-2025-11-13","azure/us/gpt-5.1-codex-mini","chatgpt/gpt-5.1-codex-mini","gpt-5-1-codex-mini","gpt-5.1-codex-mini","openai-gpt-5-1-codex-mini","openai/gpt-5.1-codex-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-1-codex-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.25,"max_input_per_1m":0.25,"min_output_per_1m":2,"max_output_per_1m":2,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"step-3-5-flash","name":"step-3-5-flash","display_name":"Step 3.5 Flash","description":"An open-source Mixture-of-Experts reasoning model from StepFun with 196B total parameters (11B active), featuring a 256K context window and tool-calling support.","creator":"step","family":"step3p5","tier":"flash","version":"3-5","type":"language","size_in_bn":199.384,"modalities":{"input":["text"],"output":["text"]},"context_window":262144,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2026-01-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["step-3-5-flash","step-3-5-flash-0202","stepfun-ai/Step-3.5-Flash","stepfun/step-3.5-flash"],"hf_likes":783,"hf_downloads":147877,"hf_downloads_all_time":532020,"hf_trending_score":5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"step-3-5-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.09,"max_input_per_1m":0.09,"min_output_per_1m":0.3,"max_output_per_1m":0.3,"min_cache_read_per_1m":0.02,"min_cache_write_per_1m":0.02,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-sonnet","name":"claude-4-5-sonnet","display_name":"Claude Sonnet 4.5","description":"A versatile Claude 4.5 model with strong reasoning, vision, and tool-use capabilities suited for a broad range of tasks.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":64000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":"2025-07","supported_reasoning_efforts":["default"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["anthropic-claude-4-5-sonnet","anthropic.claude-sonnet-4-5-20250929-v1:0","anthropic/claude-sonnet-4.5","au.anthropic.claude-sonnet-4-5-20250929-v1:0","azure_ai/claude-sonnet-4-5","bedrock/us-gov-east-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-east-1/claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/claude-sonnet-4-5-20250929-v1:0","claude-4-5-sonnet","claude-4-5-sonnet-thinking","claude-sonnet-4-5","claude-sonnet-4-5-20250929","claude-sonnet-4-5-20250929-v1:0","claude-sonnet-4-5@20250929","databricks/databricks-claude-sonnet-4-5","eu.anthropic.claude-sonnet-4-5-20250929-v1:0","github_copilot/claude-sonnet-4.5","global.anthropic.claude-sonnet-4-5-20250929-v1:0","gmi/anthropic/claude-sonnet-4.5","jp.anthropic.claude-sonnet-4-5-20250929-v1:0","openrouter/anthropic/claude-sonnet-4.5","perplexity/anthropic/claude-sonnet-4-5","publishers/anthropic/models/claude-sonnet-4-5","publishers/google/models/claude-sonnet-4-5","replicate/anthropic/claude-4.5-sonnet","snowflake/claude-sonnet-4-5","us-gov.anthropic.claude-sonnet-4-5-20250929-v1:0","us.anthropic.claude-sonnet-4-5-20250929-v1:0","vercel_ai_gateway/anthropic/claude-sonnet-4.5","vertex_ai/claude-sonnet-4-5","vertex_ai/claude-sonnet-4-5@20250929"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.99999,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"minimax-m2","name":"minimax-m2","display_name":"MiniMax M2","description":"MiniMax's second-generation MoE language model with reasoning and tool-use capabilities, built for complex agentic and productivity workflows.","creator":"minimax","family":"mixtral","tier":"","version":null,"type":"language","size_in_bn":228.704,"modalities":{"input":["text"],"output":["text"]},"context_window":205000,"max_output_tokens":196608,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["accounts/fireworks/models/minimax-m2","fireworks_ai/accounts/fireworks/models/minimax-m2","huggingface-llm-minimax-m2","minimax-m2","minimax.minimax-m2","minimax/minimax-m2","minimax/MiniMax-M2","novita/minimax/minimax-m2","openrouter/minimax/minimax-m2"],"hf_likes":1491,"hf_downloads":69357,"hf_downloads_all_time":1925616,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"minimax-m2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.255,"max_input_per_1m":0.3,"min_output_per_1m":1,"max_output_per_1m":1.2,"min_cache_read_per_1m":0.03,"min_cache_write_per_1m":0.03,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"kwaipilot-kat-1-pro-coder","name":"kat-1-pro-coder","display_name":"KwaiPilot KAT 1 Pro Coder","description":"An agentic coding LLM from KwaiKAT's KAT series, designed for complex real-world software engineering tasks with strong reasoning and tool-use capabilities.","creator":"kwaipilot","family":"kat","tier":"pro","version":"1","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":256000,"max_output_tokens":32000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-10-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["kat-coder-pro-v1","kwaipilot-kat-1-pro-coder","kwaipilot/kat-coder-pro-v1"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"kwaipilot-kat-1-pro-coder","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.03,"max_input_per_1m":0.03,"min_output_per_1m":1.2,"max_output_per_1m":1.2,"min_cache_read_per_1m":0.06,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["vercel_ai_gateway"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"nvidia-nemotron-super-3-120b-a12b","name":"nvidia-nemotron-super-3-120b-a12b","display_name":"Nemotron Super 3 120B A12B","description":"A 120B-parameter hybrid MoE Nemotron Super 3 model with 12B active parameters, optimized by NVIDIA for compute-efficient reasoning in specialized agentic systems.","creator":"nvidia","family":"nemotron_h","tier":"","version":"3","type":"language","size_in_bn":120,"modalities":{"input":["text"],"output":["text"]},"context_window":1000000,"max_output_tokens":262144,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["accounts/fireworks/models/nvidia-nemotron-3-super-120b-a12b-fp8","accounts/fireworks/models/nvidia-nemotron-3-super-120b-a12b-nvfp4","huggingface-llm-nvidia-nemotron-3-super-120b-a12b-bf16","nvidia-nemotron-3-super-120b-a12b","nvidia-nemotron-super-3-120b-a12b","nvidia/nemotron-3-super-120b-a12b","nvidia/nemotron-3-super-120b-a12b:free","nvidia/NVIDIA-Nemotron-3-Super-120B-A12B"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"nvidia-nemotron-super-3-120b-a12b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.09,"max_input_per_1m":0.15,"min_output_per_1m":0.45,"max_output_per_1m":0.65,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}}],"pagination":{"page_size":50,"has_next":true,"next_token":"NTA","total_count":260},"meta":{"updated_at":"2026-06-13","request_id":"1d7d34fc-e7b9-4ecf-ab4c-9db7d0377bbc","execution_ms":20}}