{"data":[{"id":"anthropic-claude-5-fable","name":"claude-5-fable","display_name":"Claude Fable 5","description":"A highly capable Claude LLM optimized for demanding reasoning and long-horizon agentic tasks, with vision, tool-use, and explicit-caching support.","creator":"anthropic","family":"claude","tier":"fable","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-06-09","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["anthropic-claude-5-fable","anthropic.claude-fable-5","anthropic/claude-fable-5","au.anthropic.claude-fable-5","azure_ai/claude-fable-5","claude-fable-5","eu.anthropic.claude-fable-5","global.anthropic.claude-fable-5","publishers/anthropic/models/claude-fable-5","publishers/google/models/claude-fable-5","us.anthropic.claude-fable-5","vertex_ai/claude-fable-5","vertex_ai/claude-fable-5@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-5-fable","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":10,"max_input_per_1m":12,"min_output_per_1m":50,"max_output_per_1m":60,"min_cache_read_per_1m":1,"min_cache_write_per_1m":12.5,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-8-opus","name":"claude-4-8-opus","display_name":"Claude Opus 4.8","description":"A flagship Anthropic LLM in the Claude Opus tier at version 4.8, supporting adaptive reasoning, vision, tool use, file input, and web search across multiple geographic regions.","creator":"anthropic","family":"claude","tier":"opus","version":"4-8","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-05-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-8-opus","anthropic.claude-opus-4-8","anthropic/claude-opus-4-8","anthropic/claude-opus-4.8","au.anthropic.claude-opus-4-8","azure_ai/claude-opus-4-8","claude-opus-4-8","eu.anthropic.claude-opus-4-8","global.anthropic.claude-opus-4-8","jp.anthropic.claude-opus-4-8","publishers/anthropic/models/claude-opus-4-8","publishers/google/models/claude-opus-4-8","us.anthropic.claude-opus-4-8","vertex_ai/claude-opus-4-8","vertex_ai/claude-opus-4-8@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-8-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-5","name":"gpt-5-5","display_name":"GPT-5.5","description":"A GPT-5 series large language model from OpenAI targeting high-capability reasoning and generation tasks at the xhigh performance tier.","creator":"openai","family":"gpt","tier":"","version":"5-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-12","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-5.5","azure/gpt-5.5-2026-04-23","bedrock_mantle/openai.gpt-5.5","gpt-5-5","gpt-5-5-high","gpt-5-5-instant-05-26","gpt-5-5-low","gpt-5-5-medium","gpt-5-5-non-reasoning","gpt-5.5","gpt-5.5-2026-04-23","openai-gpt-5-5","openai/gpt-5.5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":30,"max_output_per_1m":36,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-7-opus","name":"claude-4-7-opus","display_name":"Claude Opus 4.7","description":"Anthropic's Claude 4.7 Opus model with adaptive reasoning at maximum effort, vision, and tool-use for complex enterprise tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-7","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-04-16","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-7-opus","anthropic.claude-opus-4-7","anthropic/claude-opus-4-7","anthropic/claude-opus-4.7","au.anthropic.claude-opus-4-7","azure_ai/claude-opus-4-7","claude-opus-4-7","claude-opus-4-7-20260416","claude-opus-4-7-non-reasoning","eu.anthropic.claude-opus-4-7","global.anthropic.claude-opus-4-7","jp.anthropic.claude-opus-4-7","openrouter/anthropic/claude-opus-4.7","perplexity/anthropic/claude-opus-4-7","publishers/anthropic/models/claude-opus-4-7","publishers/google/models/claude-opus-4-7","us.anthropic.claude-opus-4-7","vertex_ai/claude-opus-4-7","vertex_ai/claude-opus-4-7@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-7-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4","name":"gpt-5-4","display_name":"GPT-5.4","description":"OpenAI's frontier reasoning model for complex professional work, supporting vision, file input, tool use, and configurable reasoning effort from none to xhigh.","creator":"openai","family":"gpt","tier":"","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure_ai/gpt-5.4","azure_ai/gpt-5.4-2026-03-05","azure/gpt-5.4","azure/gpt-5.4-2026-03-05","bedrock_mantle/openai.gpt-5.4","chatgpt/gpt-5.4","gpt-5-4","gpt-5-4-low","gpt-5-4-non-reasoning","gpt-5.4","gpt-5.4-2026-03-05","openai-gpt-5-4","openai/gpt-5.4"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.5,"max_input_per_1m":3,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.25,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"moonshot-kimi-k2-6","name":"kimi-k2-6","display_name":"Kimi K2.6","description":"An open-source native multimodal agentic LLM specializing in long-horizon coding, coding-driven design, autonomous execution, and swarm-based task orchestration.","creator":"moonshot","family":"kimi_k25","tier":"","version":"k2-6","type":"language","size_in_bn":1058.589,"modalities":{"input":["image","pdf","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":262142,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-20","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/kimi-k2p6","azure_ai/kimi-k2.6","kimi-k2-6","kimi-k2-6-non-reasoning","moonshot-kimi-k2-6","moonshot/kimi-k2.6","moonshotai/kimi-k2.6","moonshotai/Kimi-K2.6","moonshotai/kimi-k2.6:free"],"hf_likes":568,"hf_downloads":8241,"hf_downloads_all_time":8241,"hf_trending_score":560,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"moonshot-kimi-k2-6","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.68,"max_input_per_1m":1.2,"min_output_per_1m":3.4,"max_output_per_1m":4.5,"min_cache_read_per_1m":0.16,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-3-codex","name":"gpt-5-3-codex","display_name":"GPT-5.3 Codex","description":"A GPT-5.3 variant optimized for agentic coding tasks in Codex environments, supporting multiple reasoning effort levels from low to xhigh.","creator":"openai","family":"gpt","tier":"","version":"5-3","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-02-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/gpt-5.3-codex","chatgpt/gpt-5.3-codex","github_copilot/gpt-5.3-codex","gpt-5-3-codex","gpt-5.3-codex","openai-gpt-5-3-codex","openai/gpt-5.3-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-3-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.75,"max_input_per_1m":1.75,"min_output_per_1m":14,"max_output_per_1m":14,"min_cache_read_per_1m":0.175,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-2","name":"gpt-5-2","display_name":"GPT-5.2","description":"A frontier GPT-5 generation LLM for complex professional work with configurable reasoning effort, available via the Responses API.","creator":"openai","family":"gpt","tier":"","version":"5-2","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-5.2","azure/gpt-5.2-2025-12-11","chatgpt/gpt-5.2","github_copilot/gpt-5.2","gmi/openai/gpt-5.2","gpt-5-2","gpt-5-2-medium","gpt-5-2-non-reasoning","gpt-5.2","gpt-5.2-2025-12-11","openai-gpt-5-2","openai/gpt-5.2","openrouter/openai/gpt-5.2","perplexity/openai/gpt-5.2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.75,"max_input_per_1m":2.1,"min_output_per_1m":14,"max_output_per_1m":16.8,"min_cache_read_per_1m":0.175,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","gmi","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-2-codex","name":"gpt-5-2-codex","display_name":"GPT-5.2 Codex","description":"A GPT-5.2 variant optimized for agentic coding in Codex environments, supporting low through xhigh reasoning effort settings.","creator":"openai","family":"gpt","tier":"","version":"5-2","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-01-14","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/gpt-5.2-codex","chatgpt/gpt-5.2-codex","gpt-5-2-codex","gpt-5.2-codex","openai-gpt-5-2-codex","openai/gpt-5.2-codex","openrouter/openai/gpt-5.2-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-2-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.75,"max_input_per_1m":1.75,"min_output_per_1m":14,"max_output_per_1m":14,"min_cache_read_per_1m":0.175,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4-mini","name":"gpt-5-4-mini","display_name":"GPT-5.4 Mini","description":"A faster, cost-efficient variant of GPT-5.4 designed for high-volume workloads while retaining strong reasoning, vision, and tool-use capabilities.","creator":"openai","family":"gpt","tier":"mini","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure_ai/gpt-5.4-mini","azure_ai/gpt-5.4-mini-2026-03-17","azure/gpt-5.4-mini","azure/gpt-5.4-mini-2026-03-17","gpt-5-4-mini","gpt-5-4-mini-medium","gpt-5-4-mini-non-reasoning","gpt-5.4-mini","gpt-5.4-mini-2026-03-17","openai-gpt-5-4-mini","openai/gpt-5.4-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.75,"max_input_per_1m":0.9,"min_output_per_1m":4.5,"max_output_per_1m":5.4,"min_cache_read_per_1m":0.075,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-1","name":"gpt-5-1","display_name":"GPT-5.1","description":"OpenAI's flagship LLM for coding and agentic tasks with configurable reasoning effort levels, available via the Responses API.","creator":"openai","family":"gpt","tier":"","version":"5-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-13","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/eu/gpt-5.1","azure/global/gpt-5.1","azure/gpt-5.1","azure/gpt-5.1-2025-11-13","azure/us/gpt-5.1","databricks/databricks-gpt-5-1","github_copilot/gpt-5.1","gmi/openai/gpt-5.1","gpt-5-1","gpt-5-1-non-reasoning","gpt-5.1","gpt-5.1-2025-11-13","openai-gpt-5-1","openai/gpt-5.1","perplexity/openai/gpt-5.1"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.24999,"max_input_per_1m":1.5,"min_output_per_1m":9.99999,"max_output_per_1m":12,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"moonshot-kimi-k2-5","name":"kimi-k2-5","display_name":"Kimi K2.5","description":"An updated iteration of Kimi K2 with enhanced reasoning, vision, and tool-use capabilities, supporting implicit caching for efficient inference.","creator":"moonshot","family":"kimi_k25","tier":"","version":"k2-5","type":"language","size_in_bn":1058.589,"modalities":{"input":["image","text","video"],"output":["text"]},"context_window":262144,"max_output_tokens":98304,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-01-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["@cf/moonshotai/kimi-k2.5","accounts/fireworks/models/kimi-k2p5","azure_ai/kimi-k2.5","baseten/moonshotai/Kimi-K2.5","bedrock/ap-northeast-1/moonshotai.kimi-k2.5","bedrock/ap-south-1/moonshotai.kimi-k2.5","bedrock/ap-southeast-3/moonshotai.kimi-k2.5","bedrock/eu-north-1/moonshotai.kimi-k2.5","bedrock/moonshotai.kimi-k2.5","bedrock/sa-east-1/moonshotai.kimi-k2.5","bedrock/us-east-1/moonshotai.kimi-k2.5","bedrock/us-east-2/moonshotai.kimi-k2.5","bedrock/us-west-2/moonshotai.kimi-k2.5","fireworks_ai/accounts/fireworks/models/kimi-k2p5","fireworks_ai/kimi-k2p5","huggingface-llm-kimi-k2-5","kimi-k2-5","kimi-k2-5-non-reasoning","kimi-k2.5","moonshot-kimi-k2-5","moonshot/kimi-k2.5","moonshotai.kimi-k2.5","moonshotai/kimi-k2.5","moonshotai/Kimi-K2.5","openrouter/moonshotai/kimi-k2.5","together_ai/moonshotai/Kimi-K2.5","wandb/moonshotai/Kimi-K2.5"],"hf_likes":2753,"hf_downloads":5222216,"hf_downloads_all_time":9851195,"hf_trending_score":34,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"moonshot-kimi-k2-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.375,"max_input_per_1m":0.6,"min_output_per_1m":2.025,"max_output_per_1m":3.011,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":12},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-opus","name":"claude-4-6-opus","display_name":"Claude Opus 4.6","description":"Anthropic's high-capability Claude 4.6 Opus model with advanced reasoning, vision, and tool-use for demanding workloads.","creator":"anthropic","family":"claude","tier":"opus","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-05","earliest_deprecation_date":"2026-06-29","deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-opus","anthropic.claude-opus-4-6-v1","anthropic/claude-opus-4.6","anthropic/claude-opus-4.6-fast","au.anthropic.claude-opus-4-6-v1","azure_ai/claude-opus-4-6","claude-opus-4-6","claude-opus-4-6-20260205","claude-opus-4-6-adaptive","eu.anthropic.claude-opus-4-6-v1","github_copilot/claude-opus-4.6-fast","global.anthropic.claude-opus-4-6-v1","openrouter/anthropic/claude-opus-4.6","perplexity/anthropic/claude-opus-4-6","publishers/anthropic/models/claude-opus-4-6","publishers/google/models/claude-opus-4-6","us.anthropic.claude-opus-4-6-v1","vercel_ai_gateway/anthropic/claude-opus-4.6","vertex_ai/claude-opus-4-6","vertex_ai/claude-opus-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":30,"min_output_per_1m":25,"max_output_per_1m":150,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5","name":"gpt-5","display_name":"GPT-5","description":"OpenAI's frontier LLM with integrated reasoning, vision, image generation, and tool-use capabilities designed for complex coding and agentic tasks.","creator":"openai","family":"gpt","tier":"","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["azure/eu/gpt-5-2025-08-07","azure/gpt-5","azure/gpt-5-2025-08-07","azure/us/gpt-5-2025-08-07","databricks/databricks-gpt-5","github_copilot/gpt-5","gmi/openai/gpt-5","gpt-5","gpt-5-2025-08-07","gpt-5-chatgpt","gpt-5-low","gpt-5-medium","gpt-5-minimal","oci/openai.gpt-5","openai-gpt-5","openai/gpt-5","openrouter/openai/gpt-5","replicate/openai/gpt-5","snowflake/openai-gpt-5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.24999,"max_input_per_1m":1.5,"min_output_per_1m":9.99999,"max_output_per_1m":12,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-codex","name":"gpt-5-codex","display_name":"GPT-5 Codex","description":"A GPT-5 variant optimized for agentic coding tasks in Codex environments, available via the Responses API with regularly updated snapshots.","creator":"openai","family":"gpt","tier":"","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/gpt-5-codex","gpt-5-codex","openai-gpt-5-codex","openai/gpt-5-codex","openrouter/openai/gpt-5-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.125,"max_input_per_1m":1.25,"min_output_per_1m":10,"max_output_per_1m":10,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-sonnet","name":"claude-4-6-sonnet","display_name":"Claude Sonnet 4.6","description":"A capable Claude 4.6 Sonnet model with reasoning, vision, and tool-use support for a wide range of applications.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-sonnet","anthropic.claude-sonnet-4-6","anthropic/claude-sonnet-4-6","anthropic/claude-sonnet-4.6","au.anthropic.claude-sonnet-4-6","azure_ai/claude-sonnet-4-6","claude-sonnet-4-6","claude-sonnet-4-6-adaptive","claude-sonnet-4-6-non-reasoning-low-effort","eu.anthropic.claude-sonnet-4-6","global.anthropic.claude-sonnet-4-6","jp.anthropic.claude-sonnet-4-6","openrouter/anthropic/claude-sonnet-4.6","publishers/anthropic/models/claude-sonnet-4-6","publishers/google/models/claude-sonnet-4-6","snowflake/claude-sonnet-4-6","us.anthropic.claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":3,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4-nano","name":"gpt-5-4-nano","display_name":"GPT-5.4 Nano","description":"The smallest and fastest GPT-5.4 tier, optimized for speed- and cost-sensitive tasks such as classification, data extraction, ranking, and sub-agent orchestration.","creator":"openai","family":"gpt","tier":"nano","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure_ai/gpt-5.4-nano","azure_ai/gpt-5.4-nano-2026-03-17","azure/gpt-5.4-nano","azure/gpt-5.4-nano-2026-03-17","gpt-5-4-nano","gpt-5-4-nano-medium","gpt-5-4-nano-non-reasoning","gpt-5.4-nano","gpt-5.4-nano-2026-03-17","openai-gpt-5-4-nano","openai/gpt-5.4-nano"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4-nano","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":0.24,"min_output_per_1m":1.25,"max_output_per_1m":1.5,"min_cache_read_per_1m":0.02,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-opus","name":"claude-4-5-opus","display_name":"Claude Opus 4.5","description":"Anthropic's flagship Claude 4.5 model with top-tier reasoning, vision, and tool-use capabilities for complex tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":64000,"tool_use_system_prompt_tokens":159,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["anthropic-claude-4-5-opus","anthropic.claude-opus-4-5-20251101-v1:0","anthropic/claude-opus-4.5","azure_ai/claude-opus-4-5","claude-opus-4-5","claude-opus-4-5-20251101","claude-opus-4-5-thinking","claude-opus-4-5@20251101","databricks/databricks-claude-opus-4-5","eu.anthropic.claude-opus-4-5-20251101-v1:0","github_copilot/claude-opus-4.5","global.anthropic.claude-opus-4-5-20251101-v1:0","gmi/anthropic/claude-opus-4.5","openrouter/anthropic/claude-opus-4.5","perplexity/anthropic/claude-opus-4-5","publishers/anthropic/models/claude-opus-4-5","publishers/google/models/claude-opus-4-5","us.anthropic.claude-opus-4-5-20251101-v1:0","vercel_ai_gateway/anthropic/claude-opus-4.5","vertex_ai/claude-opus-4-5","vertex_ai/claude-opus-4-5@20251101"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","gmi","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-1-codex","name":"gpt-5-1-codex","display_name":"GPT-5.1 Codex","description":"A GPT-5.1 variant purpose-built for agentic coding tasks in Codex environments, available exclusively via the Responses API.","creator":"openai","family":"gpt","tier":"","version":"5-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-13","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/eu/gpt-5.1-codex","azure/global/gpt-5.1-codex","azure/gpt-5.1-codex","azure/gpt-5.1-codex-2025-11-13","azure/us/gpt-5.1-codex","gpt-5-1-codex","gpt-5.1-codex","openai-gpt-5-1-codex","openai/gpt-5.1-codex"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-1-codex","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":1.25,"min_output_per_1m":10,"max_output_per_1m":10,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-mini","name":"gpt-5-mini","display_name":"GPT-5 Mini","description":"A faster, cost-efficient variant of GPT-5 suited for well-defined tasks and high-volume, low-latency workloads with vision and tool-use support.","creator":"openai","family":"gpt","tier":"mini","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-05","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["azure/eu/gpt-5-mini-2025-08-07","azure/gpt-5-mini","azure/gpt-5-mini-2025-08-07","azure/us/gpt-5-mini-2025-08-07","databricks/databricks-gpt-5-mini","github_copilot/gpt-5-mini","gpt-5-mini","gpt-5-mini-2025-08-07","gpt-5-mini-medium","gpt-5-mini-minimal","oci/openai.gpt-5-mini","openai-gpt-5-mini","openai/gpt-5-mini","openrouter/openai/gpt-5-mini","perplexity/openai/gpt-5-mini","replicate/openai/gpt-5-mini","snowflake/openai-gpt-5-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.24997,"max_input_per_1m":0.3,"min_output_per_1m":1.99997,"max_output_per_1m":2.4,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o3-pro","name":"o3-pro","display_name":"o3 Pro","description":"A high-compute variant of the o3 reasoning series that uses more compute to think harder, providing consistently reliable answers on the most challenging reasoning tasks.","creator":"openai","family":"o","tier":"pro","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":100000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-06-10","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/o3-pro","azure/o3-pro-2025-06-10","o3-pro","o3-pro-2025-06-10","openai-o3-pro","openai/o3-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o3-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":20,"max_input_per_1m":20,"min_output_per_1m":80,"max_output_per_1m":80,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-medium-3-5","name":"mistral-medium-3-5","display_name":"Mistral Medium 3.5","description":"A mid-tier general-purpose LLM from Mistral offering a balance of performance and efficiency, positioned between the small and large tiers of the Mistral model family.","creator":"mistral","family":"mistral","tier":"","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":262144,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-30","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["mistral-medium-3-5","mistral-medium-3.5","mistral/mistral-medium-3.5","mistralai/mistral-medium-3-5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-medium-3-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.5,"max_input_per_1m":1.5,"min_output_per_1m":7.5,"max_output_per_1m":7.5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","mistral","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-1-codex-mini","name":"gpt-5-1-codex-mini","display_name":"GPT-5.1 Codex Mini","description":"A smaller, cost-effective variant of GPT-5.1 Codex optimized for agentic coding tasks with reduced capability and cost.","creator":"openai","family":"gpt","tier":"","version":"5-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":400000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-13","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/eu/gpt-5.1-codex-mini","azure/global/gpt-5.1-codex-mini","azure/gpt-5.1-codex-mini","azure/gpt-5.1-codex-mini-2025-11-13","azure/us/gpt-5.1-codex-mini","chatgpt/gpt-5.1-codex-mini","gpt-5-1-codex-mini","gpt-5.1-codex-mini","openai-gpt-5-1-codex-mini","openai/gpt-5.1-codex-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-1-codex-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.25,"max_input_per_1m":0.25,"min_output_per_1m":2,"max_output_per_1m":2,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-sonnet","name":"claude-4-5-sonnet","display_name":"Claude Sonnet 4.5","description":"A versatile Claude 4.5 model with strong reasoning, vision, and tool-use capabilities suited for a broad range of tasks.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":64000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":"2025-07","supported_reasoning_efforts":["default"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["anthropic-claude-4-5-sonnet","anthropic.claude-sonnet-4-5-20250929-v1:0","anthropic/claude-sonnet-4.5","au.anthropic.claude-sonnet-4-5-20250929-v1:0","azure_ai/claude-sonnet-4-5","bedrock/us-gov-east-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-east-1/claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/claude-sonnet-4-5-20250929-v1:0","claude-4-5-sonnet","claude-4-5-sonnet-thinking","claude-sonnet-4-5","claude-sonnet-4-5-20250929","claude-sonnet-4-5-20250929-v1:0","claude-sonnet-4-5@20250929","databricks/databricks-claude-sonnet-4-5","eu.anthropic.claude-sonnet-4-5-20250929-v1:0","github_copilot/claude-sonnet-4.5","global.anthropic.claude-sonnet-4-5-20250929-v1:0","gmi/anthropic/claude-sonnet-4.5","jp.anthropic.claude-sonnet-4-5-20250929-v1:0","openrouter/anthropic/claude-sonnet-4.5","perplexity/anthropic/claude-sonnet-4-5","publishers/anthropic/models/claude-sonnet-4-5","publishers/google/models/claude-sonnet-4-5","replicate/anthropic/claude-4.5-sonnet","snowflake/claude-sonnet-4-5","us-gov.anthropic.claude-sonnet-4-5-20250929-v1:0","us.anthropic.claude-sonnet-4-5-20250929-v1:0","vercel_ai_gateway/anthropic/claude-sonnet-4.5","vertex_ai/claude-sonnet-4-5","vertex_ai/claude-sonnet-4-5@20250929"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.99999,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-oss-120b","name":"gpt-oss-120b","display_name":"GPT OSS 120B","description":"A 120-billion-parameter open-weights GPT model from OpenAI designed for reasoning-intensive tasks with implicit caching support.","creator":"openai","family":"gpt_oss","tier":"","version":null,"type":"language","size_in_bn":120,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":131072,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":21,"ids":["@cf/openai/gpt-oss-120b","accounts/fireworks/models/gpt-oss-120b","azure_ai/gpt-oss-120b","baseten/openai/gpt-oss-120b","bedrock_mantle/openai.gpt-oss-120b","cerebras/gpt-oss-120b","crusoe/openai/gpt-oss-120b","databricks/databricks-gpt-oss-120b","deepinfra/openai/gpt-oss-120b","fireworks_ai/accounts/fireworks/models/gpt-oss-120b","gpt-oss-120b","gpt-oss-120b-low","gpt-oss-120b-maas","groq/openai/gpt-oss-120b","lemonade/gpt-oss-120b-mxfp-GGUF","novita/openai/gpt-oss-120b","ollama/gpt-oss:120b-cloud","openai-gpt-oss-120b","openai-reasoning-gpt-oss-120b","openai.gpt-oss-120b-1:0","openai/gpt-oss-120b","openai/gpt-oss-120b:free","openrouter/openai/gpt-oss-120b","ovhcloud/gpt-oss-120b","publishers/google/models/gpt-oss-120b-maas","replicate/openai/gpt-oss-120b","sambanova/gpt-oss-120b","together_ai/openai/gpt-oss-120b","vertex_ai/openai/gpt-oss-120b-maas","wandb/openai/gpt-oss-120b","watsonx/openai/gpt-oss-120b"],"hf_likes":4719,"hf_downloads":3524674,"hf_downloads_all_time":32348365,"hf_trending_score":25,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-oss-120b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.039,"max_input_per_1m":15,"min_output_per_1m":0.18,"max_output_per_1m":60,"min_cache_read_per_1m":0.075,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":21},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o4-mini","name":"o4-mini","display_name":"o4 Mini","description":"A compact o-series reasoning model optimized for fast, cost-efficient performance in coding and visual tasks, with strong multimodal reasoning capabilities.","creator":"openai","family":"o","tier":"mini","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":100000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-16","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure/o4-mini","azure/o4-mini-2025-04-16","azure/us/o4-mini-2025-04-16","ft:o4-mini-2025-04-16","o4-mini","o4-mini-2025-04-16","openai-o4-mini","openai/o4-mini","replicate/openai/o4-mini","vercel_ai_gateway/openai/o4-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o4-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1,"max_input_per_1m":4,"min_output_per_1m":4,"max_output_per_1m":16,"min_cache_read_per_1m":0.275,"min_cache_write_per_1m":null,"min_reasoning_per_1m":4,"cheapest_providers":["replicate"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3-2","name":"v3-2","display_name":"DeepSeek V3.2","description":"DeepSeek's V3.2 MoE LLM featuring implicit caching support and improved tool-use capabilities over the V3.1 generation.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":12,"ids":["accounts/fireworks/models/deepseek-v3p2","azure_ai/deepseek-v3.2","bedrock/ap-northeast-1/deepseek.v3.2","bedrock/ap-south-1/deepseek.v3.2","bedrock/ap-southeast-3/deepseek.v3.2","bedrock/eu-north-1/deepseek.v3.2","bedrock/sa-east-1/deepseek.v3.2","bedrock/us-east-1/deepseek.v3.2","bedrock/us-east-2/deepseek.v3.2","bedrock/us-west-2/deepseek.v3.2","deepseek-ai/DeepSeek-V3.2","deepseek-llm-deepseek-v3-2","deepseek-v3-2","deepseek-v3-2-251201","deepseek-v3-2-reasoning","deepseek-v3.2-maas","deepseek-v3.2685","deepseek.v3.2","deepseek/deepseek-v3.2","eu.deepseek.v3.2","fireworks_ai/accounts/fireworks/models/deepseek-v3p2","gmi/deepseek-ai/DeepSeek-V3.2","novita/deepseek/deepseek-v3.2","openrouter/deepseek/deepseek-v3.2","publishers/google/models/deepseek-v3.2-maas","us.deepseek.v3.2","vertex_ai/deepseek-ai/deepseek-v3.2-maas"],"hf_likes":1413,"hf_downloads":10366446,"hf_downloads_all_time":11229842,"hf_trending_score":6,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2288,"max_input_per_1m":0.62,"min_output_per_1m":0.3432,"max_output_per_1m":1.85,"min_cache_read_per_1m":0.028,"min_cache_write_per_1m":0.056,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":12},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-haiku","name":"claude-4-5-haiku","display_name":"Claude Haiku 4.5","description":"A fast, lightweight Claude 4.5 model with vision, file input, and tool-use support optimized for low-latency applications.","creator":"anthropic","family":"claude","tier":"haiku","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":64000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-02","training_data_cutoff":"2025-07","supported_reasoning_efforts":["default"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-15","earliest_deprecation_date":"2026-10-15","deprecated":false,"has_pricing":true,"provider_count":9,"ids":["anthropic-claude-4-5-haiku","anthropic.claude-haiku-4-5-20251001-v1:0","anthropic.claude-haiku-4-5@20251001","anthropic/claude-haiku-4-5","anthropic/claude-haiku-4.5","apac.anthropic.claude-haiku-4-5-20251001-v1:0","au.anthropic.claude-haiku-4-5-20251001-v1:0","azure_ai/claude-haiku-4-5","bedrock/us-gov-east-1/anthropic.claude-haiku-4-5-20251001-v1:0","bedrock/us-gov-west-1/anthropic.claude-haiku-4-5-20251001-v1:0","claude-4-5-haiku","claude-4-5-haiku-reasoning","claude-haiku-4-5","claude-haiku-4-5-20251001","claude-haiku-4-5@20251001","databricks/databricks-claude-haiku-4-5","eu.anthropic.claude-haiku-4-5-20251001-v1:0","github_copilot/claude-haiku-4.5","global.anthropic.claude-haiku-4-5-20251001-v1:0","jp.anthropic.claude-haiku-4-5-20251001-v1:0","openrouter/anthropic/claude-haiku-4.5","perplexity/anthropic/claude-haiku-4-5","publishers/anthropic/models/claude-haiku-4-5","publishers/google/models/claude-haiku-4-5","replicate/anthropic/claude-4.5-haiku","snowflake/claude-haiku-4-5","us.anthropic.claude-haiku-4-5-20251001-v1:0","vercel_ai_gateway/anthropic/claude-haiku-4.5","vertex_ai/claude-haiku-4-5","vertex_ai/claude-haiku-4-5@20251001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-haiku","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1,"max_input_per_1m":1.2,"min_output_per_1m":5,"max_output_per_1m":6,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":1.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","replicate","vercel_ai_gateway"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o1","name":"o1","display_name":"o1","description":"A reinforcement-learning-trained reasoning model that produces a long internal chain of thought before responding, excelling at complex multi-step problems across math, science, and coding.","creator":"openai","family":"o","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":100000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-10","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-12-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure/eu/o1-2024-12-17","azure/o1","azure/o1-2024-12-17","azure/us/o1-2024-12-17","o1","o1-2024-12-17","openai-o1","openai/o1","openrouter/openai/o1","replicate/openai/o1","vercel_ai_gateway/openai/o1"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":15,"max_input_per_1m":15,"min_output_per_1m":60,"max_output_per_1m":60,"min_cache_read_per_1m":7.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":60,"cheapest_providers":["azure_aifoundry","openai","openrouter","replicate","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3-2-speciale","name":"deepseek-v3-2-speciale","display_name":"DeepSeek V3.2 Speciale","description":"A high-compute variant of DeepSeek V3.2 optimized for maximum reasoning and agentic performance using DeepSeek Sparse Attention for long-context tasks.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.2","type":"language","size_in_bn":685.397,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-01","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["azure_ai/deepseek-v3.2-speciale","deepseek-v3-2-speciale","deepseek/deepseek-v3.2-speciale"],"hf_likes":703,"hf_downloads":12474,"hf_downloads_all_time":252919,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3-2-speciale","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.58,"max_input_per_1m":0.58,"min_output_per_1m":1.68,"max_output_per_1m":1.68,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-nano","name":"gpt-5-nano","display_name":"GPT-5 Nano","description":"The smallest and fastest GPT-5 tier, designed for summarization, classification, and other speed- and cost-sensitive workloads with vision and image-generation support.","creator":"openai","family":"gpt","tier":"nano","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":5000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-05","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["azure/eu/gpt-5-nano-2025-08-07","azure/gpt-5-nano","azure/gpt-5-nano-2025-08-07","azure/us/gpt-5-nano-2025-08-07","databricks/databricks-gpt-5-nano","gpt-5-nano","gpt-5-nano-2025-08-07","gpt-5-nano-medium","gpt-5-nano-minimal","oci/openai.gpt-5-nano","openai-gpt-5-nano","openai/gpt-5-nano","openrouter/openai/gpt-5-nano","replicate/openai/gpt-5-nano","snowflake/openai-gpt-5-nano"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-nano","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.04998,"max_input_per_1m":0.066,"min_output_per_1m":0.39998,"max_output_per_1m":0.48,"min_cache_read_per_1m":0.005,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-4-1","name":"gpt-4-1","display_name":"GPT-4.1","description":"An OpenAI LLM excelling at instruction following and tool calling with a 1M-token context window and low latency without a reasoning step.","creator":"openai","family":"gpt","tier":"","version":"4-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1047576,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-14","earliest_deprecation_date":"2026-11-04","deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-4.1","azure/gpt-4.1-2025-04-14","azure/us/gpt-4.1-2025-04-14","ft:gpt-4.1-2025-04-14","github_copilot/gpt-4.1","github_copilot/gpt-4.1-2025-04-14","gpt-4-1","gpt-4.1","gpt-4.1-2025-04-14","openai-gpt-4-1","openai/gpt-4.1","openrouter/openai/gpt-4.1","replicate/openai/gpt-4.1","snowflake/openai-gpt-4.1","vercel_ai_gateway/openai/gpt-4.1"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-4-1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2.4,"min_output_per_1m":8,"max_output_per_1m":9.6,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","replicate","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o3-mini","name":"o3-mini","display_name":"o3 Mini","description":"A small, cost-efficient reasoning model optimized for STEM tasks, supporting structured outputs and function calling at o1-mini cost and latency targets.","creator":"openai","family":"o","tier":"mini","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":100000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-10","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-01-31","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure/eu/o3-mini-2025-01-31","azure/o3-mini","azure/o3-mini-2025-01-31","azure/us/o3-mini-2025-01-31","gradient_ai/openai-o3-mini","o3-mini","o3-mini-2025-01-31","openai-o3-mini","openai/o3-mini","openrouter/openai/o3-mini","vercel_ai_gateway/openai/o3-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o3-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.1,"max_input_per_1m":1.1,"min_output_per_1m":4.4,"max_output_per_1m":4.4,"min_cache_read_per_1m":0.55,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","gradient_ai","openai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o1-pro","name":"o1-pro","display_name":"o1 Pro","description":"A high-compute variant of the o1 reasoning series that uses additional inference compute to think harder and deliver more consistently accurate answers on difficult problems.","creator":"openai","family":"o","tier":"pro","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":100000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-10","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-03-19","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["o1-pro","o1-pro-2025-03-19","openai-o1-pro","openai/o1-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o1-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":150,"max_input_per_1m":150,"min_output_per_1m":600,"max_output_per_1m":600,"min_cache_read_per_1m":75,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o1-preview","name":"o1-preview","display_name":"o1 Preview","description":"A research preview of the o1 reasoning series, trained with reinforcement learning to think through complex problems via an internal chain of thought before responding.","creator":"openai","family":"o","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["pdf","text"],"output":["text"]},"context_window":128000,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-10","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["azure/eu/o1-preview-2024-09-12","azure/o1-preview","azure/o1-preview-2024-09-12","azure/us/o1-preview-2024-09-12","o1-preview","openai-o1-preview"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o1-preview","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":15,"max_input_per_1m":15,"min_output_per_1m":60,"max_output_per_1m":60,"min_cache_read_per_1m":7.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-4-1-mini","name":"gpt-4-1-mini","display_name":"GPT-4.1 Mini","description":"A compact tier of GPT-4.1 that excels at instruction following and tool calling with a 1M-token context window and reduced cost.","creator":"openai","family":"gpt","tier":"mini","version":"4-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1047576,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-14","earliest_deprecation_date":"2026-11-04","deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure/gpt-4.1-mini","azure/gpt-4.1-mini-2025-04-14","azure/us/gpt-4.1-mini-2025-04-14","ft:gpt-4.1-mini-2025-04-14","gpt-4-1-mini","gpt-4.1-mini","gpt-4.1-mini-2025-04-14","openai-gpt-4-1-mini","openai/gpt-4.1-mini","openrouter/openai/gpt-4.1-mini","replicate/openai/gpt-4.1-mini","vercel_ai_gateway/openai/gpt-4.1-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-4-1-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.4,"max_input_per_1m":0.4,"min_output_per_1m":1.6,"max_output_per_1m":1.6,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","replicate","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-large-3","name":"mistral-large-3","display_name":"Mistral Large 3","description":"Mistral AI's third-generation flagship model, a multimodal Mixture-of-Experts architecture with 675B total parameters and 41B active parameters.","creator":"mistral","family":"mistral3","tier":"","version":"3","type":"language","size_in_bn":null,"modalities":{"input":["image"],"output":["text"]},"context_window":262144,"max_output_tokens":8191,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-12-02","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/mistral-large-3-fp8","azure_ai/mistral-large-3","fireworks_ai/accounts/fireworks/models/mistral-large-3-fp8","mistral-large-3","mistral/mistral-large-3"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-large-3","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":1.2,"min_output_per_1m":1.2,"max_output_per_1m":1.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","mistral","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3-324","name":"deepseek-v3-324","display_name":"DeepSeek V3 324","description":"The March 2024 update of DeepSeek V3 (V3-0324), a 671B MoE LLM representing an improved iteration over the original V3 release.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.0","type":"language","size_in_bn":684.531,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":13,"ids":["accounts/fireworks/models/deepseek-v3-0324","azure_ai/deepseek-v3-0324","baseten/deepseek-ai/DeepSeek-V3-0324","crusoe/deepseek-ai/DeepSeek-V3-0324","deepinfra/deepseek-ai/DeepSeek-V3-0324","deepseek-ai/DeepSeek-V3-0324","deepseek-v3-0324","deepseek-v3-324","deepseek/deepseek-v3-0324","fireworks_ai/accounts/fireworks/models/deepseek-v3-0324","gmi/deepseek-ai/DeepSeek-V3-0324","hyperbolic/deepseek-ai/DeepSeek-V3-0324","lambda_ai/deepseek-v3-0324","nebius/deepseek-ai/DeepSeek-V3-0324","novita/deepseek/deepseek-v3-0324","sambanova/DeepSeek-V3-0324","wandb/deepseek-ai/DeepSeek-V3-0324"],"hf_likes":3101,"hf_downloads":617973,"hf_downloads_all_time":4563386,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3-324","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":114,"min_output_per_1m":0.4,"max_output_per_1m":275,"min_cache_read_per_1m":0.135,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["lambda"],"provider_count":13},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-o1-mini","name":"o1-mini","display_name":"o1 Mini","description":"A faster and more affordable variant of the o1 reasoning model, optimized for STEM tasks while maintaining strong chain-of-thought reasoning capabilities.","creator":"openai","family":"o","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-10","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":false,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["azure/eu/o1-mini-2024-09-12","azure/o1-mini","azure/o1-mini-2024-09-12","azure/us/o1-mini-2024-09-12","o1-mini","openai-o1-mini","replicate/openai/o1-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-o1-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.1,"max_input_per_1m":1.1,"min_output_per_1m":4.4,"max_output_per_1m":4.4,"min_cache_read_per_1m":0.55,"min_cache_write_per_1m":null,"min_reasoning_per_1m":4.4,"cheapest_providers":["azure_aifoundry","openai","replicate"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-4-5","name":"gpt-4-5","display_name":"GPT-4.5","description":"OpenAI's GPT-4.5 model, a high-capability LLM positioned between GPT-4 and GPT-5 for advanced reasoning and instruction-following tasks.","creator":"openai","family":"gpt","tier":"","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["gpt-4-5","openai-gpt-4-5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-4-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":75,"max_input_per_1m":75,"min_output_per_1m":150,"max_output_per_1m":150,"min_cache_read_per_1m":37.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1","name":"r1","display_name":"DeepSeek R1","description":"DeepSeek's flagship reasoning-focused LLM with strong performance in mathematics, coding, and logical inference, comparable to leading closed-source models.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":684.531,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-01-20","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":14,"ids":["accounts/fireworks/models/deepseek-r1","azure_ai/deepseek-r1","deepinfra/deepseek-ai/DeepSeek-R1","deepseek-llm-r1","deepseek-r1","deepseek-r1-0120","deepseek-r1-qwen3-8b","deepseek-r1685","deepseek-reasoner","deepseek.r1-v1:0","deepseek/deepseek-r1","deepseek/deepseek-reasoner","fireworks_ai/accounts/fireworks/models/deepseek-r1","hyperbolic/deepseek-ai/DeepSeek-R1","nebius/deepseek-ai/DeepSeek-R1","openrouter/deepseek/deepseek-r1","replicate/deepseek-ai/deepseek-r1","sambanova/DeepSeek-R1","snowflake/deepseek-r1","together_ai/deepseek-ai/DeepSeek-R1","us.deepseek.r1-v1:0","vercel_ai_gateway/deepseek/deepseek-r1"],"hf_likes":13288,"hf_downloads":4020320,"hf_downloads_all_time":20204112,"hf_trending_score":20,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.28,"max_input_per_1m":5,"min_output_per_1m":0.4,"max_output_per_1m":10,"min_cache_read_per_1m":0.028,"min_cache_write_per_1m":null,"min_reasoning_per_1m":10,"cheapest_providers":["deepseek"],"provider_count":14},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-405b-instruct","name":"llama-3-1-405b-instruct","display_name":"Llama 3.1 405B Instruct","description":"Meta's 405B instruction-tuned LLM optimized for following complex instructions, with FP8 quantization for efficient large-scale inference.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":405,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":"2026-07","deprecated":false,"has_pricing":true,"provider_count":11,"ids":["accounts/fireworks/models/llama-v3p1-405b-instruct","azure_ai/Meta-Llama-3.1-405B-Instruct","databricks/databricks-meta-llama-3-1-405b-instruct","fireworks_ai/accounts/fireworks/models/llama-v3p1-405b-instruct","hyperbolic/meta-llama/Meta-Llama-3.1-405B-Instruct","lambda_ai/llama3.1-405b-instruct-fp8","llama-3-1-instruct-405b","meta-llama-3-1-405b-instruct","meta-textgeneration-llama-3-1-405b-instruct-fp8","meta.llama3-1-405b-instruct-v1:0","nebius/meta-llama/Meta-Llama-3.1-405B-Instruct","oci/meta.llama-3.1-405b-instruct","sambanova/Meta-Llama-3.1-405B-Instruct","together_ai/meta-llama/Meta-Llama-3.1-405B-Instruct-Turbo","us.meta.llama3-1-405b-instruct-v1:0","vertex_ai/meta/llama-3.1-405b-instruct-maas"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-405b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":10.68,"min_output_per_1m":0.3,"max_output_per_1m":16,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["hyperbolic"],"provider_count":11},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-v3","name":"v3","display_name":"DeepSeek V3","description":"DeepSeek's third-generation MoE LLM with 671B total parameters (37B activated per token), excelling at coding, reasoning, and tool use.","creator":"deepseek","family":"deepseek-v3","tier":"","version":"3.0","type":"language","size_in_bn":684.531,"modalities":{"input":["image","text"],"output":["text"]},"context_window":163840,"max_output_tokens":81920,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-12-26","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":11,"ids":["accounts/fireworks/models/deepseek-v3","azure_ai/deepseek-v3","deepinfra/deepseek-ai/DeepSeek-V3","deepseek-ai/DeepSeek-V3","deepseek-chat","deepseek-v3","deepseek.v3-v1:0","deepseek/deepseek_v3","deepseek/deepseek-chat","deepseek/deepseek-v3","fireworks_ai/accounts/fireworks/models/deepseek-v3","hyperbolic/deepseek-ai/DeepSeek-V3","nebius/deepseek-ai/DeepSeek-V3","openrouter/deepseek/deepseek-chat","replicate/deepseek-ai/deepseek-v3","together_ai/deepseek-ai/DeepSeek-V3","vercel_ai_gateway/deepseek/deepseek-v3"],"hf_likes":4056,"hf_downloads":882009,"hf_downloads_all_time":15156328,"hf_trending_score":4,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-v3","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":1.45,"min_output_per_1m":0.2,"max_output_per_1m":4.56,"min_cache_read_per_1m":0.028,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["hyperbolic"],"provider_count":11},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-3-70b-instruct","name":"llama-3-3-70b-instruct","display_name":"Llama 3.3 70B Instruct","description":"Meta's 70B instruction-tuned LLM from Llama 3.3, optimized for complex instruction-following and deployed across multiple cloud regions.","creator":"meta","family":"llama","tier":"","version":"3-3","type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":120000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-12","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-12-06","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":20,"ids":["accounts/fireworks/models/llama-v3p3-70b-instruct","azure_ai/Llama-3.3-70B-Instruct","crusoe/meta-llama/Llama-3.3-70B-Instruct","databricks/databricks-meta-llama-3-3-70b-instruct","deepinfra/meta-llama/Llama-3.3-70B-Instruct","fireworks_ai/accounts/fireworks/models/llama-v3p3-70b-instruct","gradient_ai/llama3.3-70b-instruct","groq/llama-3.3-70b-versatile","hyperbolic/meta-llama/Llama-3.3-70B-Instruct","lambda_ai/llama3.3-70b-instruct-fp8","llama-3-3-instruct-70b","llama-3.3-70b-instruct-maas","meta_llama/Llama-3.3-70B-Instruct","meta-llama-3-3-70b-instruct","meta-llama/llama-3.3-70b-instruct","meta-llama/llama-3.3-70b-instruct:free","meta-textgeneration-llama-3-3-70b-instruct","meta.llama3-3-70b-instruct-v1:0","meta.llama3-3-70b-instruct-v1:0:128k","nebius/meta-llama/Llama-3.3-70B-Instruct","novita/meta-llama/llama-3.3-70b-instruct","nscale/meta-llama/Llama-3.3-70B-Instruct","oci/meta.llama-3.3-70b-instruct","oci/meta.llama-3.3-70b-instruct-fp8-dynamic","ovhcloud/Meta-Llama-3_3-70B-Instruct","publishers/google/models/llama-3.3-70b-instruct-maas","publishers/meta/models/llama-3.3-70b-instruct-maas","sambanova/Meta-Llama-3.3-70B-Instruct","together_ai/meta-llama/Llama-3.3-70B-Instruct-Turbo-Free","us.meta.llama3-3-70b-instruct-v1:0","wandb/meta-llama/Llama-3.3-70B-Instruct","watsonx/meta-llama/llama-3-3-70b-instruct"],"hf_likes":2731,"hf_downloads":496024,"hf_downloads_all_time":10779619,"hf_trending_score":1.5,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-3-70b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":71,"min_output_per_1m":0.2,"max_output_per_1m":71,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":20},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-4-turbo","name":"gpt-4-turbo","display_name":"GPT-4 Turbo","description":"OpenAI's cost-optimized successor to GPT-4, offering improved performance and lower pricing for high-intelligence chat and tool-use tasks.","creator":"openai","family":"gpt","tier":"","version":"4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":128000,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-12","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-01-25","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["azure/gpt-4-turbo","azure/gpt-4-turbo-2024-04-09","gpt-4-turbo","gpt-4-turbo-2024-04-09","gpt-4-turbo-preview","openai-gpt-4-turbo","openai/gpt-4-turbo","openai/gpt-4-turbo-preview","vercel_ai_gateway/openai/gpt-4-turbo"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-4-turbo","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":10,"max_input_per_1m":10,"min_output_per_1m":30,"max_output_per_1m":30,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"cohere-command-a","name":"cohere-command-a","display_name":"Command A","description":"A highly efficient generative LLM from Cohere excelling at agentic workflows, tool use, and multilingual enterprise tasks.","creator":"cohere","family":"command","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":256000,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-08-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-03-13","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["cohere-command-a","cohere-command-a-a100","cohere-command-a-h100","cohere/command-a","command-a","command-a-03-2025","oci/cohere.command-a-03-2025","vercel_ai_gateway/cohere/command-a"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"cohere-command-a","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.56,"max_input_per_1m":2.5,"min_output_per_1m":1.56,"max_output_per_1m":10,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["oracle_oci"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-4-1-nano","name":"gpt-4-1-nano","display_name":"GPT-4.1 Nano","description":"The smallest tier of GPT-4.1, optimized for ultra-low latency instruction following and tool calling with a 1M-token context window.","creator":"openai","family":"gpt","tier":"nano","version":"4-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1047576,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-14","earliest_deprecation_date":"2026-11-04","deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure/gpt-4.1-nano","azure/gpt-4.1-nano-2025-04-14","azure/us/gpt-4.1-nano-2025-04-14","ft:gpt-4.1-nano-2025-04-14","gpt-4-1-nano","gpt-4.1-nano","gpt-4.1-nano-2025-04-14","openai-gpt-4-1-nano","openai/gpt-4.1-nano","openrouter/openai/gpt-4.1-nano","replicate/openai/gpt-4.1-nano","vercel_ai_gateway/openai/gpt-4.1-nano"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-4-1-nano","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":0.1,"min_output_per_1m":0.4,"max_output_per_1m":0.4,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","replicate","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-4o-mini","name":"gpt-4o-mini","display_name":"GPT-4o mini","description":"A fast, cost-efficient small LLM in the GPT-4o family that accepts text and image inputs, ideal for focused tasks and fine-tuning.","creator":"openai","family":"gpt","tier":"mini","version":"4o","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-10","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-07-18","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/eu/gpt-4o-mini-2024-07-18","azure/global-standard/gpt-4o-mini","azure/gpt-4o-mini","azure/gpt-4o-mini-2024-07-18","azure/us/gpt-4o-mini-2024-07-18","ft:gpt-4o-mini-2024-07-18","github_copilot/gpt-4o-mini","github_copilot/gpt-4o-mini-2024-07-18","gmi/openai/gpt-4o-mini","gpt-4o-mini","gpt-4o-mini-2024-07-18","gpt-4o-mini-realtime-dec-2024","gradient_ai/openai-gpt-4o-mini","openai-gpt-4o-mini","openai/gpt-4o-mini","openai/gpt-4o-mini-2024-07-18","replicate/openai/gpt-4o-mini","vercel_ai_gateway/openai/gpt-4o-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-4o-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":0.15,"min_output_per_1m":0.6,"max_output_per_1m":0.6,"min_cache_read_per_1m":0.075,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","gmi","openai","openrouter","replicate","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-70b-instruct","name":"llama-3-1-70b-instruct","display_name":"Llama 3.1 70B Instruct","description":"Meta's 70B instruction-tuned LLM with strong tool-use and multilingual capabilities, widely deployed across cloud regions for enterprise workloads.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":70,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-12-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":13,"ids":["accounts/fireworks/models/llama-v3p1-70b-instruct","accounts/fireworks/models/llama-v3p1-70b-instruct-1b","azure_ai/Meta-Llama-3.1-70B-Instruct","deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct","deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","fireworks_ai/accounts/fireworks/models/llama-v3p1-70b-instruct","fireworks_ai/accounts/fireworks/models/llama-v3p1-70b-instruct-1b","friendliai/meta-llama-3.1-70b-instruct","hyperbolic/meta-llama/Meta-Llama-3.1-70B-Instruct","lambda_ai/llama3.1-70b-instruct-fp8","llama-3-1-instruct-70b","meta-llama-3-1-70b-instruct","meta-llama/llama-3.1-70b-instruct","meta-llama/Meta-Llama-3.1-70B-Instruct","meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","meta-textgeneration-llama-3-1-70b-instruct","meta-textgenerationneuron-llama-3-1-70b-instruct","meta.llama3-1-70b-instruct-v1:0","meta.llama3-1-70b-instruct-v1:0:128k","nebius/meta-llama/Meta-Llama-3.1-70B-Instruct","oci/meta.llama-3.1-70b-instruct","ovhcloud/Meta-Llama-3_1-70B-Instruct","perplexity/llama-3.1-70b-instruct","together_ai/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","us.meta.llama3-1-70b-instruct-v1:0","vertex_ai/meta/llama-3.1-70b-instruct-maas"],"hf_likes":907,"hf_downloads":737459,"hf_downloads_all_time":20735812,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-70b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":2.68,"min_output_per_1m":0.3,"max_output_per_1m":3.54,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["hyperbolic","lambda"],"provider_count":13},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-8b-instruct","name":"llama-3-1-8b-instruct","display_name":"Llama 3.1 8B Instruct","description":"Meta's 8B instruction-tuned LLM optimized for fast, cost-effective deployment across multiple cloud regions with strong instruction-following performance.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":8,"modalities":{"input":["image","text"],"output":["text"]},"context_window":200000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-12-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":21,"ids":["@cf/meta/llama-3.1-8b-instruct","accounts/fireworks/models/full-llama-v3p1-8b-instruct-8b-fp8","accounts/fireworks/models/full-llama-v3p1-8b-instruct-8b-fp8-amd","accounts/fireworks/models/llama-v3p1-8b-instruct","azure_ai/Meta-Llama-3.1-8B-Instruct","databricks/databricks-meta-llama-3-1-8b-instruct","deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct","deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","fireworks_ai/accounts/fireworks/models/llama-v3p1-8b-instruct","friendliai/meta-llama-3.1-8b-instruct","groq/llama-3.1-8b-instant","hyperbolic/meta-llama/Meta-Llama-3.1-8B-Instruct","lambda_ai/llama3.1-8b-instruct","llama-3-1-instruct-8b","meta-llama-3-1-8b-instruct","meta-llama/llama-3.1-8b-instruct","meta-llama/Meta-Llama-3.1-8B-Instruct","meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","meta-textgeneration-llama-3-1-8b-instruct","meta-textgenerationneuron-llama-3-1-8b-instruct","meta.llama3-1-8b-instruct-v1:0","meta.llama3-1-8b-instruct-v1:0:128k","nebius/meta-llama/Meta-Llama-3.1-8B-Instruct","novita/meta-llama/llama-3.1-8b-instruct","nscale/meta-llama/Llama-3.1-8B-Instruct","oci/meta.llama-3.1-8b-instruct","ovhcloud/Llama-3.1-8B-Instruct","perplexity/llama-3.1-8b-instruct","sambanova/Meta-Llama-3.1-8B-Instruct","together_ai/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","us.meta.llama3-1-8b-instruct-v1:0","vertex_ai/meta/llama-3.1-8b-instruct-maas","wandb/meta-llama/Llama-3.1-8B-Instruct"],"hf_likes":5731,"hf_downloads":9306502,"hf_downloads_all_time":140394735,"hf_trending_score":24,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-8b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.02,"max_input_per_1m":22,"min_output_per_1m":0.03,"max_output_per_1m":22,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","nebius","novita","openrouter"],"provider_count":21},"providers":[],"regions":[],"region_info":{}}}],"pagination":{"page_size":50,"has_next":true,"next_token":"NTA","total_count":191},"meta":{"updated_at":"2026-06-13","request_id":"989ef299-994b-4a00-9c87-5740551d15c2","execution_ms":18}}