{"data":[{"id":"anthropic-claude-5-fable","name":"claude-5-fable","display_name":"Claude Fable 5","description":"A highly capable Claude LLM optimized for demanding reasoning and long-horizon agentic tasks, with vision, tool-use, and explicit-caching support.","creator":"anthropic","family":"claude","tier":"fable","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-06-09","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["anthropic-claude-5-fable","anthropic.claude-fable-5","anthropic/claude-fable-5","au.anthropic.claude-fable-5","azure_ai/claude-fable-5","claude-fable-5","eu.anthropic.claude-fable-5","global.anthropic.claude-fable-5","publishers/anthropic/models/claude-fable-5","publishers/google/models/claude-fable-5","us.anthropic.claude-fable-5","vertex_ai/claude-fable-5","vertex_ai/claude-fable-5@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-5-fable","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":10,"max_input_per_1m":12,"min_output_per_1m":50,"max_output_per_1m":60,"min_cache_read_per_1m":1,"min_cache_write_per_1m":12.5,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-8-opus","name":"claude-4-8-opus","display_name":"Claude Opus 4.8","description":"A flagship Anthropic LLM in the Claude Opus tier at version 4.8, supporting adaptive reasoning, vision, tool use, file input, and web search across multiple geographic regions.","creator":"anthropic","family":"claude","tier":"opus","version":"4-8","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-05-28","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-8-opus","anthropic.claude-opus-4-8","anthropic/claude-opus-4-8","anthropic/claude-opus-4.8","au.anthropic.claude-opus-4-8","azure_ai/claude-opus-4-8","claude-opus-4-8","eu.anthropic.claude-opus-4-8","global.anthropic.claude-opus-4-8","jp.anthropic.claude-opus-4-8","publishers/anthropic/models/claude-opus-4-8","publishers/google/models/claude-opus-4-8","us.anthropic.claude-opus-4-8","vertex_ai/claude-opus-4-8","vertex_ai/claude-opus-4-8@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-8-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-5","name":"gpt-5-5","display_name":"GPT-5.5","description":"A GPT-5 series large language model from OpenAI targeting high-capability reasoning and generation tasks at the xhigh performance tier.","creator":"openai","family":"gpt","tier":"","version":"5-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-12","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-5.5","azure/gpt-5.5-2026-04-23","bedrock_mantle/openai.gpt-5.5","gpt-5-5","gpt-5-5-high","gpt-5-5-instant-05-26","gpt-5-5-low","gpt-5-5-medium","gpt-5-5-non-reasoning","gpt-5.5","gpt-5.5-2026-04-23","openai-gpt-5-5","openai/gpt-5.5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":30,"max_output_per_1m":36,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-7-opus","name":"claude-4-7-opus","display_name":"Claude Opus 4.7","description":"Anthropic's Claude 4.7 Opus model with adaptive reasoning at maximum effort, vision, and tool-use for complex enterprise tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-7","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2026-01","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal","xhigh"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-04-16","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-7-opus","anthropic.claude-opus-4-7","anthropic/claude-opus-4-7","anthropic/claude-opus-4.7","au.anthropic.claude-opus-4-7","azure_ai/claude-opus-4-7","claude-opus-4-7","claude-opus-4-7-20260416","claude-opus-4-7-non-reasoning","eu.anthropic.claude-opus-4-7","global.anthropic.claude-opus-4-7","jp.anthropic.claude-opus-4-7","openrouter/anthropic/claude-opus-4.7","perplexity/anthropic/claude-opus-4-7","publishers/anthropic/models/claude-opus-4-7","publishers/google/models/claude-opus-4-7","us.anthropic.claude-opus-4-7","vertex_ai/claude-opus-4-7","vertex_ai/claude-opus-4-7@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-7-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4","name":"gpt-5-4","display_name":"GPT-5.4","description":"OpenAI's frontier reasoning model for complex professional work, supporting vision, file input, tool use, and configurable reasoning effort from none to xhigh.","creator":"openai","family":"gpt","tier":"","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure_ai/gpt-5.4","azure_ai/gpt-5.4-2026-03-05","azure/gpt-5.4","azure/gpt-5.4-2026-03-05","bedrock_mantle/openai.gpt-5.4","chatgpt/gpt-5.4","gpt-5-4","gpt-5-4-low","gpt-5-4-non-reasoning","gpt-5.4","gpt-5.4-2026-03-05","openai-gpt-5-4","openai/gpt-5.4"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.5,"max_input_per_1m":3,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.25,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-5-flash","name":"gemini-3-5-flash","display_name":"Gemini 3.5 Flash","description":"A fast, efficient Gemini 3.5 model optimized for high-throughput tasks with support for reasoning, vision, tool use, and web search.","creator":"google","family":"gemini","tier":"flash","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-05-19","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["gemini-3-5-flash","gemini-3-5-flash-medium","gemini-3-5-flash-minimal","gemini-3.5-flash","gemini/gemini-3.5-flash","google-gemini-3-5-flash","google/gemini-3.5-flash","publishers/google/models/gemini-3.5-flash","vertex_ai/gemini-3.5-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-5-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.5,"max_input_per_1m":1.8,"min_output_per_1m":9,"max_output_per_1m":10.8,"min_cache_read_per_1m":0.15,"min_cache_write_per_1m":0.0833333333,"min_reasoning_per_1m":9,"cheapest_providers":["google_gemini","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"xai-grok-4-3","name":"grok-4-3","display_name":"Grok 4.3","description":"A multimodal reasoning LLM from xAI that accepts text and image inputs, designed for agentic workflows, instruction-following, and tool-use tasks requiring high factual accuracy.","creator":"xai","family":"grok","tier":"","version":"4-3","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Grok","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-04-30","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["grok-4-3","grok-4-3-low","grok-4-3-medium","grok-4-3-non-reasoning","grok-4.3","publishers/google/models/grok-4.3","x-ai/grok-4.3","xai-grok-4-3","xai/grok-4.3","xai/grok-4.3-latest"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"xai-grok-4-3","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":1.5,"min_output_per_1m":2.5,"max_output_per_1m":3,"min_cache_read_per_1m":0.2,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","vercel_ai_gateway","xai"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-2","name":"gpt-5-2","display_name":"GPT-5.2","description":"A frontier GPT-5 generation LLM for complex professional work with configurable reasoning effort, available via the Responses API.","creator":"openai","family":"gpt","tier":"","version":"5-2","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-12-11","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-5.2","azure/gpt-5.2-2025-12-11","chatgpt/gpt-5.2","github_copilot/gpt-5.2","gmi/openai/gpt-5.2","gpt-5-2","gpt-5-2-medium","gpt-5-2-non-reasoning","gpt-5.2","gpt-5.2-2025-12-11","openai-gpt-5-2","openai/gpt-5.2","openrouter/openai/gpt-5.2","perplexity/openai/gpt-5.2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.75,"max_input_per_1m":2.1,"min_output_per_1m":14,"max_output_per_1m":16.8,"min_cache_read_per_1m":0.175,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","gmi","openai","openrouter","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4-mini","name":"gpt-5-4-mini","display_name":"GPT-5.4 Mini","description":"A faster, cost-efficient variant of GPT-5.4 designed for high-volume workloads while retaining strong reasoning, vision, and tool-use capabilities.","creator":"openai","family":"gpt","tier":"mini","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure_ai/gpt-5.4-mini","azure_ai/gpt-5.4-mini-2026-03-17","azure/gpt-5.4-mini","azure/gpt-5.4-mini-2026-03-17","gpt-5-4-mini","gpt-5-4-mini-medium","gpt-5-4-mini-non-reasoning","gpt-5.4-mini","gpt-5.4-mini-2026-03-17","openai-gpt-5-4-mini","openai/gpt-5.4-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.75,"max_input_per_1m":0.9,"min_output_per_1m":4.5,"max_output_per_1m":5.4,"min_cache_read_per_1m":0.075,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"xai-grok-4-20","name":"grok-4-20","display_name":"Grok 4.20","description":"xAI's flagship LLM combining industry-leading speed, agentic tool calling, and low hallucination rates for enterprise and research applications.","creator":"xai","family":"grok","tier":"","version":"4-20","type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":2000000,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-09-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Grok","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-31","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["grok-4-20","grok-4-20-0309","oci/xai.grok-4.20","x-ai/grok-4.20","xai-grok-4-20"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"xai-grok-4-20","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.25,"max_input_per_1m":3,"min_output_per_1m":2.5,"max_output_per_1m":15,"min_cache_read_per_1m":0.2,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","xai"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-1","name":"gpt-5-1","display_name":"GPT-5.1","description":"OpenAI's flagship LLM for coding and agentic tasks with configurable reasoning effort levels, available via the Responses API.","creator":"openai","family":"gpt","tier":"","version":"5-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal","none"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-13","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/eu/gpt-5.1","azure/global/gpt-5.1","azure/gpt-5.1","azure/gpt-5.1-2025-11-13","azure/us/gpt-5.1","databricks/databricks-gpt-5-1","github_copilot/gpt-5.1","gmi/openai/gpt-5.1","gpt-5-1","gpt-5-1-non-reasoning","gpt-5.1","gpt-5.1-2025-11-13","openai-gpt-5-1","openai/gpt-5.1","perplexity/openai/gpt-5.1"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.24999,"max_input_per_1m":1.5,"min_output_per_1m":9.99999,"max_output_per_1m":12,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-opus","name":"claude-4-6-opus","display_name":"Claude Opus 4.6","description":"Anthropic's high-capability Claude 4.6 Opus model with advanced reasoning, vision, and tool-use for demanding workloads.","creator":"anthropic","family":"claude","tier":"opus","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-05","earliest_deprecation_date":"2026-06-29","deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-opus","anthropic.claude-opus-4-6-v1","anthropic/claude-opus-4.6","anthropic/claude-opus-4.6-fast","au.anthropic.claude-opus-4-6-v1","azure_ai/claude-opus-4-6","claude-opus-4-6","claude-opus-4-6-20260205","claude-opus-4-6-adaptive","eu.anthropic.claude-opus-4-6-v1","github_copilot/claude-opus-4.6-fast","global.anthropic.claude-opus-4-6-v1","openrouter/anthropic/claude-opus-4.6","perplexity/anthropic/claude-opus-4-6","publishers/anthropic/models/claude-opus-4-6","publishers/google/models/claude-opus-4-6","us.anthropic.claude-opus-4-6-v1","vercel_ai_gateway/anthropic/claude-opus-4.6","vertex_ai/claude-opus-4-6","vertex_ai/claude-opus-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":30,"min_output_per_1m":25,"max_output_per_1m":150,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5","name":"gpt-5","display_name":"GPT-5","description":"OpenAI's frontier LLM with integrated reasoning, vision, image generation, and tool-use capabilities designed for complex coding and agentic tasks.","creator":"openai","family":"gpt","tier":"","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-09","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["azure/eu/gpt-5-2025-08-07","azure/gpt-5","azure/gpt-5-2025-08-07","azure/us/gpt-5-2025-08-07","databricks/databricks-gpt-5","github_copilot/gpt-5","gmi/openai/gpt-5","gpt-5","gpt-5-2025-08-07","gpt-5-chatgpt","gpt-5-low","gpt-5-medium","gpt-5-minimal","oci/openai.gpt-5","openai-gpt-5","openai/gpt-5","openrouter/openai/gpt-5","replicate/openai/gpt-5","snowflake/openai-gpt-5"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.24999,"max_input_per_1m":1.5,"min_output_per_1m":9.99999,"max_output_per_1m":12,"min_cache_read_per_1m":0.125,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-6-sonnet","name":"claude-4-6-sonnet","display_name":"Claude Sonnet 4.6","description":"A capable Claude 4.6 Sonnet model with reasoning, vision, and tool-use support for a wide range of applications.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-6","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":"2026-01","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":true},"release_date":"2026-02-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-4-6-sonnet","anthropic.claude-sonnet-4-6","anthropic/claude-sonnet-4-6","anthropic/claude-sonnet-4.6","au.anthropic.claude-sonnet-4-6","azure_ai/claude-sonnet-4-6","claude-sonnet-4-6","claude-sonnet-4-6-adaptive","claude-sonnet-4-6-non-reasoning-low-effort","eu.anthropic.claude-sonnet-4-6","global.anthropic.claude-sonnet-4-6","jp.anthropic.claude-sonnet-4-6","openrouter/anthropic/claude-sonnet-4.6","publishers/anthropic/models/claude-sonnet-4-6","publishers/google/models/claude-sonnet-4-6","snowflake/claude-sonnet-4-6","us.anthropic.claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6","vertex_ai/claude-sonnet-4-6@default"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-6-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":3,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-4-nano","name":"gpt-5-4-nano","display_name":"GPT-5.4 Nano","description":"The smallest and fastest GPT-5.4 tier, optimized for speed- and cost-sensitive tasks such as classification, data extraction, ranking, and sub-agent orchestration.","creator":"openai","family":"gpt","tier":"nano","version":"5-4","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1050000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-08","training_data_cutoff":null,"supported_reasoning_efforts":["default","none","xhigh"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-03-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["azure_ai/gpt-5.4-nano","azure_ai/gpt-5.4-nano-2026-03-17","azure/gpt-5.4-nano","azure/gpt-5.4-nano-2026-03-17","gpt-5-4-nano","gpt-5-4-nano-medium","gpt-5-4-nano-non-reasoning","gpt-5.4-nano","gpt-5.4-nano-2026-03-17","openai-gpt-5-4-nano","openai/gpt-5.4-nano"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-4-nano","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.2,"max_input_per_1m":0.24,"min_output_per_1m":1.25,"max_output_per_1m":1.5,"min_cache_read_per_1m":0.02,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-opus","name":"claude-4-5-opus","display_name":"Claude Opus 4.5","description":"Anthropic's flagship Claude 4.5 model with top-tier reasoning, vision, and tool-use capabilities for complex tasks.","creator":"anthropic","family":"claude","tier":"opus","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":409600,"max_output_tokens":64000,"tool_use_system_prompt_tokens":159,"output_vector_sizes":[],"knowledge_cutoff":"2025-05","training_data_cutoff":"2025-08","supported_reasoning_efforts":["default","minimal"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-11-24","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["anthropic-claude-4-5-opus","anthropic.claude-opus-4-5-20251101-v1:0","anthropic/claude-opus-4.5","azure_ai/claude-opus-4-5","claude-opus-4-5","claude-opus-4-5-20251101","claude-opus-4-5-thinking","claude-opus-4-5@20251101","databricks/databricks-claude-opus-4-5","eu.anthropic.claude-opus-4-5-20251101-v1:0","github_copilot/claude-opus-4.5","global.anthropic.claude-opus-4-5-20251101-v1:0","gmi/anthropic/claude-opus-4.5","openrouter/anthropic/claude-opus-4.5","perplexity/anthropic/claude-opus-4-5","publishers/anthropic/models/claude-opus-4-5","publishers/google/models/claude-opus-4-5","us.anthropic.claude-opus-4-5-20251101-v1:0","vercel_ai_gateway/anthropic/claude-opus-4.5","vertex_ai/claude-opus-4-5","vertex_ai/claude-opus-4-5@20251101"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-opus","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":5,"max_input_per_1m":6,"min_output_per_1m":25,"max_output_per_1m":30,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":6.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","gmi","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-mini","name":"gpt-5-mini","display_name":"GPT-5 Mini","description":"A faster, cost-efficient variant of GPT-5 suited for well-defined tasks and high-volume, low-latency workloads with vision and tool-use support.","creator":"openai","family":"gpt","tier":"mini","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-05","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["azure/eu/gpt-5-mini-2025-08-07","azure/gpt-5-mini","azure/gpt-5-mini-2025-08-07","azure/us/gpt-5-mini-2025-08-07","databricks/databricks-gpt-5-mini","github_copilot/gpt-5-mini","gpt-5-mini","gpt-5-mini-2025-08-07","gpt-5-mini-medium","gpt-5-mini-minimal","oci/openai.gpt-5-mini","openai-gpt-5-mini","openai/gpt-5-mini","openrouter/openai/gpt-5-mini","perplexity/openai/gpt-5-mini","replicate/openai/gpt-5-mini","snowflake/openai-gpt-5-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-mini","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.24997,"max_input_per_1m":0.3,"min_output_per_1m":1.99997,"max_output_per_1m":2.4,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-sonnet","name":"claude-4-5-sonnet","display_name":"Claude Sonnet 4.5","description":"A versatile Claude 4.5 model with strong reasoning, vision, and tool-use capabilities suited for a broad range of tasks.","creator":"anthropic","family":"claude","tier":"sonnet","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":64000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":"2025-07","supported_reasoning_efforts":["default"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-09-29","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":10,"ids":["anthropic-claude-4-5-sonnet","anthropic.claude-sonnet-4-5-20250929-v1:0","anthropic/claude-sonnet-4.5","au.anthropic.claude-sonnet-4-5-20250929-v1:0","azure_ai/claude-sonnet-4-5","bedrock/us-gov-east-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-east-1/claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/anthropic.claude-sonnet-4-5-20250929-v1:0","bedrock/us-gov-west-1/claude-sonnet-4-5-20250929-v1:0","claude-4-5-sonnet","claude-4-5-sonnet-thinking","claude-sonnet-4-5","claude-sonnet-4-5-20250929","claude-sonnet-4-5-20250929-v1:0","claude-sonnet-4-5@20250929","databricks/databricks-claude-sonnet-4-5","eu.anthropic.claude-sonnet-4-5-20250929-v1:0","github_copilot/claude-sonnet-4.5","global.anthropic.claude-sonnet-4-5-20250929-v1:0","gmi/anthropic/claude-sonnet-4.5","jp.anthropic.claude-sonnet-4-5-20250929-v1:0","openrouter/anthropic/claude-sonnet-4.5","perplexity/anthropic/claude-sonnet-4-5","publishers/anthropic/models/claude-sonnet-4-5","publishers/google/models/claude-sonnet-4-5","replicate/anthropic/claude-4.5-sonnet","snowflake/claude-sonnet-4-5","us-gov.anthropic.claude-sonnet-4-5-20250929-v1:0","us.anthropic.claude-sonnet-4-5-20250929-v1:0","vercel_ai_gateway/anthropic/claude-sonnet-4.5","vertex_ai/claude-sonnet-4-5","vertex_ai/claude-sonnet-4-5@20250929"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.99999,"max_input_per_1m":3.6,"min_output_per_1m":15,"max_output_per_1m":18,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":10},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-4-5-haiku","name":"claude-4-5-haiku","display_name":"Claude Haiku 4.5","description":"A fast, lightweight Claude 4.5 model with vision, file input, and tool-use support optimized for low-latency applications.","creator":"anthropic","family":"claude","tier":"haiku","version":"4-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":200000,"max_output_tokens":64000,"tool_use_system_prompt_tokens":346,"output_vector_sizes":[],"knowledge_cutoff":"2025-02","training_data_cutoff":"2025-07","supported_reasoning_efforts":["default"],"tokenizer":"Claude","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-10-15","earliest_deprecation_date":"2026-10-15","deprecated":false,"has_pricing":true,"provider_count":9,"ids":["anthropic-claude-4-5-haiku","anthropic.claude-haiku-4-5-20251001-v1:0","anthropic.claude-haiku-4-5@20251001","anthropic/claude-haiku-4-5","anthropic/claude-haiku-4.5","apac.anthropic.claude-haiku-4-5-20251001-v1:0","au.anthropic.claude-haiku-4-5-20251001-v1:0","azure_ai/claude-haiku-4-5","bedrock/us-gov-east-1/anthropic.claude-haiku-4-5-20251001-v1:0","bedrock/us-gov-west-1/anthropic.claude-haiku-4-5-20251001-v1:0","claude-4-5-haiku","claude-4-5-haiku-reasoning","claude-haiku-4-5","claude-haiku-4-5-20251001","claude-haiku-4-5@20251001","databricks/databricks-claude-haiku-4-5","eu.anthropic.claude-haiku-4-5-20251001-v1:0","github_copilot/claude-haiku-4.5","global.anthropic.claude-haiku-4-5-20251001-v1:0","jp.anthropic.claude-haiku-4-5-20251001-v1:0","openrouter/anthropic/claude-haiku-4.5","perplexity/anthropic/claude-haiku-4-5","publishers/anthropic/models/claude-haiku-4-5","publishers/google/models/claude-haiku-4-5","replicate/anthropic/claude-4.5-haiku","snowflake/claude-haiku-4-5","us.anthropic.claude-haiku-4-5-20251001-v1:0","vercel_ai_gateway/anthropic/claude-haiku-4.5","vertex_ai/claude-haiku-4-5","vertex_ai/claude-haiku-4-5@20251001"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-4-5-haiku","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1,"max_input_per_1m":1.2,"min_output_per_1m":5,"max_output_per_1m":6,"min_cache_read_per_1m":0.1,"min_cache_write_per_1m":1.25,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","anthropic","azure_aifoundry","google_vertex_ai","openrouter","replicate","vercel_ai_gateway"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-5-nano","name":"gpt-5-nano","display_name":"GPT-5 Nano","description":"The smallest and fastest GPT-5 tier, designed for summarization, classification, and other speed- and cost-sensitive workloads with vision and image-generation support.","creator":"openai","family":"gpt","tier":"nano","version":"5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":5000000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-05","training_data_cutoff":null,"supported_reasoning_efforts":["default","minimal"],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-08-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["azure/eu/gpt-5-nano-2025-08-07","azure/gpt-5-nano","azure/gpt-5-nano-2025-08-07","azure/us/gpt-5-nano-2025-08-07","databricks/databricks-gpt-5-nano","gpt-5-nano","gpt-5-nano-2025-08-07","gpt-5-nano-medium","gpt-5-nano-minimal","oci/openai.gpt-5-nano","openai-gpt-5-nano","openai/gpt-5-nano","openrouter/openai/gpt-5-nano","replicate/openai/gpt-5-nano","snowflake/openai-gpt-5-nano"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-5-nano","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.04998,"max_input_per_1m":0.066,"min_output_per_1m":0.39998,"max_output_per_1m":0.48,"min_cache_read_per_1m":0.005,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"openai-gpt-4-1","name":"gpt-4-1","display_name":"GPT-4.1","description":"An OpenAI LLM excelling at instruction following and tool calling with a 1M-token context window and low latency without a reasoning step.","creator":"openai","family":"gpt","tier":"","version":"4-1","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1047576,"max_output_tokens":32768,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-06","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"GPT","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-14","earliest_deprecation_date":"2026-11-04","deprecated":false,"has_pricing":true,"provider_count":6,"ids":["azure/gpt-4.1","azure/gpt-4.1-2025-04-14","azure/us/gpt-4.1-2025-04-14","ft:gpt-4.1-2025-04-14","github_copilot/gpt-4.1","github_copilot/gpt-4.1-2025-04-14","gpt-4-1","gpt-4.1","gpt-4.1-2025-04-14","openai-gpt-4-1","openai/gpt-4.1","openrouter/openai/gpt-4.1","replicate/openai/gpt-4.1","snowflake/openai-gpt-4.1","vercel_ai_gateway/openai/gpt-4.1"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"openai-gpt-4-1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2.4,"min_output_per_1m":8,"max_output_per_1m":9.6,"min_cache_read_per_1m":0.5,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","openai","openrouter","replicate","vercel_ai_gateway"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-large-3","name":"mistral-large-3","display_name":"Mistral Large 3","description":"Mistral AI's third-generation flagship model, a multimodal Mixture-of-Experts architecture with 675B total parameters and 41B active parameters.","creator":"mistral","family":"mistral3","tier":"","version":"3","type":"language","size_in_bn":null,"modalities":{"input":["image"],"output":["text"]},"context_window":262144,"max_output_tokens":8191,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-12-02","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/mistral-large-3-fp8","azure_ai/mistral-large-3","fireworks_ai/accounts/fireworks/models/mistral-large-3-fp8","mistral-large-3","mistral/mistral-large-3"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-large-3","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":1.2,"min_output_per_1m":1.2,"max_output_per_1m":1.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["azure_aifoundry","mistral","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"deepseek-r1","name":"r1","display_name":"DeepSeek R1","description":"DeepSeek's flagship reasoning-focused LLM with strong performance in mathematics, coding, and logical inference, comparable to leading closed-source models.","creator":"deepseek","family":"deepseek-r1","tier":"","version":"1.0","type":"language","size_in_bn":684.531,"modalities":{"input":["text"],"output":["text"]},"context_window":163840,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"DeepSeek","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-01-20","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":14,"ids":["accounts/fireworks/models/deepseek-r1","azure_ai/deepseek-r1","deepinfra/deepseek-ai/DeepSeek-R1","deepseek-llm-r1","deepseek-r1","deepseek-r1-0120","deepseek-r1-qwen3-8b","deepseek-r1685","deepseek-reasoner","deepseek.r1-v1:0","deepseek/deepseek-r1","deepseek/deepseek-reasoner","fireworks_ai/accounts/fireworks/models/deepseek-r1","hyperbolic/deepseek-ai/DeepSeek-R1","nebius/deepseek-ai/DeepSeek-R1","openrouter/deepseek/deepseek-r1","replicate/deepseek-ai/deepseek-r1","sambanova/DeepSeek-R1","snowflake/deepseek-r1","together_ai/deepseek-ai/DeepSeek-R1","us.deepseek.r1-v1:0","vercel_ai_gateway/deepseek/deepseek-r1"],"hf_likes":13288,"hf_downloads":4020320,"hf_downloads_all_time":20204112,"hf_trending_score":20,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"deepseek-r1","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.28,"max_input_per_1m":5,"min_output_per_1m":0.4,"max_output_per_1m":10,"min_cache_read_per_1m":0.028,"min_cache_write_per_1m":null,"min_reasoning_per_1m":10,"cheapest_providers":["deepseek"],"provider_count":14},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-4-maverick","name":"llama-4-maverick","display_name":"Llama 4 Maverick","description":"Meta's Llama 4 Maverick MoE LLM with 128 experts and 17B active parameters, delivering high-capacity multimodal language and vision understanding.","creator":"meta","family":"llama4","tier":"","version":"4","type":"language","size_in_bn":401.584,"modalities":{"input":["image","text"],"output":["text"]},"context_window":1048576,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-08-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama4","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["databricks/databricks-llama-4-maverick","llama-4-maverick","meta-llama-4-maverick","meta-llama/llama-4-maverick","meta/llama-4-maverick","snowflake/llama4-maverick","vercel_ai_gateway/meta/llama-4-maverick"],"hf_likes":478,"hf_downloads":30421,"hf_downloads_all_time":554732,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-4-maverick","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":0.50001,"min_output_per_1m":0.485,"max_output_per_1m":1.50003,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-2-5-flash","name":"gemini-2-5-flash","display_name":"Gemini 2.5 Flash","description":"A fast, cost-efficient Gemini 2.5 thinking model with strong reasoning, vision, and tool-use capabilities designed for high-throughput applications.","creator":"google","family":"gemini","tier":"flash","version":"2-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["audio","text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-06-17","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":9,"ids":["databricks/databricks-gemini-2-5-flash","deepinfra/google/gemini-2.5-flash","gemini-2-5-flash","gemini-2-5-flash-04-2025","gemini-2-5-flash-dec-2025","gemini-2-5-flash-reasoning","gemini-2-5-flash-reasoning-04-2025","gemini-2.5-flash","gemini/gemini-2.5-flash","google_gemini-2-5-flash","google-gemini-2-5-flash","google/gemini-2.5-flash","oci/google.gemini-2.5-flash","openrouter/google/gemini-2.5-flash","perplexity/google/gemini-2.5-flash","publishers/google/models/gemini-2.5-flash","replicate/google/gemini-2.5-flash","vercel_ai_gateway/google/gemini-2.5-flash"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-2-5-flash","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.15,"max_input_per_1m":2.5,"min_output_per_1m":0.6,"max_output_per_1m":3,"min_cache_read_per_1m":0.03,"min_cache_write_per_1m":0.03,"min_reasoning_per_1m":2.5,"cheapest_providers":["google_gemini","google_vertex_ai","oracle_oci"],"provider_count":9},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-large-2","name":"mistral-large-2","display_name":"Mistral Large 2","description":"The second major release of Mistral AI's flagship model, offering improved reasoning, coding, and instruction-following capabilities.","creator":"mistral","family":"mistral","tier":"","version":"2","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["mistral-large-2","snowflake/mistral-large2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-large-2","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1,"max_input_per_1m":1,"min_output_per_1m":3,"max_output_per_1m":3,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"anthropic-claude-3-5-sonnet","name":"claude-3-5-sonnet","display_name":"Claude Sonnet 3.5","description":"A mid-tier Claude model offering strong reasoning and instruction-following across text and multimodal tasks.","creator":"anthropic","family":"claude","tier":"sonnet","version":"3-5","type":"language","size_in_bn":null,"modalities":{"input":["image","pdf","text"],"output":["text"]},"context_window":1000000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":159,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":false,"computer_use":true,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-06-20","earliest_deprecation_date":"2026-07","deprecated":false,"has_pricing":true,"provider_count":7,"ids":["anthropic-claude-3-5-sonnet","anthropic.claude-3-5-sonnet-20240620-v1:0","anthropic.claude-3-5-sonnet-20241022-v2:0","apac.anthropic.claude-3-5-sonnet-20240620-v1:0","apac.anthropic.claude-3-5-sonnet-20241022-v2:0","bedrock/invoke/anthropic.claude-3-5-sonnet-20240620-v1:0","bedrock/us-gov-east-1/anthropic.claude-3-5-sonnet-20240620-v1:0","bedrock/us-gov-west-1/anthropic.claude-3-5-sonnet-20240620-v1:0","claude-35-sonnet","claude-35-sonnet-june-24","eu.anthropic.claude-3-5-sonnet-20240620-v1:0","eu.anthropic.claude-3-5-sonnet-20241022-v2:0","gradient_ai/anthropic-claude-3.5-sonnet","heroku/claude-3-5-sonnet-latest","openrouter/anthropic/claude-3.5-sonnet","replicate/anthropic/claude-3.5-sonnet","snowflake/claude-3-5-sonnet","us.anthropic.claude-3-5-sonnet-20240620-v1:0","vercel_ai_gateway/anthropic/claude-3-5-sonnet","vercel_ai_gateway/anthropic/claude-3-5-sonnet-20241022","vercel_ai_gateway/anthropic/claude-3.5-sonnet","vertex_ai/claude-3-5-sonnet","vertex_ai/claude-3-5-sonnet@20240620"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"anthropic-claude-3-5-sonnet","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":3,"max_input_per_1m":3.75,"min_output_per_1m":15,"max_output_per_1m":18.75,"min_cache_read_per_1m":0.3,"min_cache_write_per_1m":3.75,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","google_vertex_ai","gradient_ai","openrouter","snowflake","vercel_ai_gateway"],"provider_count":7},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-pixtral-large","name":"pixtral-large","display_name":"Pixtral Large (25.02)","description":"Mistral's large-scale multimodal model combining vision understanding and tool-use capabilities for complex image-text reasoning tasks.","creator":"mistral","family":"pixtral","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":128000,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-07-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-08","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["eu.mistral.pixtral-large-2502-v1:0","mistral-pixtral-large","mistral.pixtral-large-2502-v1:0","mistral/pixtral-large","mistral/pixtral-large-2411","mistral/pixtral-large-latest","mistralai/pixtral-large-2411","pixtral-large-2411","us.mistral.pixtral-large-2502-v1:0","vercel_ai_gateway/mistral/pixtral-large"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-pixtral-large","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2.4,"min_output_per_1m":6,"max_output_per_1m":7.2,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["amazon_bedrock","mistral","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-4-scout","name":"llama-4-scout","display_name":"Llama 4 Scout","description":"Meta's Llama 4 Scout MoE LLM with 17B active parameters and 16 experts, offering efficient multimodal inference with native image and text support.","creator":"meta","family":"llama4","tier":"","version":"4","type":"language","size_in_bn":108.642,"modalities":{"input":["image","text"],"output":["text"]},"context_window":10000000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-08-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama4","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-04-05","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["llama-4-scout","meta-llama-4-scout","meta-llama/llama-4-scout","meta/llama-4-scout","vercel_ai_gateway/meta/llama-4-scout"],"hf_likes":1274,"hf_downloads":399353,"hf_downloads_all_time":5433902,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-4-scout","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":0.25,"min_output_per_1m":0.3,"max_output_per_1m":0.792,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-2-5-flash-lite","name":"gemini-2-5-flash-lite","display_name":"Gemini 2.5 Flash Lite","description":"A lightweight Gemini 2.5 Flash variant optimized for ultra-low latency and cost efficiency while retaining reasoning capabilities.","creator":"google","family":"gemini","tier":"flash-lite","version":"2-5","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2025-07-22","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["gemini-2-5-flash-lite","gemini-2-5-flash-lite-reasoning","gemini-2.5-flash-lite","gemini/gemini-2.5-flash-lite","google-gemini-2-5-flash-lite","google/gemini-2.5-flash-lite","oci/google.gemini-2.5-flash-lite","publishers/google/models/gemini-2.5-flash-lite"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-2-5-flash-lite","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.075,"max_input_per_1m":0.12,"min_output_per_1m":0.3,"max_output_per_1m":0.48,"min_cache_read_per_1m":0.01,"min_cache_write_per_1m":0.01,"min_reasoning_per_1m":0.4,"cheapest_providers":["oracle_oci"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-large","name":"mistral-large","display_name":"Mistral Large","description":"Mistral AI's flagship large language model excelling at reasoning, code generation, JSON output, and multilingual tasks.","creator":"mistral","family":"mistral","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":262144,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2024-11-30","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Mistral","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":true,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-02-26","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":8,"ids":["azure_ai/mistral-large","azure_ai/mistral-large-2407","azure_ai/mistral-large-latest","azure/mistral-large-2402","azure/mistral-large-latest","bedrock/eu-west-3/mistral.mistral-large-2402-v1:0","bedrock/us-east-1/mistral.mistral-large-2402-v1:0","bedrock/us-west-2/mistral.mistral-large-2402-v1:0","mistral-large","mistral-large-2407","mistral-large-2512","mistral-large-latest","mistral.mistral-large-2402-v1:0","mistral.mistral-large-2407-v1:0","mistral/mistral-large-2402","mistral/mistral-large-2407","mistral/mistral-large-2411","mistral/mistral-large-2512","mistral/mistral-large-latest","mistralai/mistral-large","mistralai/mistral-large-2407","mistralai/mistral-large-2411","mistralai/mistral-large-2512","openrouter/mistralai/mistral-large","openrouter/mistralai/mistral-large-2512","snowflake/mistral-large","vercel_ai_gateway/mistral/mistral-large","vertex_ai/mistral-large-2411","vertex_ai/mistral-large@2407","vertex_ai/mistral-large@2411-001","vertex_ai/mistral-large@latest","watsonx/mistralai/mistral-large"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-large","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.5,"max_input_per_1m":8,"min_output_per_1m":1.5,"max_output_per_1m":24,"min_cache_read_per_1m":0.05,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter"],"provider_count":8},"providers":[],"regions":[],"region_info":{}}},{"id":"snowflake-arctic-1-5-embed-m","name":"snowflake-arctic-1-5-embed-m","display_name":"Arctic 1.5 Embed M","description":"A medium-sized embedding model in Snowflake's Arctic 1.5 series, designed for high-quality semantic retrieval and enterprise search.","creator":"snowflake","family":"arctic","tier":"","version":"1-5","type":"embedding","size_in_bn":null,"modalities":{"input":["text"],"output":["embedding"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["snowflake-arctic-1-5-embed-m"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"snowflake-arctic-1-5-embed-m","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.06,"max_input_per_1m":0.06,"min_output_per_1m":0.06,"max_output_per_1m":0.06,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"snowflake-arctic-2-embed-l","name":"snowflake-arctic-2-embed-l","display_name":"Arctic 2 Embed L","description":"A large embedding model in Snowflake's Arctic 2 series, delivering high-dimensional semantic representations for enterprise retrieval workloads.","creator":"snowflake","family":"arctic","tier":"","version":"2","type":"embedding","size_in_bn":0.568,"modalities":{"input":["text"],"output":["embedding"]},"context_window":8192,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["snowflake-arctic-2-embed-l","snowflake/snowflake-arctic-embed-l-v2.0"],"hf_likes":248,"hf_downloads":1062514,"hf_downloads_all_time":10289273,"hf_trending_score":1,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"snowflake-arctic-2-embed-l","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.1,"max_input_per_1m":0.1,"min_output_per_1m":0.1,"max_output_per_1m":0.1,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"snowflake-arctic-embed-2-m","name":"snowflake-arctic-embed-2-m","display_name":"Arctic Embed 2 M","description":"A medium-sized second-generation embedding model from Snowflake's Arctic series, optimized for dense vector retrieval tasks.","creator":"snowflake","family":"embed","tier":"","version":"2","type":"embedding","size_in_bn":null,"modalities":{"input":["text"],"output":["embedding"]},"context_window":8192,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["snowflake-arctic-embed-2-m","snowflake/snowflake-arctic-embed-m-v2.0"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"snowflake-arctic-embed-2-m","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.07,"max_input_per_1m":0.07,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"snowflake-arctic-embed-m","name":"snowflake-arctic-embed-m","display_name":"Arctic Embed M","description":"A medium-sized text embedding model from Snowflake's Arctic series, optimized for efficient semantic search and retrieval-augmented generation.","creator":"snowflake","family":"arctic","tier":"","version":null,"type":"embedding","size_in_bn":null,"modalities":{"input":["text"],"output":["embedding"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["snowflake-arctic-embed-m"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"snowflake-arctic-embed-m","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.06,"max_input_per_1m":0.06,"min_output_per_1m":0.06,"max_output_per_1m":0.06,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"snowflake-arctic-extract","name":"arctic-extract","display_name":"Arctic Extract","description":"A Snowflake Arctic model specialized for structured information extraction from unstructured enterprise text.","creator":"snowflake","family":"arctic","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["snowflake-arctic-extract"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"snowflake-arctic-extract","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":11.1,"max_input_per_1m":11.1,"min_output_per_1m":11.1,"max_output_per_1m":11.1,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"snowflake-arctic-tilt-entity","name":"arctic-tilt-entity","display_name":"Arctic Tilt Entity","description":"A Snowflake Arctic model variant from the TILT series, specialized for named entity recognition in enterprise documents.","creator":"snowflake","family":"arctic","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["snowflake-arctic-tilt-entity"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"snowflake-arctic-tilt-entity","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":19,"max_input_per_1m":19,"min_output_per_1m":19,"max_output_per_1m":19,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"snowflake-arctic-tilt-table","name":"arctic-tilt-table","display_name":"Arctic Tilt Table","description":"A Snowflake Arctic TILT model variant focused on structured table understanding and extraction from enterprise documents.","creator":"snowflake","family":"arctic","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["snowflake-arctic-tilt-table"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"snowflake-arctic-tilt-table","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":56.8,"max_input_per_1m":56.8,"min_output_per_1m":56.8,"max_output_per_1m":56.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"microsoft-e5-2-base","name":"e5-2-base","display_name":"E5 Base V2","description":"A base-size V2 text embedding model from the E5 family, designed for general-purpose sentence similarity and retrieval.","creator":"microsoft","family":"e5","tier":"","version":"2","type":"embedding","size_in_bn":null,"modalities":{"input":["text"],"output":["embedding"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["huggingface-sentencesimilarity-e5-base-v2","intfloat/e5-base-v2","microsoft-e5-2-base"],"hf_likes":155,"hf_downloads":1663286,"hf_downloads_all_time":20305144,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"microsoft-e5-2-base","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.06,"max_input_per_1m":0.06,"min_output_per_1m":0.06,"max_output_per_1m":0.06,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-1-flash-lite","name":"gemini-3-1-flash-lite","display_name":"Gemini 3.1 Flash Lite","description":"A lightweight, cost-efficient variant of Gemini 3.1 Flash designed for high-throughput multimodal tasks at minimal latency.","creator":"google","family":"gemini","tier":"flash-lite","version":"3-1","type":"language","size_in_bn":null,"modalities":{"input":["audio","image","pdf","text","video"],"output":["text"]},"context_window":1048576,"max_output_tokens":65536,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2025-01","training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Gemini","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":true,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":true,"file_search":true,"url_context":true,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2026-05-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["gemini-3.1-flash-lite","gemini/gemini-3.1-flash-lite","google-gemini-3-1-flash-lite","google/gemini-3.1-flash-lite","openrouter/google/gemini-3.1-flash-lite","publishers/google/models/gemini-3.1-flash-lite","vertex_ai/gemini-3.1-flash-lite"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-1-flash-lite","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.25,"max_input_per_1m":0.3,"min_output_per_1m":1.5,"max_output_per_1m":1.8,"min_cache_read_per_1m":0.025,"min_cache_write_per_1m":0.025,"min_reasoning_per_1m":1.5,"cheapest_providers":["google_gemini","google_vertex_ai","openrouter","vercel_ai_gateway"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}},{"id":"google-gemini-3-1-pro","name":"gemini-3-1-pro","display_name":"Gemini 3.1 Pro","description":"Google's pro-tier LLM in the Gemini 3.1 generation offering high-capability multimodal reasoning, coding, and tool use.","creator":"google","family":"gemini","tier":"pro","version":"3-1","type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["google-gemini-3-1-pro","google/gemini-3.1-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"google-gemini-3-1-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2.4,"max_input_per_1m":2.4,"min_output_per_1m":14.4,"max_output_per_1m":14.4,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-70b","name":"meta-llama-3-70b","display_name":"Llama 3 70B","description":"Meta's 70B pre-trained LLM from the Llama 3 generation, offering strong general-purpose text generation and reasoning capabilities.","creator":"meta","family":"llama","tier":"","version":"3","type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["meta-llama-3-70b","meta-textgeneration-llama-3-70b","meta-textgenerationneuron-llama-3-70b","ollama/llama3:70b","replicate/meta/llama-3-70b","snowflake/llama3-70b","vercel_ai_gateway/meta/llama-3-70b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-70b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.59,"max_input_per_1m":2.42,"min_output_per_1m":0.79,"max_output_per_1m":2.75,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["vercel_ai_gateway"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-8b","name":"meta-llama-3-8b","display_name":"Llama 3 8B","description":"Meta's compact 8B pre-trained LLM from the Llama 3 generation, suitable for efficient on-device and low-cost cloud inference.","creator":"meta","family":"llama","tier":"","version":"3","type":"language","size_in_bn":8,"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/llama-v3-8b","fireworks_ai/accounts/fireworks/models/llama-v3-8b","meta-llama-3-8b","meta-textgeneration-llama-3-8b","meta-textgenerationneuron-llama-3-8b","ollama/llama3:8b","replicate/meta/llama-3-8b","snowflake/llama3-8b","vercel_ai_gateway/meta/llama-3-8b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-8b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.05,"max_input_per_1m":0.38,"min_output_per_1m":0.08,"max_output_per_1m":0.38,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["replicate","vercel_ai_gateway"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-405b","name":"meta-llama-3-1-405b","display_name":"Llama 3.1 405B","description":"Meta's flagship 405B-parameter pre-trained LLM in the Llama 3.1 series, offering frontier-scale text generation with FP8 precision support.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":405,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["meta-llama-3-1-405b","meta-textgeneration-llama-3-1-405b-fp8","snowflake/llama3.1-405b","snowflake/snowflake-llama-3.1-405b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-405b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1.2,"max_input_per_1m":5,"min_output_per_1m":1.2,"max_output_per_1m":16,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-70b","name":"meta-llama-3-1-70b","display_name":"Llama 3.1 70B","description":"Meta's 70B pre-trained LLM in the Llama 3.1 series, balancing high capability with practical deployment costs and supporting tool-use tasks.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["cerebras/llama3.1-70b","meta-llama-3-1-70b","meta-textgeneration-llama-3-1-70b","meta-textgenerationneuron-llama-3-1-70b","meta/llama-3.1-70b","snowflake/llama3.1-70b","vercel_ai_gateway/meta/llama-3.1-70b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-70b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.36,"max_input_per_1m":0.72,"min_output_per_1m":0.36,"max_output_per_1m":0.72,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-8b","name":"meta-llama-3-1-8b","display_name":"Llama 3.1 8B","description":"Meta's compact 8B pre-trained LLM in the Llama 3.1 series, offering efficient on-device or low-cost inference with tool-use support.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":8,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["cerebras/llama3.1-8b","llamagate/llama-3.1-8b","meta-llama-3-1-8b","meta-textgeneration-llama-3-1-8b","meta-textgenerationneuron-llama-3-1-8b","meta/llama-3.1-8b","snowflake/llama3.1-8b","vercel_ai_gateway/meta/llama-3.1-8b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-8b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.03,"max_input_per_1m":0.22,"min_output_per_1m":0.05,"max_output_per_1m":0.22,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["other/llamagate"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-2-1b","name":"meta-llama-3-2-1b","display_name":"Llama 3.2 1B","description":"Meta's ultra-compact 1B pre-trained LLM from the Llama 3.2 series, designed for on-device and edge inference with minimal resource requirements.","creator":"meta","family":"llama","tier":"","version":"3-2","type":"language","size_in_bn":1,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-09-18","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/llama-v3p2-1b","fireworks_ai/accounts/fireworks/models/llama-v3p2-1b","meta-llama-3-2-1b","meta-textgeneration-llama-3-2-1b","meta-textgenerationneuron-llama-3-2-1b","meta/llama-3.2-1b","snowflake/llama3.2-1b","vercel_ai_gateway/meta/llama-3.2-1b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-2-1b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.05,"max_input_per_1m":0.1,"min_output_per_1m":0.05,"max_output_per_1m":0.1,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-2-3b","name":"meta-llama-3-2-3b","display_name":"Llama 3.2 3B","description":"Meta's 3B pre-trained LLM from the Llama 3.2 series, balancing compact size with capable text generation for edge and mobile deployments.","creator":"meta","family":"llama","tier":"","version":"3-2","type":"language","size_in_bn":3,"modalities":{"input":["text"],"output":["text"]},"context_window":131072,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-09-18","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":4,"ids":["accounts/fireworks/models/llama-v3p2-3b","fireworks_ai/accounts/fireworks/models/llama-v3p2-3b","llamagate/llama-3.2-3b","meta-llama-3-2-3b","meta-textgeneration-llama-3-2-3b","meta-textgenerationneuron-llama-3-2-3b","meta/llama-3.2-3b","snowflake/llama3.2-3b","vercel_ai_gateway/meta/llama-3.2-3b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-2-3b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.04,"max_input_per_1m":0.15,"min_output_per_1m":0.075,"max_output_per_1m":0.15,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["other/llamagate"],"provider_count":4},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-3-70b","name":"llama-3-3-70b","display_name":"Llama 3.3 70B","description":"Meta's 70B instruction-tuned LLM from the Llama 3.3 series, designed for high-performance conversational AI, content creation, and enterprise applications.","creator":"meta","family":"llama","tier":"","version":"3-3","type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2024-12-06","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["cerebras/llama-3.3-70b","meta-llama-3-3-70b","meta/llama-3.3-70b","snowflake/llama3.3-70b","snowflake/snowflake-llama-3.3-70b","vercel_ai_gateway/meta/llama-3.3-70b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-3-70b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.36,"max_input_per_1m":0.85,"min_output_per_1m":0.36,"max_output_per_1m":1.2,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["snowflake"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"mistral-7b","name":"7b","display_name":"Mistral 7B","description":"Mistral AI's foundational 7B-parameter base language model known for strong performance relative to its compact size.","creator":"mistral","family":"mistral","tier":"","version":null,"type":"language","size_in_bn":7,"modalities":{"input":["text"],"output":["text"]},"context_window":32768,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":true,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":5,"ids":["accounts/fireworks/models/hermes-2-pro-mistral-7b","accounts/fireworks/models/mistral-7b","accounts/fireworks/models/mistral-7b-v0p2","accounts/fireworks/models/openhermes-2-mistral-7b","accounts/fireworks/models/openhermes-2p5-mistral-7b","fireworks_ai/accounts/fireworks/models/hermes-2-pro-mistral-7b","fireworks_ai/accounts/fireworks/models/mistral-7b","fireworks_ai/accounts/fireworks/models/mistral-7b-v0p2","fireworks_ai/accounts/fireworks/models/openhermes-2-mistral-7b","fireworks_ai/accounts/fireworks/models/openhermes-2p5-mistral-7b","huggingface-llm-dolphin-2-2-1-mistral-7b","huggingface-llm-mistral-7b","huggingface-llm-teknium-openhermes-2-mistral-7b","huggingface-llmneuron-mistral-7b","llamagate/mistral-7b-v0.3","mistral-7b","mistral/open-mistral-7b","replicate/mistralai/mistral-7b-v0.1","snowflake/mistral-7b","teknium/openhermes-2.5-mistral-7b"],"hf_likes":900,"hf_downloads":6234,"hf_downloads_all_time":3856208,"hf_trending_score":3,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"mistral-7b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.05,"max_input_per_1m":0.25,"min_output_per_1m":0.1,"max_output_per_1m":0.25,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["replicate"],"provider_count":5},"providers":[],"regions":[],"region_info":{}}}],"pagination":{"page_size":50,"has_next":true,"next_token":"NTA","total_count":58},"meta":{"updated_at":"2026-06-13","request_id":"dfdd3103-4d14-4d29-9848-8429eb22468a","execution_ms":19}}