{"data":[{"id":"perplexity-sonar-pro-reasoning","name":"sonar-pro-reasoning","display_name":"Sonar Reasoning Pro","description":"A reasoning-enhanced pro-tier Sonar model that combines Perplexity's web search with chain-of-thought reasoning for complex analytical queries.","creator":"perplexity","family":"sonar","tier":"pro","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":128000,"max_output_tokens":8000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-03-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["perplexity-sonar-pro-reasoning","perplexity/sonar-reasoning-pro","sonar-reasoning-pro","vercel_ai_gateway/perplexity/sonar-reasoning-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-pro-reasoning","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2,"min_output_per_1m":8,"max_output_per_1m":8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","perplexity","vercel_ai_gateway"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar-reasoning","name":"sonar-reasoning","display_name":"Sonar Reasoning","description":"A reasoning-focused Sonar model from Perplexity that integrates chain-of-thought capabilities with web search for structured analytical responses.","creator":"perplexity","family":"sonar","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":8000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["perplexity-sonar-reasoning","perplexity/sonar-reasoning","sonar-reasoning","vercel_ai_gateway/perplexity/sonar-reasoning"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-reasoning","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1,"max_input_per_1m":1,"min_output_per_1m":5,"max_output_per_1m":5,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity","vercel_ai_gateway"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar","name":"sonar","display_name":"Sonar","description":"Perplexity's lightweight web-search-augmented LLM with citation support, designed for fast and affordable question-answering with customizable sources.","creator":"perplexity","family":"sonar","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":128000,"max_output_tokens":8000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-01-27","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["perplexity-sonar","perplexity/perplexity/sonar","perplexity/sonar","sonar","vercel_ai_gateway/perplexity/sonar"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":1,"max_input_per_1m":1,"min_output_per_1m":1,"max_output_per_1m":1,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","perplexity","vercel_ai_gateway"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar-pro","name":"sonar-pro","display_name":"Sonar Pro","description":"Perplexity's premium Sonar model with vision and tool-use capabilities, offering deeper search integration and enterprise-grade question-answering.","creator":"perplexity","family":"sonar","tier":"pro","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["image","text"],"output":["text"]},"context_window":200000,"max_output_tokens":8000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Other","capabilities":{"function_calling":true,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-03-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["perplexity-sonar-pro","perplexity/sonar-pro","sonar-pro","vercel_ai_gateway/perplexity/sonar-pro"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-pro","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":3,"max_input_per_1m":3,"min_output_per_1m":15,"max_output_per_1m":15,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["openrouter","perplexity","vercel_ai_gateway"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-70b-instruct","name":"llama-3-1-70b-instruct","display_name":"Llama 3.1 70B Instruct","description":"Meta's 70B instruction-tuned LLM with strong tool-use and multilingual capabilities, widely deployed across cloud regions for enterprise workloads.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":70,"modalities":{"input":["image","text"],"output":["text"]},"context_window":131072,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-12-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":13,"ids":["accounts/fireworks/models/llama-v3p1-70b-instruct","accounts/fireworks/models/llama-v3p1-70b-instruct-1b","azure_ai/Meta-Llama-3.1-70B-Instruct","deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct","deepinfra/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","fireworks_ai/accounts/fireworks/models/llama-v3p1-70b-instruct","fireworks_ai/accounts/fireworks/models/llama-v3p1-70b-instruct-1b","friendliai/meta-llama-3.1-70b-instruct","hyperbolic/meta-llama/Meta-Llama-3.1-70B-Instruct","lambda_ai/llama3.1-70b-instruct-fp8","llama-3-1-instruct-70b","meta-llama-3-1-70b-instruct","meta-llama/llama-3.1-70b-instruct","meta-llama/Meta-Llama-3.1-70B-Instruct","meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","meta-textgeneration-llama-3-1-70b-instruct","meta-textgenerationneuron-llama-3-1-70b-instruct","meta.llama3-1-70b-instruct-v1:0","meta.llama3-1-70b-instruct-v1:0:128k","nebius/meta-llama/Meta-Llama-3.1-70B-Instruct","oci/meta.llama-3.1-70b-instruct","ovhcloud/Meta-Llama-3_1-70B-Instruct","perplexity/llama-3.1-70b-instruct","together_ai/meta-llama/Meta-Llama-3.1-70B-Instruct-Turbo","us.meta.llama3-1-70b-instruct-v1:0","vertex_ai/meta/llama-3.1-70b-instruct-maas"],"hf_likes":907,"hf_downloads":737459,"hf_downloads_all_time":20735812,"hf_trending_score":0,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-70b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.12,"max_input_per_1m":2.68,"min_output_per_1m":0.3,"max_output_per_1m":3.54,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["hyperbolic","lambda"],"provider_count":13},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-3-1-8b-instruct","name":"llama-3-1-8b-instruct","display_name":"Llama 3.1 8B Instruct","description":"Meta's 8B instruction-tuned LLM optimized for fast, cost-effective deployment across multiple cloud regions with strong instruction-following performance.","creator":"meta","family":"llama","tier":"","version":"3-1","type":"language","size_in_bn":8,"modalities":{"input":["image","text"],"output":["text"]},"context_window":200000,"max_output_tokens":128000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":"2023-12-31","training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":"Llama3","capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":true,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":true,"adaptive_reasoning":false},"release_date":"2024-07-23","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":21,"ids":["@cf/meta/llama-3.1-8b-instruct","accounts/fireworks/models/full-llama-v3p1-8b-instruct-8b-fp8","accounts/fireworks/models/full-llama-v3p1-8b-instruct-8b-fp8-amd","accounts/fireworks/models/llama-v3p1-8b-instruct","azure_ai/Meta-Llama-3.1-8B-Instruct","databricks/databricks-meta-llama-3-1-8b-instruct","deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct","deepinfra/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","fireworks_ai/accounts/fireworks/models/llama-v3p1-8b-instruct","friendliai/meta-llama-3.1-8b-instruct","groq/llama-3.1-8b-instant","hyperbolic/meta-llama/Meta-Llama-3.1-8B-Instruct","lambda_ai/llama3.1-8b-instruct","llama-3-1-instruct-8b","meta-llama-3-1-8b-instruct","meta-llama/llama-3.1-8b-instruct","meta-llama/Meta-Llama-3.1-8B-Instruct","meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","meta-textgeneration-llama-3-1-8b-instruct","meta-textgenerationneuron-llama-3-1-8b-instruct","meta.llama3-1-8b-instruct-v1:0","meta.llama3-1-8b-instruct-v1:0:128k","nebius/meta-llama/Meta-Llama-3.1-8B-Instruct","novita/meta-llama/llama-3.1-8b-instruct","nscale/meta-llama/Llama-3.1-8B-Instruct","oci/meta.llama-3.1-8b-instruct","ovhcloud/Llama-3.1-8B-Instruct","perplexity/llama-3.1-8b-instruct","sambanova/Meta-Llama-3.1-8B-Instruct","together_ai/meta-llama/Meta-Llama-3.1-8B-Instruct-Turbo","us.meta.llama3-1-8b-instruct-v1:0","vertex_ai/meta/llama-3.1-8b-instruct-maas","wandb/meta-llama/Llama-3.1-8B-Instruct"],"hf_likes":5731,"hf_downloads":9306502,"hf_downloads_all_time":140394735,"hf_trending_score":24,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-3-1-8b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.02,"max_input_per_1m":22,"min_output_per_1m":0.03,"max_output_per_1m":22,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["huggingface","nebius","novita","openrouter"],"provider_count":21},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-llama-2-70b-chat","name":"llama-2-70b-chat","display_name":"Llama 2 70B Chat","description":"A 70B Llama 2 model fine-tuned with RLHF for dialogue, providing high-quality conversational responses at the largest Llama 2 scale.","creator":"meta","family":"llama","tier":"","version":"2","type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":6,"ids":["anyscale/meta-llama/Llama-2-70b-chat-hf","databricks/databricks-llama-2-70b-chat","fireworks_ai/accounts/fireworks/models/llama-v2-70b-chat","llama-2-chat-70b","meta-llama-2-70b-chat","meta.llama2-70b-chat-v1","perplexity/llama-2-70b-chat","replicate/meta/llama-2-70b-chat","snowflake/llama2-70b-chat"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-llama-2-70b-chat","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.50001,"max_input_per_1m":1.95,"min_output_per_1m":0.9,"max_output_per_1m":2.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["databricks"],"provider_count":6},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-codellama-34b-instruct","name":"meta-codellama-34b-instruct","display_name":"Code Llama 34B Instruct","description":"A 34B-parameter instruction-tuned Code Llama model designed to follow natural language instructions for code generation tasks.","creator":"meta","family":"llama","tier":"","version":null,"type":"language","size_in_bn":34,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":true,"parallel_function_calling":true,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/code-llama-34b-instruct","anyscale/codellama/CodeLlama-34b-Instruct-hf","fireworks_ai/accounts/fireworks/models/code-llama-34b-instruct","meta-codellama-34b-instruct","meta-textgeneration-llama-codellama-34b-instruct","perplexity/codellama-34b-instruct","together_ai/togethercomputer/CodeLlama-34b-Instruct"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-codellama-34b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.35,"max_input_per_1m":1,"min_output_per_1m":0.9,"max_output_per_1m":1.4,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"meta-codellama-70b-instruct","name":"meta-codellama-70b-instruct","display_name":"Code Llama 70B Instruct","description":"A 70B-parameter instruction-tuned Code Llama model designed to follow natural language instructions for complex code generation tasks.","creator":"meta","family":"llama","tier":"","version":null,"type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":3,"ids":["accounts/fireworks/models/code-llama-70b-instruct","anyscale/codellama/CodeLlama-70b-Instruct-hf","fireworks_ai/accounts/fireworks/models/code-llama-70b-instruct","meta-codellama-70b-instruct","meta-textgeneration-llama-codellama-70b-instruct","perplexity/codellama-70b-instruct"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"meta-codellama-70b-instruct","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.7,"max_input_per_1m":1,"min_output_per_1m":0.9,"max_output_per_1m":2.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":3},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-70b-chat","name":"pplx-70b-chat","display_name":"PPLX 70B Chat","description":"A 70B Perplexity chat model offering high-capacity conversational AI without real-time web search integration.","creator":"perplexity","family":"pplx","tier":"","version":null,"type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-70b-chat","perplexity/pplx-70b-chat"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-70b-chat","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.7,"max_input_per_1m":0.7,"min_output_per_1m":2.8,"max_output_per_1m":2.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-70b-online","name":"pplx-70b-online","display_name":"PPLX 70B Online","description":"A 70B Perplexity model with real-time web search access, combining large-scale language understanding with live online retrieval.","creator":"perplexity","family":"pplx","tier":"","version":null,"type":"language","size_in_bn":70,"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-70b-online","perplexity/pplx-70b-online"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-70b-online","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":null,"max_input_per_1m":null,"min_output_per_1m":2.8,"max_output_per_1m":2.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":[],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-7b-chat","name":"pplx-7b-chat","display_name":"PPLX 7B Chat","description":"A compact 7B Perplexity chat model for efficient conversational AI without web search, suited for low-latency deployments.","creator":"perplexity","family":"pplx","tier":"","version":null,"type":"language","size_in_bn":7,"modalities":{"input":["text"],"output":["text"]},"context_window":8192,"max_output_tokens":8192,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-7b-chat","perplexity/pplx-7b-chat"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-7b-chat","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.07,"max_input_per_1m":0.07,"min_output_per_1m":0.28,"max_output_per_1m":0.28,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-7b-online","name":"pplx-7b-online","display_name":"PPLX 7B Online","description":"A lightweight 7B Perplexity model augmented with real-time web search, enabling up-to-date answers at low computational cost.","creator":"perplexity","family":"pplx","tier":"","version":null,"type":"language","size_in_bn":7,"modalities":{"input":["text"],"output":["text"]},"context_window":4096,"max_output_tokens":4096,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-7b-online","perplexity/pplx-7b-online"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-7b-online","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":null,"max_input_per_1m":null,"min_output_per_1m":0.28,"max_output_per_1m":0.28,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":[],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-embed-1-0-6b","name":"pplx-embed-1-0-6b","display_name":"PPLX Embed 1.0 0.6B","description":"A compact 0.6B embedding model from Perplexity's PPLX series, designed for efficient semantic text representation and retrieval.","creator":"perplexity","family":"embed","tier":"","version":"1","type":"embedding","size_in_bn":0.6,"modalities":{"input":["text"],"output":["embedding"]},"context_window":32768,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[1024],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-embed-1-0-6b","perplexity/pplx-embed-v1-0.6b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-embed-1-0-6b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.004,"max_input_per_1m":0.004,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-embed-1-4b","name":"pplx-embed-1-4b","display_name":"PPLX Embed 1.4B","description":"A 1.4B embedding model from Perplexity's PPLX series, offering a balance of embedding quality and computational efficiency for semantic search.","creator":"perplexity","family":"embed","tier":"","version":"1","type":"embedding","size_in_bn":4,"modalities":{"input":["text"],"output":["embedding"]},"context_window":32768,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[2560],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-embed-1-4b","perplexity/pplx-embed-v1-4b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-embed-1-4b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.03,"max_input_per_1m":0.03,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-embed-context-1-0-6b","name":"pplx-embed-context-1-0-6b","display_name":"PPLX Embed Context 1 0.6B","description":"A context-aware 0.6B embedding model from Perplexity, designed to capture richer contextual signals for improved retrieval performance.","creator":"perplexity","family":"pplx","tier":"","version":"1","type":"embedding","size_in_bn":0.6,"modalities":{"input":["text"],"output":["embedding"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-embed-context-1-0-6b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-embed-context-1-0-6b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.008,"max_input_per_1m":0.008,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-pplx-embed-context-1-4b","name":"pplx-embed-context-1-4b","display_name":"PPLX Embed Context 1.4B","description":"A context-aware 1.4B embedding model from Perplexity, providing enhanced contextual text representations for semantic search and retrieval tasks.","creator":"perplexity","family":"pplx","tier":"","version":"1","type":"embedding","size_in_bn":4,"modalities":{"input":["text"],"output":["embedding"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-pplx-embed-context-1-4b"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-pplx-embed-context-1-4b","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.05,"max_input_per_1m":0.05,"min_output_per_1m":null,"max_output_per_1m":null,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar-deep-research","name":"sonar-deep-research","display_name":"Sonar Deep Research","description":"A research-focused Sonar model that autonomously performs multi-step web retrieval, source evaluation, and synthesis for complex research queries.","creator":"perplexity","family":"sonar","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":128000,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":["default"],"tokenizer":"Other","capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":true,"web_search":true,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":"2025-03-07","earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["perplexity-sonar-deep-research","perplexity/sonar-deep-research"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-deep-research","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":2,"max_input_per_1m":2,"min_output_per_1m":8,"max_output_per_1m":8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":3,"cheapest_providers":["openrouter","perplexity"],"provider_count":2},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar-medium-chat","name":"sonar-medium-chat","display_name":"Sonar Medium Chat","description":"A mid-sized Sonar chat model from Perplexity offering conversational AI without live web search integration.","creator":"perplexity","family":"sonar","tier":"medium","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-sonar-medium-chat","perplexity/sonar-medium-chat"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-medium-chat","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.6,"max_input_per_1m":0.6,"min_output_per_1m":1.8,"max_output_per_1m":1.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar-medium-online","name":"sonar-medium-online","display_name":"Sonar Medium Online","description":"A mid-sized Sonar model with real-time web search, balancing response quality and retrieval capability for online question-answering.","creator":"perplexity","family":"sonar","tier":"medium","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":12000,"max_output_tokens":12000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-sonar-medium-online","perplexity/sonar-medium-online"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-medium-online","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":null,"max_input_per_1m":null,"min_output_per_1m":1.8,"max_output_per_1m":1.8,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":[],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar-small-chat","name":"sonar-small-chat","display_name":"Sonar Small Chat","description":"A lightweight Sonar chat model from Perplexity optimized for low-latency conversational AI without live web retrieval.","creator":"perplexity","family":"sonar","tier":"small","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":16384,"max_output_tokens":16384,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-sonar-small-chat","perplexity/sonar-small-chat"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-small-chat","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":0.07,"max_input_per_1m":0.07,"min_output_per_1m":0.28,"max_output_per_1m":0.28,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":["perplexity"],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"perplexity-sonar-small-online","name":"sonar-small-online","display_name":"Sonar Small Online","description":"A compact Sonar model with real-time web search, providing fast and affordable online question-answering at small scale.","creator":"perplexity","family":"sonar","tier":"small","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":12000,"max_output_tokens":12000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["perplexity-sonar-small-online","perplexity/sonar-small-online"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30","pricing":{"model_id":"perplexity-sonar-small-online","currency":"USD","exchange_rate":1,"exchange_rate_date":"2026-06-13","ingestion_date":"2026-06-13","summary":{"currency":"USD","min_input_per_1m":null,"max_input_per_1m":null,"min_output_per_1m":0.28,"max_output_per_1m":0.28,"min_cache_read_per_1m":null,"min_cache_write_per_1m":null,"min_reasoning_per_1m":null,"cheapest_providers":[],"provider_count":1},"providers":[],"regions":[],"region_info":{}}},{"id":"tavily-search","name":"search","display_name":"Tavily Search","description":"A real-time web search API optimized for AI agents, returning structured, relevant results from live web sources.","creator":"tavily","family":"tavily","tier":"","version":null,"type":"language","size_in_bn":null,"modalities":{"input":["text"],"output":["text"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":7,"ids":["dataforseo/search","duckduckgo/search","exa_ai/search","firecrawl/search","google_pse/search","linkup/search","parallel_ai/search","perplexity/search","searxng/search","serper/search","tavily-search","tavily/search"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-13 08:02:30"}],"pagination":{"page_size":50,"has_next":false,"next_token":null,"total_count":23},"meta":{"updated_at":"2026-06-13","request_id":"98d64f93-32fb-4beb-91e9-1b89e54a208f","execution_ms":10}}