{"data":[{"id":"self_hosted","name":"Self-hosted","description":"Models with downloadable open weights — runnable on your own infrastructure. Not a hosted inference provider.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":false,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":["open-weights","self-hosted"],"modalities":[],"model_count":156,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":null,"synthetic":true},{"id":"aisingapore","name":"AI Singapore","description":"National AI program for Singapore. Creator of the SEA-LION family of open-weight models covering Southeast Asian languages and the English-based Llama-SEA variants.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/aisingapore.png"},{"id":"ai21_labs","name":"AI21 Labs","description":"AI21 builds Foundation Models and AI Systems for the enterprise. Power your most critical enterprise workflows with accurate, reliable, and scalable AI.","url":"https://www.ai21.com","api_base_url":"https://api.ai21.com/studio/v1","docs_url":"https://docs.ai21.com/docs/models-overview","pricing_url":"https://www.ai21.com/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["ai21"],"tags":["enterprise","long-context","mamba","rag"],"modalities":["text"],"model_count":10,"priced_model_count":10,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/ai21_labs.png"},{"id":"aiml","name":"AI/ML API","description":"One API for 500+ AI models: GPT-5.5, Claude Opus 4.7, Gemini 3.5, DeepSeek v4, Seedance. Save up to 80% vs OpenAI & Anthropic. No token limits. Free playground.","url":"https://aimlapi.com","api_base_url":"https://api.aimlapi.com/v1","docs_url":"https://docs.aimlapi.com","pricing_url":"https://aimlapi.com/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["aiml"],"tags":["aggregator","free-tier","image-generation","multimodal"],"modalities":["audio","embedding","image","text"],"model_count":12,"priced_model_count":12,"pricing_tiers":["standard"],"pricing_dimensions":["image_output"],"icon_url":"/images/providers/favicons/aiml.png"},{"id":"alibaba_qwen","name":"Alibaba Qwen","description":"Supercharge Your AI Journey Effortlessly With Industry-Leading GenAI Models","url":"https://www.alibabacloud.com/product/modelstudio","api_base_url":"https://dashscope-intl.aliyuncs.com/compatible-mode/v1","docs_url":"https://www.alibabacloud.com/help/en/model-studio/getting-started/models","pricing_url":"https://www.alibabacloud.com/help/en/model-studio/getting-started/models","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["dashscope"],"tags":["code","low-cost","multimodal","open-weight","reasoning"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":98,"priced_model_count":98,"pricing_tiers":["batch","standard"],"pricing_dimensions":["input","output","reasoning_output"],"icon_url":"/images/providers/favicons/alibaba_qwen.png"},{"id":"amazon_bedrock","name":"Amazon Bedrock","description":"Amazon Bedrock: The platform for building generative AI applications and agents at production scale","url":"https://aws.amazon.com/bedrock","api_base_url":"https://bedrock-runtime.{region}.amazonaws.com","docs_url":"https://docs.aws.amazon.com/bedrock/latest/userguide","pricing_url":"https://aws.amazon.com/bedrock/pricing","own_models":true,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["bedrock"],"tags":["agents","cloud","enterprise","fine-tuning","guardrails","knowledge-base","regional"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":138,"priced_model_count":138,"pricing_tiers":["batch","flex","latency_optimized","priority","standard"],"pricing_dimensions":["audio_input","audio_output","cache_read","cache_write_1h","cache_write_5m","image_input","image_output","image_output_512","image_output_512_premium","image_output_premium","input","output","query","video_input","video_output"],"icon_url":"/images/providers/favicons/amazon_bedrock.png"},{"id":"amazon_nova","name":"Amazon Nova","description":"Amazon Nova is a family of foundation models and services that delivers frontier intelligence and industry-leading price performance.","url":"https://aws.amazon.com/nova/","api_base_url":"https://bedrock-runtime.{region}.amazonaws.com","docs_url":"https://docs.aws.amazon.com/nova/latest/userguide/what-is-nova.html","pricing_url":"https://aws.amazon.com/bedrock/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["amazon_nova","amazon-nova"],"tags":["fast","low-cost","multimodal"],"modalities":["image","pdf","text","video"],"model_count":4,"priced_model_count":4,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/amazon_nova.png"},{"id":"amazon_sagemaker","name":"AWS SageMaker","description":"The next generation of Amazon SageMaker is the center for all your data, analytics, and AI","url":"https://aws.amazon.com/sagemaker","api_base_url":"https://runtime.sagemaker.{region}.amazonaws.com","docs_url":"https://docs.aws.amazon.com/sagemaker/latest/dg/jumpstart-foundation-models.html","pricing_url":"https://aws.amazon.com/sagemaker/pricing","own_models":false,"hosts_platform":true,"openai_compatible":false,"litellm_provider":["sagemaker"],"tags":["cloud","enterprise","fine-tuning","gpu-instances","jumpstart","ml-platform"],"modalities":["audio","embedding","image","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/amazon_sagemaker.png"},{"id":"anthropic","name":"Anthropic","description":"Anthropic is an AI safety and research company that's working to build reliable, interpretable, and steerable AI systems.","url":"https://anthropic.com","api_base_url":"https://api.anthropic.com/v1","docs_url":"https://docs.anthropic.com/en/docs/about-claude/models/overview","pricing_url":"https://platform.claude.com/docs/en/about-claude/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["anthropic"],"tags":["frontier","long-context","prompt-caching","reasoning","safety"],"modalities":["image","pdf","text"],"model_count":17,"priced_model_count":17,"pricing_tiers":["batch","standard"],"pricing_dimensions":["cache_read","cache_write_1h","cache_write_5m","input","output"],"icon_url":"/images/providers/favicons/anthropic.png"},{"id":"arcee_ai","name":"Arcee AI","description":"Specialist in small language models (SLMs) and model merging. Creator of the Arcee Spark, Maestro, and Virtuoso model families, fine-tuned for business and agentic use cases.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/arcee_ai.png"},{"id":"baichuan_ai","name":"Baichuan AI","description":"Chinese AI company and creator of the Baichuan model series, including Baichuan2 and Baichuan3 bilingual (Chinese-English) large language models.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/baichuan_ai.png"},{"id":"baidu","name":"Baidu","description":"Chinese internet company and creator of ERNIE (Enhanced Representation through Knowledge Integration), including ERNIE Bot, ERNIE 4.0, and the ERNIE Speed/Lite series.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/baidu.png"},{"id":"black_forest_labs","name":"Black Forest Labs","description":"Black Forest Labs is building visual intelligence: models that understand, reason, and act in the world. Use FLUX models via our API.","url":"https://blackforestlabs.ai","api_base_url":"https://api.bfl.ml/v1","docs_url":"https://docs.bfl.ml","pricing_url":"https://docs.bfl.ml/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["black_forest_labs"],"tags":["diffusion","flux","image-generation","open-weight"],"modalities":["image","text"],"model_count":8,"priced_model_count":8,"pricing_tiers":["standard"],"pricing_dimensions":["image_output"],"icon_url":"/images/providers/favicons/black_forest_labs.png"},{"id":"bria_ai","name":"Bria AI","description":"Enterprise visual AI company focused on responsible generation. Creator of BRIA RMBG (background removal) and BRIA text-to-image foundation models with commercial licensing.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/bria_ai.png"},{"id":"bsc_lt","name":"BSC-LT","description":"Language Technologies unit of the Barcelona Supercomputing Center. Creator of the FLOR and Atalaya multilingual models with focus on Spanish, Catalan, and Basque.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/bsc_lt.png"},{"id":"volcengine","name":"Volcengine (ByteDance)","description":"ByteDance's cloud platform offering the Doubao model family and third-party models via the Ark inference service. Doubao-Pro and Doubao-Lite cover a range of cost and capability trade-offs. Dominant in China; international access available via the VolcEngine API.","url":"https://www.volcengine.com/product/ark","api_base_url":"https://ark.cn-beijing.volces.com/api/v3","docs_url":"https://www.volcengine.com/docs/82379/1263482","pricing_url":"https://www.volcengine.com/docs/82379/1099320","own_models":true,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["volcengine"],"tags":["chinese","doubao","low-cost","multimodal"],"modalities":["audio","embedding","image","text","video"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/volcengine.png"},{"id":"cerebras","name":"Cerebras","description":"Cerebras is the go-to platform for fast and effortless AI training. Learn more at cerebras.ai.","url":"https://cerebras.ai","api_base_url":"https://api.cerebras.ai/v1","docs_url":"https://inference-docs.cerebras.ai/introduction","pricing_url":"https://cerebras.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["cerebras"],"tags":["fast-inference","open-weight","ultra-fast","wafer-scale"],"modalities":["image","pdf","text"],"model_count":7,"priced_model_count":7,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/cerebras.png"},{"id":"cloudflare_workers_ai","name":"Cloudflare Workers AI","description":"Run machine learning models, powered by serverless GPUs, on Cloudflare's global network.","url":"https://developers.cloudflare.com/workers-ai","api_base_url":"https://api.cloudflare.com/client/v4/accounts/{account_id}/ai/run","docs_url":"https://developers.cloudflare.com/workers-ai/models","pricing_url":"https://developers.cloudflare.com/workers-ai/platform/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["cloudflare"],"tags":["edge","low-latency","open-source","serverless"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":57,"priced_model_count":57,"pricing_tiers":["standard"],"pricing_dimensions":["audio_input","cache_read","image_input","image_output","input","output","request"],"icon_url":"/images/providers/favicons/cloudflare.png"},{"id":"cohere","name":"Cohere","description":"Cohere builds powerful models and AI solutions enabling enterprises to automate processes, empower employees, and turn fragmented data into actionable insights.","url":"https://cohere.com","api_base_url":"https://api.cohere.com/v2","docs_url":"https://docs.cohere.com/docs/models","pricing_url":"https://cohere.com/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["cohere"],"tags":["embeddings","enterprise","rag","rerank","search"],"modalities":["embedding","image","text"],"model_count":24,"priced_model_count":24,"pricing_tiers":["batch","standard"],"pricing_dimensions":["image_input","input","output","query"],"icon_url":"/images/providers/favicons/cohere.png"},{"id":"databricks","name":"Databricks","description":"Databricks offers a unified platform for data, analytics and AI. Build better AI with a data-centric approach. Simplify ETL, data warehousing, governance and AI on the Data Intelligence Platform.","url":"https://www.databricks.com","api_base_url":"https://{workspace}.azuredatabricks.net/serving-endpoints","docs_url":"https://docs.databricks.com/en/machine-learning/foundation-models","pricing_url":"https://www.databricks.com/product/foundation-model-api","own_models":true,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["databricks"],"tags":["data-platform","enterprise","fine-tuning","lakehouse","open-weight"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":28,"priced_model_count":28,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/databricks.png"},{"id":"deepinfra","name":"DeepInfra","description":"DeepInfra offers cost-effective, scalable, easy-to-deploy, and production-ready machine-learning models and infrastructures for deep-learning models.","url":"https://deepinfra.com","api_base_url":"https://api.deepinfra.com/v1/openai","docs_url":"https://deepinfra.com/models","pricing_url":"https://deepinfra.com/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["deepinfra"],"tags":["low-cost","open-source","serverless"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":64,"priced_model_count":64,"pricing_tiers":["standard"],"pricing_dimensions":["cache_read","input","output"],"icon_url":"/images/providers/favicons/deepinfra.png"},{"id":"deepgram","name":"Deepgram","description":"Power enterprise voice solutions with Deepgram’s Speech-to-Text, Text-to-Speech, and Voice Agent APIs. Real-time, accurate, and built for scale.","url":"https://deepgram.com","api_base_url":"https://api.deepgram.com/v1","docs_url":"https://developers.deepgram.com/docs/introduction","pricing_url":"https://deepgram.com/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["deepgram"],"tags":["diarisation","real-time","speech-to-text","transcription","voice-ai"],"modalities":["audio","text"],"model_count":36,"priced_model_count":36,"pricing_tiers":["standard"],"pricing_dimensions":["audio_input"],"icon_url":"/images/providers/favicons/deepgram.png"},{"id":"deepseek","name":"DeepSeek","description":"DeepSeek, unravel the mystery of AGI with curiosity. Answer the essential question with long-termism.","url":"https://www.deepseek.com","api_base_url":"https://api.deepseek.com/v1","docs_url":"https://api-docs.deepseek.com","pricing_url":"https://api-docs.deepseek.com/quick_start/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["deepseek"],"tags":["frontier","low-cost","open-weight","reasoning"],"modalities":["image","pdf","text"],"model_count":6,"priced_model_count":6,"pricing_tiers":["batch","standard"],"pricing_dimensions":["cache_read","input","output"],"icon_url":"/images/providers/favicons/deepseek.png"},{"id":"eleutherai","name":"EleutherAI","description":"Open-source AI research collective and creator of GPT-NeoX, Pythia, and related open models. Focused on interpretability and democratizing AI research.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/eleutherai.png"},{"id":"elevenlabs","name":"ElevenLabs","description":"Create lifelike speech with our AI voice generator and voice agents platform. Access 5,000+ voices in 70+ languages with secure APIs and SDKs.","url":"https://elevenlabs.io","api_base_url":"https://api.elevenlabs.io/v1","docs_url":"https://elevenlabs.io/docs/api-reference/introduction","pricing_url":"https://elevenlabs.io/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["elevenlabs"],"tags":["dubbing","real-time","text-to-speech","voice-cloning"],"modalities":["audio","text"],"model_count":4,"priced_model_count":4,"pricing_tiers":["standard"],"pricing_dimensions":["audio_input"],"icon_url":"/images/providers/favicons/elevenlabs.png"},{"id":"fal","name":"fal.ai","description":"Easiest & most cost-effective way to use Gen AI. fal.ai is how devs integrate dozens of generative media models. FLUX, Kling, Hailuo +1000 more","url":"https://fal.ai","api_base_url":"https://fal.run","docs_url":"https://fal.ai/docs","pricing_url":"https://fal.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":false,"litellm_provider":["fal_ai"],"tags":["diffusion","image-generation","lora","serverless","video-generation"],"modalities":["audio","image","pdf","text","video"],"model_count":9,"priced_model_count":9,"pricing_tiers":["standard"],"pricing_dimensions":["image_output"],"icon_url":"/images/providers/favicons/fal.png"},{"id":"featherless_ai","name":"Featherless AI","description":"Freedom to reliably deploy any open model effortlessly.","url":"https://featherless.ai","api_base_url":"https://api.featherless.ai/v1","docs_url":"https://featherless.ai/docs","pricing_url":"https://featherless.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["featherless_ai"],"tags":["low-cost","open-source","serverless"],"modalities":["text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/featherless_ai.png"},{"id":"fireworks_ai","name":"Fireworks AI","description":"Use state-of-the-art, open-source LLMs and image models at blazing fast speed, or fine-tune and deploy your own at no additional cost with Fireworks AI!","url":"https://fireworks.ai","api_base_url":"https://api.fireworks.ai/inference/v1","docs_url":"https://docs.fireworks.ai/models/overview","pricing_url":"https://fireworks.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["fireworks_ai"],"tags":["enterprise","fast-inference","open-source","structured-outputs"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":232,"priced_model_count":232,"pricing_tiers":["standard"],"pricing_dimensions":["cache_read","input","output"],"icon_url":"/images/providers/favicons/fireworks_ai.png"},{"id":"friendliai","name":"FriendliAI","description":"FriendliAI is The Frontier AI Inference Cloud. Built by the researchers who invented the continuous batching technique that is now industry standard, FriendliAI provides AI engineers with a highly optimized engine that constantly evolves to efficiently run state-of-the-art open-weight and custom models at production scale. By maximizing GPU utilization, FriendliAI delivers speeds up to 3x faster than vLLM, and 50% to 90% cost savings relative to closed model APIs. FriendliAI empowers engineers to deploy frontier AI with uncompromising speed, model ownership, and enterprise-grade reliability.","url":"https://friendli.ai","api_base_url":"https://inference.friendli.ai/v1","docs_url":"https://docs.friendli.ai","pricing_url":"https://friendli.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["friendliai"],"tags":["high-throughput","low-latency","open-source"],"modalities":["image","text"],"model_count":2,"priced_model_count":2,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/friendliai.png"},{"id":"github_models","name":"GitHub Models","description":"GitHub is where people build software. More than 150 million people use GitHub to discover, fork, and contribute to over 420 million projects.","url":"https://github.com/marketplace/models","api_base_url":"https://models.inference.ai.azure.com","docs_url":"https://docs.github.com/en/github-models","pricing_url":"https://docs.github.com/en/github-models/prototyping-with-ai-models#rate-limits","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["github_copilot"],"tags":["azure-backed","developer","free-tier","openai-compatible"],"modalities":["embedding","image","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/github_models.png"},{"id":"gmi","name":"GMI Cloud","description":"Singapore-based GPU cloud offering serverless inference for a broad catalog of open-weight and frontier models. Hosts Qwen, MiniMax, DeepSeek, Llama, and others with OpenAI-compatible endpoints. Focuses on Asia-Pacific availability and competitive pricing.","url":"https://gmi.ai","api_base_url":"https://api.gmi.ai/v1","docs_url":"https://docs.gmi.ai","pricing_url":"https://gmi.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["gmi"],"tags":["asia-pacific","gpu-cloud","low-cost","open-source","serverless"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":17,"priced_model_count":17,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/gmi.png"},{"id":"google_gemini","name":"Google Gemini","description":"Build with Gemini 2.0 Flash, 2.5 Pro, and Gemma using the Gemini API and Google AI Studio.","url":"https://ai.google.dev","api_base_url":"https://generativelanguage.googleapis.com/v1beta","docs_url":"https://ai.google.dev/gemini-api/docs/models","pricing_url":"https://ai.google.dev/gemini-api/docs/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["gemini","palm"],"tags":["frontier","grounding","image-generation","long-context","multimodal","reasoning"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":146,"priced_model_count":146,"pricing_tiers":["batch","flex","priority","standard"],"pricing_dimensions":["audio_input","audio_output","cache_read","cache_write","image_input","image_output","input","output","reasoning_output","video_input","video_output"],"icon_url":"/images/providers/favicons/google_gemini.png"},{"id":"google_vertex_ai","name":"Google Vertex AI","description":"Gemini Enterprise Agent Platform (formerly Vertex AI) is a comprehensive platform for developers to build, scale, govern and optimize agents.","url":"https://cloud.google.com/vertex-ai","api_base_url":"https://us-central1-aiplatform.googleapis.com/v1","docs_url":"https://cloud.google.com/vertex-ai/generative-ai/docs/models","pricing_url":"https://cloud.google.com/vertex-ai/generative-ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["vertex_ai-language-models"],"tags":["cloud","enterprise","fine-tuning","model-garden","multimodal","regional"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":176,"priced_model_count":176,"pricing_tiers":["batch","flex","priority","standard"],"pricing_dimensions":["audio_input","audio_output","cache_read","cache_write","cache_write_5m","image_input","image_output","input","output","page_input","reasoning_output","video_input","video_output"],"icon_url":"/images/providers/favicons/google_vertex_ai.png"},{"id":"gradient_ai","name":"Gradient AI","description":"Hyperagent is the system of agents that does real work, learns how your organization operates, and deploys across your entire team.","url":"https://gradient.ai","api_base_url":"https://api.gradient.ai/v1","docs_url":"https://docs.gradient.ai","pricing_url":"https://gradient.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["gradient_ai"],"tags":["aggregator","compliance","enterprise","model-routing"],"modalities":["image","pdf","text"],"model_count":10,"priced_model_count":10,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/gradient_ai.png"},{"id":"groq","name":"Groq","description":"The Groq LPU delivers inference with the speed and cost developers need.","url":"https://groq.com","api_base_url":"https://api.groq.com/openai/v1","docs_url":"https://console.groq.com/docs/models","pricing_url":"https://groq.com/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["groq"],"tags":["fast-inference","low-latency","lpu","open-weight"],"modalities":["audio","image","text"],"model_count":14,"priced_model_count":14,"pricing_tiers":["standard"],"pricing_dimensions":["audio_input","cache_read","input","output"],"icon_url":"/images/providers/favicons/groq.png"},{"id":"huggingface","name":"Hugging Face","description":"We’re on a journey to advance and democratize artificial intelligence through open source and open science.","url":"https://huggingface.co","api_base_url":"https://api-inference.huggingface.co","docs_url":"https://huggingface.co/docs/inference-endpoints","pricing_url":"https://huggingface.co/pricing","own_models":false,"hosts_platform":true,"openai_compatible":false,"litellm_provider":[],"tags":["community","hub","inference-endpoints","model-registry","open-source"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":94,"priced_model_count":94,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/huggingface.png"},{"id":"hyperbolic","name":"Hyperbolic","description":"Access open-source inference and compute at a fraction of the cost. Build with us.","url":"https://hyperbolic.xyz","api_base_url":"https://api.hyperbolic.xyz/v1","docs_url":"https://docs.hyperbolic.xyz/docs/getting-started","pricing_url":"https://app.hyperbolic.xyz/models","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["hyperbolic"],"tags":["gpu-cloud","low-cost","open-source","serverless"],"modalities":["image","pdf","text"],"model_count":16,"priced_model_count":16,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/hyperbolic.png"},{"id":"ibm_watsonx","name":"IBM watsonx","description":"IBM watsonx is a portfolio of AI products that accelerates the impact of generative AI in core workflows to drive productivity.","url":"https://www.ibm.com/watsonx","api_base_url":"https://{region}.ml.cloud.ibm.com/ml/v1","docs_url":"https://ibm.github.io/watsonx-ai-python-sdk/models.html","pricing_url":"https://www.ibm.com/products/watsonx-ai/pricing","own_models":true,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["watsonx"],"tags":["compliance","enterprise","explainability","granite","regulated-industries"],"modalities":["audio","embedding","image","pdf","text"],"model_count":29,"priced_model_count":29,"pricing_tiers":["standard"],"pricing_dimensions":["audio_input","audio_output","input","output"],"icon_url":"/images/providers/favicons/ibm_watsonx.png"},{"id":"imagineart","name":"ImagineArt","description":"AI image generation platform and creator of ImagineArt models for creative image synthesis.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/imagineart.png"},{"id":"jetbrains","name":"Jetbrains","description":"Developer tools company and creator of Mellum, a code completion language model trained on code repositories and optimized for IDE integration.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/jetbrains.png"},{"id":"krea_ai","name":"Krea AI","description":"Creative AI platform and model developer. Creator of Krea image and video generation models designed for real-time creative workflows.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/krea_ai.png"},{"id":"kwaipilot","name":"KwaiPilot","description":"Kuaishou's AI research arm. Creator of the Kwaipilot and Wan video/image generation models, including Wan2.1 video synthesis and image-to-video capabilities.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/kwaipilot.png"},{"id":"lambda","name":"Lambda","description":"Cloud GPUs, on-demand clusters, private cloud, and hardware for AI training and inference. Run B200 and H100, deploy fast, and scale cost effectively.","url":"https://lambdalabs.com","api_base_url":"https://api.lambdalabs.com/v1","docs_url":"https://docs.lambdalabs.com/inference","pricing_url":"https://lambdalabs.com/service/gpu-cloud","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["lambda_ai"],"tags":["gpu-cloud","open-source","serverless","training"],"modalities":["image","pdf","text"],"model_count":20,"priced_model_count":20,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/lambda.png"},{"id":"leonardo_ai","name":"Leonardo AI","description":"Creative AI platform and creator of Leonardo models for high-fidelity image generation, style-transfer, and asset production for games and media.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/leonardo_ai.png"},{"id":"lgresearch","name":"LG Research","description":"LG AI Research lab and creator of EXAONE, a bilingual (Korean-English) large language model family focused on enterprise and reasoning tasks.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/lgresearch.png"},{"id":"lighton","name":"LightOn","description":"French enterprise AI company and creator of Alfred, a large language model family optimized for European enterprise use cases and multilingual support.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/lighton.png"},{"id":"lmnt","name":"LMNT","description":"Voice synthesis company and creator of LMNT TTS models with low-latency streaming speech synthesis and custom voice cloning.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/lmnt.png"},{"id":"luma","name":"Luma","description":"Your creative team becomes prolific with Luma Agents","url":"https://lumalabs.ai","api_base_url":"https://api.lumalabs.ai/dream-machine/v1","docs_url":"https://docs.lumalabs.ai","pricing_url":"https://lumalabs.ai/dream-machine/api/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":["cinematic","image-generation","video-generation"],"modalities":["image","video"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/luma.png"},{"id":"meituan","name":"Meituan","description":"Chinese technology company. Creator of the Meituan AI models including vision-language models for e-commerce and service recommendation tasks.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/meituan.png"},{"id":"meta","name":"Meta","description":"Creator of the Llama open-weight model series. Llama 3.x and 4 models are widely deployed across inference providers, cloud platforms, and on-premise installations. Meta releases model weights publicly under the Llama Community License. No direct API — access via platforms and inference providers.","url":"https://llama.meta.com","api_base_url":null,"docs_url":"https://www.llama.com/docs/overview","pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["meta_llama"],"tags":["frontier","multimodal","open-weight","widely-deployed"],"modalities":["image","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/meta.png"},{"id":"microsoft","name":"Microsoft","description":"Microsoft Research AI division. Creator of the Phi small language model series (Phi-1 through Phi-4), demonstrating strong reasoning on par with much larger models through quality data curation.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/microsoft.png"},{"id":"azure_aifoundry","name":"Azure AI Foundry","description":"Microsoft Foundry","url":"https://ai.azure.com","api_base_url":"https://{endpoint}.services.ai.azure.com/models","docs_url":"https://learn.microsoft.com/en-us/azure/ai-foundry/model-inference/overview","pricing_url":"https://azure.microsoft.com/en-us/pricing/details/ai-foundry/","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["azure"],"tags":["cloud","compliance","enterprise","maas","openai-compatible","serverless"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":237,"priced_model_count":237,"pricing_tiers":["batch","standard"],"pricing_dimensions":["audio_input","audio_output","cache_read","cache_write_5m","image_input","image_output","input","output","page_input","query","video_output"],"icon_url":"/images/providers/favicons/azure_aifoundry.png"},{"id":"minimax","name":"MiniMax","description":"Building AGI with our mission Intelligence with Everyone. Global leader in multi-modal models and AI-native products with over 200 million users.","url":"https://www.minimax.io","api_base_url":"https://api.minimax.chat/v1","docs_url":"https://platform.minimaxi.com/document/models","pricing_url":"https://www.minimax.io/price","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["minimax"],"tags":["chinese","long-context","multimodal","video-generation"],"modalities":["audio","image","pdf","text","video"],"model_count":10,"priced_model_count":10,"pricing_tiers":["standard"],"pricing_dimensions":["audio_input","cache_read","cache_write_5m","input","output"],"icon_url":"/images/providers/favicons/minimax.png"},{"id":"mistral","name":"Mistral AI","description":"The most powerful AI platform for enterprises. Customize, fine-tune, and deploy AI assistants, autonomous agents, and multimodal AI with open models.","url":"https://mistral.ai","api_base_url":"https://api.mistral.ai/v1","docs_url":"https://docs.mistral.ai/models","pricing_url":"https://mistral.ai/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["mistral","codestral","text-completion-codestral"],"tags":["agents","code","european","open-weight","reasoning"],"modalities":["audio","embedding","image","pdf","text"],"model_count":33,"priced_model_count":33,"pricing_tiers":["batch","standard"],"pricing_dimensions":["input","output","page_input"],"icon_url":"/images/providers/favicons/mistral.png"},{"id":"moonshot_ai","name":"Moonshot AI (Kimi)","description":"Chinese AI company creator of the Kimi model family. Kimi k1.5 and k2 are strong reasoning models with long context. Kimi VL handles vision tasks. Known for efficient long-document processing. Direct API available globally via Moonshot's platform.","url":"https://www.moonshot.cn","api_base_url":"https://api.moonshot.cn/v1","docs_url":"https://platform.moonshot.cn/docs/intro","pricing_url":"https://platform.moonshot.cn/docs/pricing/chat","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["moonshot"],"tags":["chinese","long-context","reasoning"],"modalities":["image","pdf","text","video"],"model_count":18,"priced_model_count":18,"pricing_tiers":["standard"],"pricing_dimensions":["cache_read","input","output"],"icon_url":"/images/providers/favicons/moonshot_ai.png"},{"id":"myshell","name":"MyShell","description":"Conversational AI and creator of MyShell TTS and voice AI models for interactive agents and voice cloning applications.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/myshell.png"},{"id":"nebius","name":"Nebius","description":"Build and scale faster on the purpose-built AI cloud, engineered from silicon to API.","url":"https://nebius.com/ai-studio","api_base_url":"https://api.studio.nebius.com/v1","docs_url":"https://studio.nebius.com/docs","pricing_url":"https://nebius.com/ai-studio/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["nebius"],"tags":["european","gpu-cloud","open-source","serverless"],"modalities":["embedding","image","pdf","text"],"model_count":30,"priced_model_count":30,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/nebius.png"},{"id":"neuphonic","name":"Neuphonic","description":"Speech AI company and creator of Neuphonic TTS models, offering low-latency multilingual text-to-speech with expressive voice control.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/neuphonic.png"},{"id":"nlp_cloud","name":"NLP Cloud","description":"API platform for deploying NLP and LLM models including text generation, summarisation, sentiment analysis, and named entity recognition. Hosts open-source models and provides fine-tuning capabilities. Simple REST API with pay-as-you-go pricing.","url":"https://nlpcloud.com","api_base_url":"https://api.nlpcloud.io/v1","docs_url":"https://docs.nlpcloud.com","pricing_url":"https://nlpcloud.com/ai-api-pricing.html","own_models":false,"hosts_platform":true,"openai_compatible":false,"litellm_provider":["nlp_cloud"],"tags":["fine-tuning","nlp","open-source"],"modalities":["text"],"model_count":1,"priced_model_count":1,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/nlp_cloud.png"},{"id":"nomic_ai","name":"Nomic AI","description":"Creator of nomic-embed-text, high-performance open-source text embedding models optimized for retrieval, clustering, and semantic search.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/nomic_ai.png"},{"id":"novita","name":"Novita","description":"Novita AI provides 200+ Model APIs, custom deployment, GPU Instances, and Serverless GPUs. Scale AI, optimize performance, and innovate with ease and efficiency.","url":"https://novita.ai","api_base_url":"https://api.novita.ai/v3/openai","docs_url":"https://novita.ai/docs/model-list","pricing_url":"https://novita.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["novita"],"tags":["fine-tuning","lora","low-cost","open-source","serverless"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":85,"priced_model_count":85,"pricing_tiers":["standard"],"pricing_dimensions":["cache_read","input","output"],"icon_url":"/images/providers/favicons/novita.png"},{"id":"nscale","name":"Nscale","description":"Nscale full-stack AI cloud platform and services are designed for scale, resilience, and speed.","url":"https://nscale.com","api_base_url":"https://inference.api.nscale.com/v1","docs_url":"https://docs.nscale.com","pricing_url":"https://nscale.com/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["nscale"],"tags":["european","gpu-cloud","image-generation","open-source","serverless"],"modalities":["embedding","image","text"],"model_count":14,"priced_model_count":14,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/nscale.png"},{"id":"nvidia","name":"NVIDIA","description":"The building blocks of AI. Learn more.","url":"https://www.nvidia.com/en-us/ai","api_base_url":"https://integrate.api.nvidia.com/v1","docs_url":"https://docs.nvidia.com/nim/index.html","pricing_url":"https://build.nvidia.com/nim","own_models":true,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["nvidia_nim"],"tags":["containers","enterprise","gpu-optimised","open-weight","self-hosted"],"modalities":["embedding","image","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/nvidia.png"},{"id":"ollama","name":"Ollama","description":"Ollama is the easiest way to automate your work using open models, while keeping your data safe.","url":"https://ollama.com","api_base_url":"http://localhost:11434","docs_url":"https://github.com/ollama/ollama/blob/main/docs/api.md","pricing_url":null,"own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["ollama"],"tags":["free","local","open-source","privacy","self-hosted"],"modalities":["embedding","image","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/ollama.png"},{"id":"openai","name":"OpenAI","description":"Creator of GPT-4o, o3, and the GPT model family. Offers text, vision, audio, image generation, speech, and embedding models via a REST API. Pioneered the modern LLM API interface now widely adopted as the de-facto standard.","url":"https://openai.com","api_base_url":"https://api.openai.com/v1","docs_url":"https://platform.openai.com/docs/models","pricing_url":"https://developers.openai.com/api/docs/pricing/","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["openai","chatgpt","text-completion-openai"],"tags":["frontier","image-generation","multimodal","reasoning","speech"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":88,"priced_model_count":88,"pricing_tiers":["batch","flex","priority","standard"],"pricing_dimensions":["audio_input","audio_output","cache_read","cache_write_5m","image_input","image_output","image_output_premium","input","output","video_output"],"icon_url":"/images/providers/favicons/openai.png"},{"id":"openrouter","name":"OpenRouter","description":"The unified interface for LLMs. Find the best models & prices for your prompts","url":"https://openrouter.ai","api_base_url":"https://openrouter.ai/api/v1","docs_url":"https://openrouter.ai/docs","pricing_url":"https://openrouter.ai/models","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["openrouter"],"tags":["failover","gateway","model-routing","openai-compatible","unified-api"],"modalities":["audio","image","pdf","text","video"],"model_count":300,"priced_model_count":300,"pricing_tiers":["batch","standard"],"pricing_dimensions":["audio_input","cache_read","cache_write_5m","image_input","input","output","reasoning_output","web_search"],"icon_url":"/images/providers/favicons/openrouter.png"},{"id":"oracle_oci","name":"Oracle Cloud (OCI)","description":"Transform your business with generative AI, and unlock a new era of productivity with task automation and end-to-end AI solutions for enterprise customers.","url":"https://www.oracle.com/artificial-intelligence/generative-ai","api_base_url":"https://inference.generativeai.{region}.oci.oraclecloud.com","docs_url":"https://docs.oracle.com/en-us/iaas/Content/generative-ai/overview.htm","pricing_url":"https://www.oracle.com/artificial-intelligence/generative-ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":false,"litellm_provider":["oci"],"tags":["cloud","compliance","enterprise","private-networking"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":41,"priced_model_count":41,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/oracle_oci.png"},{"id":"ovhcloud","name":"OVHcloud","description":"Discover the generative AI APIs offered by OVHcloud. High-performing, easy to integrate, and secure, for application power.","url":"https://www.ovhcloud.com/en/public-cloud/ai-endpoints/","api_base_url":"https://oai.endpoints.kepler.ai.cloud.ovh.net/v1","docs_url":"https://docs.ovh.com/gb/en/publiccloud/ai","pricing_url":"https://www.ovhcloud.com/en/public-cloud/ai-endpoints","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["ovhcloud"],"tags":["cloud","european","gdpr","open-source","privacy"],"modalities":["embedding","image","text"],"model_count":14,"priced_model_count":14,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/ovhcloud.png"},{"id":"perplexity","name":"Perplexity","description":"AI company best known for its search assistant. Also offers the Sonar model family via API: Sonar (fast, grounded), Sonar Pro (more capable), and Sonar Reasoning (chain-of-thought). All models include real-time web search grounding by default.","url":"https://www.perplexity.ai","api_base_url":"https://api.perplexity.ai","docs_url":"https://docs.perplexity.ai/models/model-cards","pricing_url":"https://docs.perplexity.ai/guides/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["perplexity"],"tags":["reasoning","search-grounding","web-search"],"modalities":["embedding","image","text"],"model_count":25,"priced_model_count":25,"pricing_tiers":["batch","standard"],"pricing_dimensions":["input","output","query","reasoning_output","request"],"icon_url":"/images/providers/favicons/perplexity.png"},{"id":"pika_labs","name":"Pika Labs","description":"AI video generation company and creator of Pika, a consumer and API-accessible platform for text-to-video and image-to-video synthesis.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/pika_labs.png"},{"id":"pixverse_ai","name":"PixVerse AI","description":"Video generation platform and creator of PixVerse models for high-quality text-to-video and image-to-video generation with strong motion dynamics.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/pixverse_ai.png"},{"id":"playground_ai","name":"Playground AI","description":"Image generation platform and creator of Playground v2.5 and v3 models, competitive with Stable Diffusion and DALL-E in aesthetic quality.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/playground_ai.png"},{"id":"prime_intellect","name":"Prime Intellect","description":"Decentralized AI training and open research organization. Produces open-weight models including the INTELLECT series trained via distributed collaboration.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/prime_intellect.png"},{"id":"recraft","name":"Recraft","description":"Recraft is a top-ranked text-to-image model and design platform for photorealism, vector generation, custom styles, mockups, and more","url":"https://www.recraft.ai","api_base_url":"https://external.api.recraft.ai/v1","docs_url":"https://www.recraft.ai/docs","pricing_url":"https://www.recraft.ai/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["recraft"],"tags":["image-generation","text-rendering","vector"],"modalities":["image","text"],"model_count":2,"priced_model_count":2,"pricing_tiers":["standard"],"pricing_dimensions":["image_output"],"icon_url":"/images/providers/favicons/recraft.png"},{"id":"replicate","name":"Replicate","description":"Run open-source machine learning models with a cloud API","url":"https://replicate.com","api_base_url":"https://api.replicate.com/v1","docs_url":"https://replicate.com/docs","pricing_url":"https://replicate.com/pricing","own_models":false,"hosts_platform":true,"openai_compatible":false,"litellm_provider":["replicate"],"tags":["community","image-generation","open-source","video-generation"],"modalities":["audio","image","pdf","text","video"],"model_count":40,"priced_model_count":40,"pricing_tiers":["standard"],"pricing_dimensions":["input","output","reasoning_output"],"icon_url":"/images/providers/favicons/replicate.png"},{"id":"reve_image","name":"Reve Image","description":"AI image generation platform and creator of Reve Image models optimized for photorealistic and artistic image synthesis.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/reve_image.png"},{"id":"runway","name":"Runway","description":"We are building foundational General World Models that will be capable of simulating all possible worlds and experiences. The next frontier of intelligence will come from models that can understand, perceive, generate and act in the world.","url":"https://runwayml.com","api_base_url":"https://api.dev.runwayml.com/v1","docs_url":"https://docs.dev.runwayml.com","pricing_url":"https://runwayml.com/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["runwayml"],"tags":["cinematic","creative-ai","video-generation"],"modalities":["audio","image","text","video"],"model_count":6,"priced_model_count":6,"pricing_tiers":["standard"],"pricing_dimensions":["audio_input","image_input","image_output","video_output"],"icon_url":"/images/providers/favicons/runway.png"},{"id":"salesforce_research","name":"Salesforce Research","description":"AI research division of Salesforce. Creator of the CodeGen, XGen, and BLIP model families for code generation, long-context reasoning, and vision-language tasks.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/salesforce_research.png"},{"id":"sambanova","name":"SambaNova","description":"Discover SambaNova - the complete AI platform delivering the fastest AI inference, fine-tuning, and scalable solutions for agentic AI easily integrated into existing data center infrastructures.","url":"https://sambanova.ai","api_base_url":"https://api.sambanova.ai/v1","docs_url":"https://docs.sambanova.ai/sambanova-cloud/latest/model-availability","pricing_url":"https://sambanova.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["sambanova"],"tags":["enterprise","fast-inference","open-weight","rdu"],"modalities":["image","pdf","text"],"model_count":15,"priced_model_count":15,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/sambanova.png"},{"id":"sarvam","name":"Sarvam","description":"Sarvam is India's full-stack sovereign AI platform, with speech-to-text, text-to-speech, translation, and conversational agents across 22 Indian languages. Start free.","url":"https://sarvam.ai","api_base_url":"https://api.sarvam.ai","docs_url":"https://docs.sarvam.ai","pricing_url":"https://sarvam.ai/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["sarvam"],"tags":["indic-languages","multilingual","speech"],"modalities":["audio","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/sarvam.png"},{"id":"scaleway","name":"Scaleway","description":"European cloud and GPU-inference provider offering serverless LLM inference via an OpenAI-compatible API with GDPR-compliant EU data residency. Hosts open-source models from Meta, Qwen, Mistral, and others.","url":"https://www.scaleway.com/en/ai-services/","api_base_url":"https://api.scaleway.ai/v1","docs_url":"https://www.scaleway.com/en/docs/ai-data/generative-apis/","pricing_url":"https://www.scaleway.com/en/pricing/generative-apis/","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["scaleway"],"tags":["cloud","european","gdpr","serverless"],"modalities":["text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/scaleway.png"},{"id":"segmind","name":"Segmind","description":"Generative AI platform and model developer. Creator of Segmind SSD and other image generation models, as well as a hosted API for diffusion-based workflows.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/segmind.png"},{"id":"internlm_team","name":"InternLM","description":"Shanghai AI Laboratory team behind InternLM. Creator of the InternLM2 and InternLM3 open-weight model families, including InternVL multimodal variants.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/internlm_team.png"},{"id":"siliconflow","name":"SiliconFlow","description":"Chinese AI inference platform offering a large catalog of open-weight models at competitive prices. Hosts Qwen, DeepSeek, Llama, Mistral, and image generation models. OpenAI-compatible API. Popular in Asia-Pacific region for affordable, high-throughput inference.","url":"https://siliconflow.cn","api_base_url":"https://api.siliconflow.cn/v1","docs_url":"https://docs.siliconflow.cn/docs/getting-started","pricing_url":"https://siliconflow.cn/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":[],"tags":["chinese","high-throughput","low-cost","open-source"],"modalities":["audio","embedding","image","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/siliconflow.png"},{"id":"snowflake","name":"Snowflake","description":"Discover Snowflake Arctic, a breakthrough LLM built for enterprise AI. Enterprise intelligence. Breakthrough efficiency. Truly open.","url":"https://www.snowflake.com/en/data-cloud/arctic","api_base_url":"https://{account}.snowflakecomputing.com/api/v2/cortex/v1","docs_url":"https://docs.snowflake.com/en/user-guide/snowflake-cortex/llm-functions","pricing_url":"https://www.snowflake.com/legal/snowflake-product-and-feature-pricing","own_models":true,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["snowflake"],"tags":["data-cloud","enterprise","open-weight","sql-native"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":61,"priced_model_count":61,"pricing_tiers":["batch","long_context","standard"],"pricing_dimensions":["cache_read","input","output"],"icon_url":"/images/providers/favicons/snowflake.png"},{"id":"speechify","name":"Speechify","description":"Audio content platform and creator of Speechify TTS models, delivering natural-sounding speech synthesis with speaker cloning and multilingual support.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/speechify.png"},{"id":"stability_ai","name":"Stability AI","description":"Stability AI is the enterprise-ready creative partner for teams and creators, delivering professional-grade generative AI tools and solutions for content production at scale.","url":"https://stability.ai","api_base_url":"https://api.stability.ai","docs_url":"https://platform.stability.ai/docs/api-reference","pricing_url":"https://platform.stability.ai/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["stability"],"tags":["diffusion","image-generation","open-weight","video-generation"],"modalities":["audio","image","text","video"],"model_count":22,"priced_model_count":22,"pricing_tiers":["standard"],"pricing_dimensions":["image_output"],"icon_url":"/images/providers/favicons/stability_ai.png"},{"id":"stepfun","name":"StepFun","description":"Chinese AI lab offering the Step series of multimodal frontier models. Step-2 competes with GPT-4-class models on reasoning benchmarks. Step-1V handles vision. Also offers image and video generation capabilities.","url":"https://www.stepfun.com","api_base_url":"https://api.stepfun.com/v1","docs_url":"https://platform.stepfun.com/docs/overview/concept","pricing_url":"https://platform.stepfun.com/docs/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["stepfun"],"tags":["chinese","frontier","image-generation","multimodal"],"modalities":["audio","image","text","video"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/stepfun.png"},{"id":"styletts","name":"StyleTTS","description":"Research team behind StyleTTS and StyleTTS2, open-source human-level text-to-speech models using style diffusion and adversarial training.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/styletts.png"},{"id":"tii","name":"TII","description":"Abu Dhabi-based research institute and creator of the Falcon model family. Produces open-source, state-of-the-art LLMs including Falcon 180B, Falcon 2, and Falcon 3 series.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/tii.png"},{"id":"teleai","name":"Tele-AI","description":"Telecom operator AI lab. Creator of TeleChat, a Chinese-English bilingual large language model series developed by China Telecom.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/teleai.png"},{"id":"together_ai","name":"Together AI","description":"Build what's next on the AI Native Cloud. Full-stack AI platform for inference, fine-tuning, and GPU clusters — powered by cutting-edge research.","url":"https://www.together.ai","api_base_url":"https://api.together.ai/v1","docs_url":"https://docs.together.ai/docs/serverless-models","pricing_url":"https://www.together.ai/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["together_ai"],"tags":["dedicated-endpoints","fine-tuning","open-source","serverless"],"modalities":["embedding","image","pdf","text","video"],"model_count":26,"priced_model_count":26,"pricing_tiers":["standard"],"pricing_dimensions":["input","output"],"icon_url":"/images/providers/favicons/together_ai.png"},{"id":"together_research","name":"Together Research","description":"Research models from Together AI, including the RedPajama open dataset models and experimental architectures produced by the Together research team.","url":null,"api_base_url":null,"docs_url":null,"pricing_url":null,"own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":[],"tags":[],"modalities":[],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/together_research.png"},{"id":"upstage","name":"Upstage","description":"Upstage builds powerful large language models and document processing engines to transform workflows and empower leading businesses like yours.","url":"https://upstage.ai","api_base_url":"https://api.upstage.ai/v1","docs_url":"https://console.upstage.ai/docs/getting-started/models","pricing_url":"https://console.upstage.ai/docs/getting-started/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["upstage"],"tags":["document-ai","embeddings","korean","multilingual"],"modalities":["embedding","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/upstage.png"},{"id":"vercel_ai_gateway","name":"Vercel AI Gateway","description":"Deploy AI apps in seconds with Vercel's AI SDK and Frontend Cloud. Built-in adapters, streaming UI helpers, and zero-config deployments.","url":"https://vercel.com/ai","api_base_url":"https://ai-gateway.vercel.sh/v1","docs_url":"https://vercel.com/docs/ai-gateway","pricing_url":"https://vercel.com/docs/ai-gateway/pricing","own_models":false,"hosts_platform":true,"openai_compatible":true,"litellm_provider":["vercel_ai_gateway","v0"],"tags":["gateway","openai-compatible","unified-api","zero-markup"],"modalities":["audio","embedding","image","pdf","text","video"],"model_count":289,"priced_model_count":289,"pricing_tiers":["standard"],"pricing_dimensions":["cache_read","cache_write_5m","image_output","image_output_1k","image_output_2k","image_output_4k","image_output_512","image_output_default","input","output","video_1080p","video_1080p_audio","video_1080p_no_audio","video_480p","video_480p_audio","video_480p_no_audio","video_4k_audio","video_4k_no_audio","video_720p","video_720p_audio","video_720p_no_audio","video_pro","video_pro_audio","video_pro_no_audio","video_std","video_std_audio","video_std_no_audio"],"icon_url":"/images/providers/favicons/vercel_ai_gateway.png"},{"id":"voyage","name":"Voyage","description":"Voyage AI provides cutting-edge embedding models and rerankers for search and retrieval","url":"https://www.voyageai.com","api_base_url":"https://api.voyageai.com/v1","docs_url":"https://docs.voyageai.com/docs/embeddings","pricing_url":"https://docs.voyageai.com/docs/pricing","own_models":true,"hosts_platform":false,"openai_compatible":false,"litellm_provider":["voyage"],"tags":["embeddings","rag","rerank","retrieval"],"modalities":["embedding","text"],"model_count":19,"priced_model_count":19,"pricing_tiers":["standard"],"pricing_dimensions":["input"],"icon_url":"/images/providers/favicons/voyage.png"},{"id":"writer","name":"Writer","description":"WRITER is the enterprise AI agent platform trusted by Fortune 500 companies, built to help teams execute and scale on-brand, compliant work.","url":"https://writer.com","api_base_url":"https://api.writer.com/v1","docs_url":"https://dev.writer.com/api-guides/models","pricing_url":"https://writer.com/pricing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":[],"tags":["business-ai","document-understanding","enterprise"],"modalities":["image","text"],"model_count":0,"priced_model_count":0,"pricing_tiers":[],"pricing_dimensions":[],"icon_url":"/images/providers/favicons/writer.png"},{"id":"xai","name":"xAI","description":"Elon Musk's AI company and creators of the Grok model family. Grok models offer large context windows, real-time knowledge via X (Twitter) integration, vision, and multimodal output. Grok-4 is their frontier reasoning model.","url":"https://x.ai","api_base_url":"https://api.x.ai/v1","docs_url":"https://docs.x.ai/docs/models","pricing_url":"https://docs.x.ai/docs/models","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["xai"],"tags":["frontier","long-context","real-time-knowledge","reasoning"],"modalities":["audio","image","pdf","text"],"model_count":38,"priced_model_count":38,"pricing_tiers":["batch","standard"],"pricing_dimensions":["cache_read","image_input","input","output"],"icon_url":"/images/providers/favicons/xai.png"},{"id":"z_ai","name":"Z AI (Zhipu)","description":"Meet Z.ai, your free AI-powered assistant. Build websites, create slides, analyze data, and get instant answers. Fast, smart, and reliable, powered by GLM-5.","url":"https://z.ai","api_base_url":"https://api.z.ai/api/v1","docs_url":"https://bigmodel.cn/dev/api","pricing_url":"https://bigmodel.cn/dev/howuse/billing","own_models":true,"hosts_platform":false,"openai_compatible":true,"litellm_provider":["zai"],"tags":["chinese","multilingual","reasoning"],"modalities":["image","pdf","text"],"model_count":10,"priced_model_count":10,"pricing_tiers":["standard"],"pricing_dimensions":["cache_read","input","output"],"icon_url":"/images/providers/favicons/z_ai.png"}],"meta":{"updated_at":"","request_id":"458443e6-107d-4c67-a7de-16540cdaa1c8","execution_ms":9}}