{"data":[{"id":"microsoft-tts-neural","name":"tts-neural","display_name":"Azure Neural","description":"Microsoft Azure's neural text-to-speech model delivering lifelike, expressive voice synthesis powered by deep learning.","creator":"microsoft","family":"tts","tier":"","version":null,"type":"","size_in_bn":null,"modalities":{"input":[],"output":[]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["azure-neural","microsoft-tts-neural"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-04-20 16:51:01"},{"id":"fun-tts-realtime","name":"fun-tts-realtime","display_name":"Fun TTS Realtime","description":"A real-time text-to-speech model from Alibaba's Fun platform, designed for low-latency streaming audio synthesis.","creator":"fun","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["fun-realtime-tts","fun-tts-realtime"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"inworld-tts","name":"inworld-tts","display_name":"Inworld TTS 1","description":"Inworld's first-generation text-to-speech model, designed for real-time expressive voice synthesis in interactive and gaming applications.","creator":"inworld","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["inworld-tts"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"inworld-tts-1-max","name":"inworld-tts-1-max","display_name":"Inworld TTS 1 Max","description":"The premium-quality tier of Inworld's first-generation TTS model, delivering high-fidelity expressive speech for game and interactive AI characters.","creator":"inworld","family":"tts","tier":"","version":"1","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["inworld-tts-1-max"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"inworld-tts-1-5-max","name":"tts-1-5-max","display_name":"Inworld TTS 1.5 Max","description":"The high-quality tier of Inworld's TTS 1.5 series, offering premium voice synthesis for interactive entertainment and game character dialogue.","creator":"inworld","family":"tts","tier":"max","version":"1-5","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["inworld-tts-1-5-max","tts-1-5-max"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"inworld-tts-1-5-mini","name":"tts-1-5-mini","display_name":"Inworld TTS 1.5 Mini","description":"A compact, low-latency variant of Inworld's TTS 1.5 series, optimized for fast voice synthesis in real-time interactive applications.","creator":"inworld","family":"tts","tier":"mini","version":"1-5","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["inworld-tts-1-5-mini","tts-1-5-mini"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"lmnt-tts","name":"lmnt-tts","display_name":"LMNT","description":"LMNT's text-to-speech synthesis model delivering fast, natural-sounding voice generation for real-time applications.","creator":"lmnt","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["lmnt","lmnt-tts"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"myshell-ai-melotts","name":"melotts","display_name":"MeloTTS","description":"High-quality multilingual text-to-speech library supporting multiple languages with natural-sounding synthesis for voice applications.","creator":"myshell-ai","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["@cf/myshell-ai/melotts","myshell-ai-melotts"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"neuphonic-tts","name":"neuphonic-tts","display_name":"Neuphonic TTS","description":"A real-time text-to-speech model from Neuphonic delivering low-latency, high-quality voice synthesis for conversational applications.","creator":"neuphonic","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["neuphonic","neuphonic-tts"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"noiz-tts","name":"noiz-tts","display_name":"Noiz TTS","description":"A text-to-speech model from Noiz designed for generating synthetic speech audio from text input.","creator":"noiz","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["noiz-tts"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"playai-tts","name":"playai-tts","display_name":"PlayAI TTS","description":"A text-to-speech model from PlayAI offering natural-sounding voice synthesis for a range of conversational and content applications.","creator":"playai","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":10000,"max_output_tokens":10000,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["groq/playai-tts","playai-tts"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"step-tts-2","name":"step-tts-2","display_name":"Step TTS 2","description":"A text-to-speech synthesis model from StepFun delivering natural-sounding voice generation with expressive prosody.","creator":"step","family":"tts","tier":"","version":"2","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["step-tts-2","step-tts-2-mar-2026"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"styletts-tts-2","name":"styletts-tts-2","display_name":"StyleTTS 2","description":"A TTS model that uses style diffusion and adversarial training to achieve human-level naturalness and expressive voice synthesis.","creator":"styletts","family":"tts","tier":"","version":"2","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["styletts-2","styletts-tts-2"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"microsoft-tts","name":"tts","display_name":"TTS","description":"Microsoft Azure's text-to-speech service providing neural voice synthesis across a wide range of languages and voice styles.","creator":"microsoft","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["azure-neural","azure/speech/azure-tts","microsoft-tts"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"openai-tts-1","name":"tts-1","display_name":"TTS 1","description":"A text-to-speech model optimized for realtime speech synthesis, converting written text into natural-sounding spoken audio.","creator":"openai","family":"tts","tier":"","version":"1","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["azure/tts-1","openai-tts-1","tts-1","tts-1-1106"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"openai-tts-1-hd","name":"tts-1-hd","display_name":"TTS 1 HD","description":"A high-quality text-to-speech model optimized for audio fidelity, producing natural-sounding speech for non-realtime use cases.","creator":"openai","family":"tts","tier":"","version":"1","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":2,"ids":["azure/tts-1-hd","openai-tts-1-hd","tts-1-hd","tts-1-hd-1106"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"microsoft-tts-hd","name":"tts-hd","display_name":"TTS HD","description":"A high-definition variant of Microsoft Azure's TTS service offering improved audio fidelity and more natural prosody.","creator":"microsoft","family":"tts","tier":"","version":null,"type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":true,"provider_count":1,"ids":["azure/speech/azure-tts-hd","microsoft-tts-hd"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"},{"id":"microsoft-tts-2-5-hd","name":"tts-2-5-hd","display_name":"TTS HD 2.5","description":"A high-definition Azure TTS model at version 2.5, delivering premium audio quality for natural-sounding speech synthesis.","creator":"microsoft","family":"tts","tier":"","version":"2-5","type":"text-to-speech","size_in_bn":null,"modalities":{"input":["text"],"output":["audio"]},"context_window":null,"max_output_tokens":null,"tool_use_system_prompt_tokens":0,"output_vector_sizes":[],"knowledge_cutoff":null,"training_data_cutoff":null,"supported_reasoning_efforts":[],"tokenizer":null,"capabilities":{"function_calling":false,"parallel_function_calling":false,"structured_outputs":false,"prompt_caching":false,"reasoning":false,"web_search":false,"computer_use":false,"code_execution":false,"file_search":false,"url_context":false,"assistant_prefill":false,"native_structured_output":false,"adaptive_reasoning":false},"release_date":null,"earliest_deprecation_date":null,"deprecated":false,"has_pricing":false,"provider_count":0,"ids":["azure-hd-2-5","microsoft-tts-2-5-hd"],"hf_likes":null,"hf_downloads":null,"hf_downloads_all_time":null,"hf_trending_score":null,"updated_at":"2026-06-11 08:02:18"}],"pagination":{"page_size":50,"has_next":false,"next_token":null,"total_count":18},"meta":{"updated_at":"2026-06-11","request_id":"3fe7d3ad-ff5e-4481-8a52-094f29502d36","execution_ms":2}}