{
  "name": "Azure AI Text to Speech",
  "slug": "azure-text-to-speech",
  "website_url": "https://azure.microsoft.com/en-us/products/ai-services/ai-speech",
  "vendor_description": "\"Text to speech enables your applications, tools, or devices to convert text into human like synthesized speech. The text to speech capability is also known as speech synthesis. Use human like standard voices out of the box, or create a custom voice that's unique to your product or brand.\"",
  "categories": [
    "text-to-speech"
  ],
  "summary": "Azure AI Text to Speech is Microsoft's managed speech synthesis service, suited for voice agents, call center automation, audiobook narration, accessibility tools, and content creation. It offers over 30 deployment regions, a free tier of 500,000 characters per month, and usage-based pricing starting at $15 per million characters for standard voices. SDKs are available for Python, C#, JavaScript, Java, and Go, and the service carries SOC 2 Type 2, HIPAA, GDPR, ISO 27001, and PCI DSS certifications. Custom and personal voice cloning are supported, though professional voice fine-tuning requires limited-access approval.",
  "capabilities": {
    "supported_actions": [
      "synthesize_speech",
      "streaming_tts",
      "batch_synthesis",
      "ssml_support",
      "word_timestamps",
      "viseme_generation",
      "professional_voice_cloning",
      "personal_voice_cloning",
      "custom_voice_training",
      "multilingual_synthesis",
      "voice_design",
      "audio_content_creation",
      "text_to_speech_avatar",
      "real_time_synthesis",
      "async_long_audio_synthesis"
    ],
    "supported_regions": [
      "Australia East",
      "Brazil South",
      "Canada Central",
      "Canada East",
      "Central US",
      "East Asia",
      "East US",
      "East US 2",
      "France Central",
      "Germany West Central",
      "India Central",
      "Italy North",
      "Japan East",
      "Japan West",
      "Korea Central",
      "North Central US",
      "North Europe",
      "Norway East",
      "Qatar Central",
      "South Africa North",
      "South Central US",
      "Southeast Asia",
      "Sweden Central",
      "Switzerland North",
      "Switzerland West",
      "UAE North",
      "UK South",
      "UK West",
      "West Central US",
      "West Europe",
      "West US",
      "West US 2",
      "West US 3",
      "US Gov Arizona",
      "US Gov Virginia"
    ],
    "supported_languages": [
      "af-ZA (Afrikaans, South Africa)",
      "am-ET (Amharic, Ethiopia)",
      "ar-AE (Arabic, UAE)",
      "ar-BH (Arabic, Bahrain)",
      "ar-DZ (Arabic, Algeria)",
      "ar-EG (Arabic, Egypt)",
      "ar-IQ (Arabic, Iraq)",
      "ar-JO (Arabic, Jordan)",
      "ar-KW (Arabic, Kuwait)",
      "ar-LB (Arabic, Lebanon)",
      "ar-LY (Arabic, Libya)",
      "ar-MA (Arabic, Morocco)",
      "ar-OM (Arabic, Oman)",
      "ar-QA (Arabic, Qatar)",
      "ar-SA (Arabic, Saudi Arabia)",
      "ar-SY (Arabic, Syria)",
      "ar-TN (Arabic, Tunisia)",
      "ar-YE (Arabic, Yemen)",
      "as-IN (Assamese, India)",
      "az-AZ (Azerbaijani, Azerbaijan)",
      "bg-BG (Bulgarian, Bulgaria)",
      "bn-BD (Bangla, Bangladesh)",
      "bn-IN (Bengali, India)",
      "bs-BA (Bosnian, Bosnia and Herzegovina)",
      "ca-ES (Catalan)",
      "cs-CZ (Czech, Czechia)",
      "cy-GB (Welsh, United Kingdom)",
      "da-DK (Danish, Denmark)",
      "de-AT (German, Austria)",
      "de-CH (German, Switzerland)",
      "de-DE (German, Germany)",
      "el-GR (Greek, Greece)",
      "en-AU (English, Australia)",
      "en-CA (English, Canada)",
      "en-GB (English, United Kingdom)",
      "en-HK (English, Hong Kong SAR)",
      "en-IE (English, Ireland)",
      "en-IN (English, India)",
      "en-KE (English, Kenya)",
      "en-NG (English, Nigeria)",
      "en-NZ (English, New Zealand)",
      "en-PH (English, Philippines)",
      "en-SG (English, Singapore)",
      "en-TZ (English, Tanzania)",
      "en-US (English, United States)",
      "en-ZA (English, South Africa)",
      "es-AR (Spanish, Argentina)",
      "es-BO (Spanish, Bolivia)",
      "es-CL (Spanish, Chile)",
      "es-CO (Spanish, Colombia)",
      "es-CR (Spanish, Costa Rica)",
      "es-CU (Spanish, Cuba)",
      "es-DO (Spanish, Dominican Republic)",
      "es-EC (Spanish, Ecuador)",
      "es-ES (Spanish, Spain)",
      "es-GQ (Spanish, Equatorial Guinea)",
      "es-GT (Spanish, Guatemala)",
      "es-HN (Spanish, Honduras)",
      "es-MX (Spanish, Mexico)",
      "es-NI (Spanish, Nicaragua)",
      "es-PA (Spanish, Panama)",
      "es-PE (Spanish, Peru)",
      "es-PR (Spanish, Puerto Rico)",
      "es-PY (Spanish, Paraguay)",
      "es-SV (Spanish, El Salvador)",
      "es-US (Spanish, United States)",
      "es-UY (Spanish, Uruguay)",
      "es-VE (Spanish, Venezuela)",
      "et-EE (Estonian, Estonia)",
      "eu-ES (Basque)",
      "fa-IR (Persian, Iran)",
      "fi-FI (Finnish, Finland)",
      "fil-PH (Filipino, Philippines)",
      "fr-BE (French, Belgium)",
      "fr-CA (French, Canada)",
      "fr-CH (French, Switzerland)",
      "fr-FR (French, France)",
      "ga-IE (Irish, Ireland)",
      "gl-ES (Galician)",
      "gu-IN (Gujarati, India)",
      "he-IL (Hebrew, Israel)",
      "hi-IN (Hindi, India)",
      "hr-HR (Croatian, Croatia)",
      "hu-HU (Hungarian, Hungary)",
      "hy-AM (Armenian, Armenia)",
      "id-ID (Indonesian, Indonesia)",
      "is-IS (Icelandic, Iceland)",
      "it-IT (Italian, Italy)",
      "iu-CANS-CA (Inuktitut Syllabics, Canada)",
      "iu-LATN-CA (Inuktitut Latin, Canada)",
      "ja-JP (Japanese, Japan)",
      "jv-ID (Javanese, Indonesia)",
      "ka-GE (Georgian, Georgia)",
      "kk-KZ (Kazakh, Kazakhstan)",
      "km-KH (Khmer, Cambodia)",
      "kn-IN (Kannada, India)",
      "ko-KR (Korean, Korea)",
      "lo-LA (Lao, Laos)",
      "lt-LT (Lithuanian, Lithuania)",
      "lv-LV (Latvian, Latvia)",
      "mk-MK (Macedonian, North Macedonia)",
      "ml-IN (Malayalam, India)",
      "mn-MN (Mongolian, Mongolia)",
      "mr-IN (Marathi, India)",
      "ms-MY (Malay, Malaysia)",
      "mt-MT (Maltese, Malta)",
      "my-MM (Burmese, Myanmar)",
      "nb-NO (Norwegian Bokmål, Norway)",
      "ne-NP (Nepali, Nepal)",
      "nl-BE (Dutch, Belgium)",
      "nl-NL (Dutch, Netherlands)",
      "or-IN (Odia, India)",
      "pa-IN (Punjabi, India)",
      "pl-PL (Polish, Poland)",
      "ps-AF (Pashto, Afghanistan)",
      "pt-BR (Portuguese, Brazil)",
      "pt-PT (Portuguese, Portugal)",
      "ro-RO (Romanian, Romania)",
      "ru-RU (Russian, Russia)",
      "si-LK (Sinhala, Sri Lanka)",
      "sk-SK (Slovak, Slovakia)",
      "sl-SI (Slovenian, Slovenia)",
      "so-SO (Somali, Somalia)",
      "sq-AL (Albanian, Albania)",
      "sr-LATN-RS (Serbian Latin, Serbia)",
      "sr-RS (Serbian Cyrillic, Serbia)",
      "su-ID (Sundanese, Indonesia)",
      "sv-SE (Swedish, Sweden)",
      "sw-KE (Kiswahili, Kenya)",
      "sw-TZ (Kiswahili, Tanzania)",
      "ta-IN (Tamil, India)",
      "ta-LK (Tamil, Sri Lanka)",
      "ta-MY (Tamil, Malaysia)",
      "ta-SG (Tamil, Singapore)",
      "te-IN (Telugu, India)",
      "th-TH (Thai, Thailand)",
      "tr-TR (Turkish, Türkiye)",
      "uk-UA (Ukrainian, Ukraine)",
      "ur-IN (Urdu, India)",
      "ur-PK (Urdu, Pakistan)",
      "uz-UZ (Uzbek, Uzbekistan)",
      "vi-VN (Vietnamese, Vietnam)",
      "wuu-CN (Chinese Wu, Simplified)",
      "yue-CN (Chinese Cantonese, Simplified)",
      "zh-CN (Chinese Mandarin, Simplified)",
      "zh-HK (Chinese Cantonese, Traditional)",
      "zh-TW (Chinese Taiwanese Mandarin, Traditional)"
    ],
    "input_types": [
      "plain text",
      "SSML (Speech Synthesis Markup Language)"
    ],
    "output_types": [
      "mp3 (various bitrates)",
      "opus (ogg, webm containers)",
      "pcm (raw)",
      "wav (riff)",
      "alaw",
      "mulaw",
      "truesilk",
      "g722",
      "amr-wb"
    ],
    "webhooks_supported": false,
    "sandbox_available": false,
    "sdk_languages": [
      "Python",
      "C#",
      "JavaScript",
      "Java",
      "Go"
    ],
    "mcp_server_available": true
  },
  "integration": {
    "api_style": "rest",
    "base_url": "https://{region}.tts.speech.microsoft.com/cognitiveservices/v1",
    "api_version": "2024-04-01",
    "versioning_scheme": "url",
    "stability": "ga",
    "deprecation_policy_url": null,
    "auth_methods": [
      "api_key",
      "jwt"
    ],
    "auth_docs_url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/rest-text-to-speech#authentication",
    "idempotency_supported": null,
    "error_format": "vendor-specific",
    "webhook_signing": null,
    "webhook_events_url": null,
    "rate_limit_requests": 200,
    "rate_limit_window": "second",
    "sdk_packages": [
      {
        "package": "azure-cognitiveservices-speech",
        "language": "Python",
        "official": true,
        "repo_url": "https://github.com/Azure-Samples/cognitive-services-speech-sdk"
      },
      {
        "package": "Microsoft.CognitiveServices.Speech",
        "language": "C#",
        "official": true,
        "repo_url": "https://github.com/Azure-Samples/cognitive-services-speech-sdk"
      },
      {
        "package": "microsoft-cognitiveservices-speech-sdk",
        "language": "JavaScript",
        "official": true,
        "repo_url": "https://github.com/microsoft/cognitive-services-speech-sdk-js"
      },
      {
        "package": "com.microsoft.cognitiveservices.speech:client-sdk",
        "language": "Java",
        "official": true,
        "repo_url": "https://github.com/Azure-Samples/cognitive-services-speech-sdk"
      },
      {
        "package": "github.com/Microsoft/cognitive-services-speech-sdk-go",
        "language": "Go",
        "official": true,
        "repo_url": "https://github.com/Microsoft/cognitive-services-speech-sdk-go"
      }
    ],
    "mcp_url": "https://github.com/microsoft/mcp/tree/main/servers/Azure.Mcp.Server",
    "quickstart_url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/get-started-text-to-speech"
  },
  "pricing": {
    "pricing_model": "usage_based",
    "has_published_pricing": true,
    "starting_price_usd": "15.0000",
    "price_basis": "1M characters",
    "free_tier_available": true,
    "free_tier_limit": "500,000 characters/month",
    "free_tier_details": "Free (F0) tier: 0.5 million characters per month for neural text-to-speech (recurring monthly allowance, not a one-time trial). Free tier rate limits are not adjustable.",
    "minimum_commitment": null,
    "self_serve_signup": true,
    "requires_sales_call": false,
    "requires_verification": false,
    "enterprise_plan_available": true,
    "price_points": [
      {
        "plan": "Free (F0)",
        "item": "Speech synthesis - neural voices (recurring monthly allowance)",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "0.5M characters per month",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Speech synthesis - neural voices (real-time & batch)",
        "amount_usd": "16.0000",
        "amount_percent": null,
        "per": "1M characters",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Speech synthesis - neural HD voices (real-time & batch)",
        "amount_usd": "22.0000",
        "amount_percent": null,
        "per": "1M characters",
        "currency": "USD",
        "source_url": "https://azurefeeds.com/2026/03/31/azure-speech-neural-hd-text-to-speech-recent-voice-updates/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Speech synthesis - neural voices (long audio creation)",
        "amount_usd": "100.0000",
        "amount_percent": null,
        "per": "1M characters",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Speech synthesis - custom neural voice (real-time & batch)",
        "amount_usd": "24.0000",
        "amount_percent": null,
        "per": "1M characters",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Speech synthesis - custom neural HD voice (real-time & batch)",
        "amount_usd": "48.0000",
        "amount_percent": null,
        "per": "1M characters",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Speech synthesis - custom neural voice (long audio creation)",
        "amount_usd": "100.0000",
        "amount_percent": null,
        "per": "1M characters",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Custom neural voice model training",
        "amount_usd": "52.0000",
        "amount_percent": null,
        "per": "compute hour",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Custom neural voice endpoint hosting",
        "amount_usd": "4.0400",
        "amount_percent": null,
        "per": "model per hour",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Personal voice synthesis",
        "amount_usd": "24.0000",
        "amount_percent": null,
        "per": "1M characters",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Pay As You Go (S0)",
        "item": "Personal voice profile storage",
        "amount_usd": "600.0000",
        "amount_percent": null,
        "per": "1,000 profiles per month",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Commitment - 80M characters/month",
        "item": "Speech synthesis - neural voices",
        "amount_usd": "1024.0000",
        "amount_percent": null,
        "per": "month (80M characters included)",
        "currency": "USD",
        "source_url": "https://speechify.com/blog/microsoft-azure-pricing-plans/"
      },
      {
        "plan": "Commitment - 400M characters/month",
        "item": "Speech synthesis - neural voices",
        "amount_usd": "4160.0000",
        "amount_percent": null,
        "per": "month (400M characters included)",
        "currency": "USD",
        "source_url": "https://speechify.com/blog/microsoft-azure-pricing-plans/"
      },
      {
        "plan": "Commitment - 2,000M characters/month",
        "item": "Speech synthesis - neural voices",
        "amount_usd": "16000.0000",
        "amount_percent": null,
        "per": "month (2,000M characters included)",
        "currency": "USD",
        "source_url": "https://speechify.com/blog/microsoft-azure-pricing-plans/"
      },
      {
        "plan": "Connected Container - 80M characters/month",
        "item": "Speech synthesis - neural voices",
        "amount_usd": "972.8000",
        "amount_percent": null,
        "per": "month (80M characters included)",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Connected Container - 400M characters/month",
        "item": "Speech synthesis - neural voices",
        "amount_usd": "3952.0000",
        "amount_percent": null,
        "per": "month (400M characters included)",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      },
      {
        "plan": "Connected Container - 2,000M characters/month",
        "item": "Speech synthesis - neural voices",
        "amount_usd": "15200.0000",
        "amount_percent": null,
        "per": "month (2,000M characters included)",
        "currency": "USD",
        "source_url": "https://azure.microsoft.com/en-us/pricing/details/speech/"
      }
    ]
  },
  "compliance": {
    "soc2": "type_2",
    "hipaa": true,
    "gdpr": true,
    "iso_27001": true,
    "pci_dss": true,
    "sla_published": true,
    "sla_url": "https://www.microsoft.com/licensing/docs/view/Service-Level-Agreements-SLA-for-Online-Services?lang=1",
    "data_retention_policy_url": "https://learn.microsoft.com/en-us/azure/foundry/responsible-ai/speech-service/text-to-speech/data-privacy-security",
    "documented_rate_limits": "Free (F0): 20 transactions per 60 seconds (not adjustable). Standard (S0): 200 transactions per second (TPS) default, adjustable up to 1,000 TPS upon request. Maximum audio length per request: 10 minutes. Maximum SSML message size per WebSocket turn: 64 KB. Maximum distinct voice/audio tags in SSML: 50. HD voice latency: less than 300 ms.",
    "known_restrictions": [
      "Custom voice (professional voice fine-tuning) requires limited-access application approval",
      "Chinese characters counted as two characters for billing, including kanji (Japanese), hanja (Korean), hanzi (other languages)",
      "HD voices support only a subset of SSML elements (not full SSML)",
      "Personal voice does not support BYOS (Bring Your Own Storage)",
      "Dragon HD Flash voices only support zh-CN and en-US text",
      "Real-time HD voice synthesis only (no batch synthesis for HD voices)",
      "Maximum 10 minutes audio output per real-time synthesis request",
      "Custom voice endpoint hosting billed separately per hour",
      "Voice talent verbal consent recording required before custom voice training"
    ]
  },
  "developer": {
    "docs_url": "https://azure.microsoft.com/en-us/resources/developers/",
    "api_reference_url": null,
    "openapi_spec_url": null,
    "postman_collection_url": null,
    "changelog_url": null,
    "status_page_url": null,
    "llms_txt_url": "https://azure.microsoft.com/llms.txt",
    "markdown_docs_url": null,
    "rendering": "static"
  },
  "adoption": {
    "launched_at": "2018-09-24",
    "ga_date": "2018-11-01",
    "github_stars": null,
    "github_stars_at": null,
    "notable_customers": []
  },
  "scores": {
    "agent_friendliness": 65,
    "pricing_transparency": 100,
    "setup_speed": 85,
    "docs_quality": 25,
    "procurement_friction": 100,
    "trust_readiness": 100,
    "best_for": [
      "Prototypes and side projects - free to start, no sales call",
      "Regulated or enterprise workloads - compliance attestations and an enterprise plan",
      "AI agents and automation - an agent-ready surface (MCP / llms.txt)"
    ],
    "avoid_if": []
  },
  "sources": [
    {
      "field": "categories",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Text to speech enables your applications, tools, or devices to convert text into human like synthesized speech.",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Standard voices: High-quality neural voices available out of the box in 100+ languages and locales",
      "confidence": "high"
    },
    {
      "field": "supported_actions",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Improve text to speech output with SSML: Speech Synthesis Markup Language (SSML) is an XML-based markup language used to customize text to speech outputs. Visemes: Visemes are the key poses in observed speech, including the position of the lips, jaw, and tongue in producing a particular phoneme.",
      "confidence": "high"
    },
    {
      "field": "sdk_languages",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-sdk",
      "excerpt": "The Speech SDK supports the following languages and platforms: C#, C++, Go, Java, JavaScript, Objective-C, Python, Swift",
      "confidence": "high"
    },
    {
      "field": "pricing_model",
      "url": "https://azure.microsoft.com/en-us/pricing/details/speech/",
      "excerpt": null,
      "confidence": "high"
    },
    {
      "field": "free_tier_available",
      "url": "https://speechify.com/blog/microsoft-azure-pricing-plans/",
      "excerpt": "Limited to processing 0.5 million characters per month",
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "Maximum number of transactions per time period for standard voices and custom voices: Free (F0): 20 transactions per 60 seconds (This limit isn't adjustable). Standard (S0): 200 transactions per second (TPS) (default value). The rate is adjustable up to 1,000 TPS for Standard (S0) resources.",
      "confidence": "high"
    },
    {
      "field": "mcp_server_available",
      "url": "https://learn.microsoft.com/en-us/azure/developer/azure-mcp-server/services/azure-mcp-speech-foundry-tools",
      "excerpt": "Azure Model Context Protocol (MCP) Server enables AI assistants like GitHub Copilot, Claude Desktop, and others to interact with Azure Speech in Foundry Tools through natural language commands.",
      "confidence": "high"
    },
    {
      "field": "pci_dss",
      "url": "https://learn.microsoft.com/en-us/azure/compliance/offerings/offering-pci-dss",
      "excerpt": "Microsoft Azure maintains a PCI DSS validation using an approved Qualified Security Assessor (QSA), and is certified as compliant under PCI DSS version 4.0 at Service Provider Level 1.",
      "confidence": "high"
    },
    {
      "field": "iso_27001",
      "url": "https://learn.microsoft.com/en-us/azure/compliance/offerings/offering-iso-27001",
      "excerpt": "Microsoft Azure, Dynamics 365, and other Microsoft online services undergo regular independent third-party audits for ISO/IEC 27001 compliance.",
      "confidence": "high"
    },
    {
      "field": "gdpr",
      "url": "https://learn.microsoft.com/en-us/azure/foundry/responsible-ai/speech-service/text-to-speech/data-privacy-security",
      "excerpt": "The Microsoft Products and Services Data Protection Addendum sets forth customers' and Microsoft's obligations with respect to the processing and security of Customer Data and Personal Data in connection with Azure",
      "confidence": "high"
    },
    {
      "field": "supported_regions",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/rest-text-to-speech",
      "excerpt": "These regions are supported for text to speech through the REST API: Australia East, Brazil South, Canada Central, Canada East, Central US, East Asia, East US, East US 2, France Central, Germany West Central, India Central, Italy North, Japan East, Japan West, Korea Central, North Central US, North Europe, Norway East, Qatar Central, South Africa North, South Central US, Southeast Asia, Sweden Central, Switzerland North, Switzerland West, UAE North, UK South, UK West, US Gov Arizona, US Gov Virginia, West Central US, West Europe, West US, West US 2, West US 3",
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Custom voice is an umbrella term that includes professional voice fine-tuning and personal voice. Custom voice training and hosting are both calculated by hour and billed per second.",
      "confidence": "high"
    },
    {
      "field": "vendor_description",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Text to speech enables your applications, tools, or devices to convert text into human like synthesized speech. The text to speech capability is also known as speech synthesis. Use human like standard voices out of the box, or create a custom voice that's unique to your product or brand.",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/language-support?tabs=tts",
      "excerpt": "The text-to-speech section contains an extensive table listing supported locales including af-ZA, am-ET, ar-AE through zh-TW — approximately 140+ language-locale combinations representing over 130 distinct languages.",
      "confidence": "high"
    },
    {
      "field": "supported_actions",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Real-time speech synthesis: Use the Speech SDK or REST API to convert text to speech by using standard voices or custom voices. Asynchronous synthesis of long audio: Use the batch synthesis API to asynchronously synthesize text to speech files longer than 10 minutes",
      "confidence": "high"
    },
    {
      "field": "output_types",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/rest-text-to-speech",
      "excerpt": "audio-16khz-32kbitrate-mono-mp3\naudio-24khz-48kbitrate-mono-mp3\nogg-16khz-16bit-mono-opus\nwebm-24khz-16bit-mono-opus\nraw-8khz-8bit-mono-alaw\nraw-8khz-8bit-mono-mulaw\nriff-24khz-16bit-mono-pcm\ng722-16khz-64kbps\namr-wb-16000hz",
      "confidence": "high"
    },
    {
      "field": "pricing_model",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "When you use the text to speech feature, billing is based on the total number of characters in each successfully processed request.",
      "confidence": "high"
    },
    {
      "field": "free_tier_available",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "For the Free (F0) pricing tier, see the monthly allowances on the pricing page.",
      "confidence": "high"
    },
    {
      "field": "has_published_pricing",
      "url": "https://azure.microsoft.com/en-us/pricing/details/speech/",
      "excerpt": null,
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "Maximum audio length produced per request: 10 minutes (both F0 and S0). Maximum SSML message size per turn for WebSocket: 64 KB. Maximum total number of distinct voice and audio tags in SSML: 50.",
      "confidence": "high"
    },
    {
      "field": "hipaa",
      "url": "https://learn.microsoft.com/en-us/azure/compliance/offerings/offering-hipaa-us",
      "excerpt": "Microsoft will enter into BAAs with its covered entity and business associate customers. Azure has enabled the physical, technical, and administrative safeguards required by HIPAA and the HITECH Act inside the in-scope Azure services, and offers a HIPAA BAA as part of the Microsoft Product Terms to all customers who are covered entities or business associates under HIPAA",
      "confidence": "high"
    },
    {
      "field": "pci_dss",
      "url": "https://learn.microsoft.com/en-us/azure/compliance/offerings/offering-pci-dss",
      "excerpt": "For a list of Microsoft online services in audit scope, see the PCI DSS Attestation of Compliance (AoC) that is available separately for Azure and Azure Government",
      "confidence": "high"
    },
    {
      "field": "soc2",
      "url": "https://azure.microsoft.com/en-us/blog/cognitive-services-certifications-and-availability/",
      "excerpt": "Azure Cognitive Services include ISO 27001:2013 certification, HIPAA BAA, HITRUST CSF certification, SOC 1 Type 2, SOC 2 Type 2, and SOC 3 attestation.",
      "confidence": "high"
    },
    {
      "field": "sla_published",
      "url": "https://azure.microsoft.com/en-us/support/legal/sla/cognitive-services/v1_0/",
      "excerpt": null,
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Each Chinese character is counted as two characters for billing, including kanji used in Japanese, hanja used in Korean, or hanzi used in other languages.",
      "confidence": "high"
    },
    {
      "field": "enterprise_plan_available",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "For Standard pricing tier, you can increase the real-time TPS limit. A TPS increase request requires business justification.",
      "confidence": "medium"
    },
    {
      "field": "auth_methods",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/rest-text-to-speech",
      "excerpt": "Each request requires an authorization header. This table illustrates which headers are supported for each feature: `Ocp-Apim-Subscription-Key` | Yes | Yes | `Authorization: Bearer` | Yes | Yes",
      "confidence": "high"
    },
    {
      "field": "base_url",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/get-started-text-to-speech",
      "excerpt": "https://${SPEECH_REGION}.tts.speech.microsoft.com/cognitiveservices/v1",
      "confidence": "high"
    },
    {
      "field": "versioning_scheme",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/rest-text-to-speech",
      "excerpt": "The `cognitiveservices/v1` endpoint allows you to convert text to speech by using Speech Synthesis Markup Language (SSML).",
      "confidence": "high"
    },
    {
      "field": "sdk_packages",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-sdk",
      "excerpt": "The Speech SDK is available in many programming languages: C#, C++, Go, Java, JavaScript, Objective-C, Python, Swift",
      "confidence": "high"
    },
    {
      "field": "mcp_url",
      "url": "https://learn.microsoft.com/en-us/azure/developer/azure-mcp-server/tools/ai-services-speech",
      "excerpt": "Use the Azure MCP Server to manage Azure Speech in Foundry Tools functionalities such as speech-to-text (STT) and text-to-speech (TTS) with natural language prompts.",
      "confidence": "high"
    },
    {
      "field": "api_style",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/how-to-lower-speech-synthesis-latency",
      "excerpt": "To use the text streaming feature, connect to the websocket V2 endpoint: `wss://{region}.tts.speech.microsoft.com/cognitiveservices/websocket/v2`",
      "confidence": "high"
    },
    {
      "field": "error_format",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/batch-synthesis",
      "excerpt": "{\"error\": {\"code\": \"BadRequest\", \"message\": \"The inputs is required.\"}}",
      "confidence": "high"
    },
    {
      "field": "rate_limit_window",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "200 transactions per second (TPS) (default value) The rate is adjustable up to 1,000 TPS for Standard (S0) resources.",
      "confidence": "high"
    },
    {
      "field": "starting_price_usd",
      "url": "https://blocksentient.com/review/microsoft-azure-speech-service/",
      "excerpt": "$15/1M characters",
      "confidence": "medium"
    },
    {
      "field": "price_basis",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "Multiply the result by the unit price of $15 per million characters to estimate the monthly cost.",
      "confidence": "high"
    },
    {
      "field": "free_tier_limit",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "For the Free (F0) pricing tier, see the monthly allowances on the pricing page.",
      "confidence": "medium"
    },
    {
      "field": "ga_date",
      "url": "https://azure.microsoft.com/de-de/updates/azure-cognitive-services-speech-service-is-now-generally-available/",
      "excerpt": "Azure Cognitive Services—Speech Service now generally available | General availability pricing for the speech service went into effect on November 1, 2018.",
      "confidence": "medium"
    },
    {
      "field": "quickstart_url",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/get-started-text-to-speech",
      "excerpt": "Text to speech quickstart - Speech service - Foundry Tools | Microsoft Learn",
      "confidence": "high"
    },
    {
      "field": "webhooks_supported",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/text-to-speech",
      "excerpt": "Asynchronous synthesis of long audio: Use the batch synthesis API to asynchronously synthesize text to speech files longer than 10 minutes; responses are polled for, and synthesized audio is downloaded when the service makes it available.",
      "confidence": "medium"
    },
    {
      "field": "base_url",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/rest-text-to-speech",
      "excerpt": "East US | `https://eastus.tts.speech.microsoft.com/cognitiveservices/v1`",
      "confidence": "high"
    },
    {
      "field": "api_version",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/batch-synthesis",
      "excerpt": "\"https://YourResourceName.cognitiveservices.azure.com/texttospeech/batchsyntheses/YourSynthesisId?api-version=2024-04-01\"",
      "confidence": "high"
    },
    {
      "field": "stability",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/batch-synthesis",
      "excerpt": "The Batch synthesis API is generally available. The Long Audio API will be retired on April 1st, 2027.",
      "confidence": "high"
    },
    {
      "field": "sdk_packages",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-sdk",
      "excerpt": "In depth samples are available in the Azure-Samples/cognitive-services-speech-sdk repository on GitHub. Code samples for Go are available in the Microsoft/cognitive-services-speech-sdk-go repository on GitHub.",
      "confidence": "high"
    },
    {
      "field": "mcp_url",
      "url": "https://learn.microsoft.com/en-us/azure/developer/azure-mcp-server/get-started",
      "excerpt": "Explore and contribute to the Azure MCP Server on GitHub: https://github.com/microsoft/mcp/tree/main/servers/Azure.Mcp.Server",
      "confidence": "high"
    },
    {
      "field": "api_style",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/rest-text-to-speech",
      "excerpt": "The Speech service allows you to convert text into synthesized speech and get a list of supported voices for a region by using a REST API.",
      "confidence": "high"
    },
    {
      "field": "rate_limit_requests",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "Maximum number of transactions per time period for standard voices and custom voices | 20 transactions per 60 seconds (F0) | 200 transactions per second (TPS) (default value)",
      "confidence": "high"
    },
    {
      "field": "data_retention_policy_url",
      "url": "https://learn.microsoft.com/en-us/azure/foundry/responsible-ai/speech-service/text-to-speech/data-privacy-security",
      "excerpt": "Microsoft doesn't retain or store the text that you provide with the real-time synthesis text to speech API. ... Microsoft doesn't store audio or video content generated with the real-time synthesis API.",
      "confidence": "high"
    },
    {
      "field": "starting_price_usd",
      "url": "https://learn.microsoft.com/en-us/azure/ai-services/speech-service/speech-services-quotas-and-limits",
      "excerpt": "Multiply the result by the unit price of $15 per million characters to estimate the monthly cost.",
      "confidence": "medium"
    },
    {
      "field": "free_tier_limit",
      "url": "https://blocksentient.com/review/microsoft-azure-speech-service/",
      "excerpt": "0.5 million characters free per month (Neural)",
      "confidence": "medium"
    },
    {
      "field": "launched_at",
      "url": "https://azure.microsoft.com/de-de/updates/azure-cognitive-services-speech-service-is-now-generally-available/",
      "excerpt": "Azure Cognitive Services—Speech Service now generally available",
      "confidence": "medium"
    },
    {
      "field": "sla_url",
      "url": "https://www.microsoft.com/licensing/docs/view/Service-Level-Agreements-SLA-for-Online-Services?lang=1",
      "excerpt": null,
      "confidence": "high"
    }
  ],
  "fields_not_found": [
    "exact_sla_uptime_percentage",
    "enterprise_plan_name",
    "deprecation_policy_url",
    "idempotency_supported",
    "webhook_signing",
    "webhook_events_url",
    "notable_customers"
  ],
  "source_confidence": "high",
  "last_verified_at": "2026-06-21T00:00:00.000Z",
  "contribute": {
    "note": "This data is crowd-editable. Suggest corrections or leave a review via the endpoints below. No auth is required, requests are rate-limited, and every submission is reviewed before it goes live. For a field edit, replace {field} in the URL with any key in this response; a citation is required.",
    "endpoints": [
      {
        "action": "review",
        "label": "Leave a review or comment",
        "method": "POST",
        "url": "https://apio.sh/api/feedback/azure-text-to-speech",
        "example_body": {
          "kind": "review",
          "rating": 5,
          "body": "Your experience with this API…"
        }
      },
      {
        "action": "field_edit",
        "label": "Suggest a correction to a field (cite a source)",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/azure-text-to-speech/{field}",
        "example_body": {
          "value": "corrected value",
          "citations": [
            {
              "url": "https://source.example/page",
              "excerpt": "supporting quote"
            }
          ],
          "note": "what changed and why"
        }
      },
      {
        "action": "new_api",
        "label": "Suggest a new API to add (only name is required - send as much as you can cite)",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/api",
        "example_body": {
          "value": {
            "name": "Acme Email API",
            "website_url": "https://acme.example",
            "vendor_name": "Acme",
            "categories": [
              "email"
            ],
            "pricing_model": "usage_based",
            "has_published_pricing": true,
            "free_tier_available": true,
            "price_points": [
              {
                "plan": "Pay as you go",
                "item": "1,000 emails",
                "amount_usd": 1,
                "per": "1,000 emails",
                "source_url": "https://acme.example/pricing"
              }
            ],
            "soc2": "type_2",
            "docs_url": "https://docs.acme.example"
          },
          "citations": [
            {
              "url": "https://acme.example/pricing",
              "excerpt": "$1 per 1,000 emails"
            }
          ]
        },
        "value_schema": [
          {
            "field": "name",
            "type": "string",
            "label": "Product name (the only required field)"
          },
          {
            "field": "website_url",
            "type": "string",
            "label": "Marketing website URL"
          },
          {
            "field": "vendor_name",
            "type": "string",
            "label": "Company/vendor name behind the product"
          },
          {
            "field": "vendor_description",
            "type": "string",
            "label": "One-line description, quoted from the vendor"
          },
          {
            "field": "categories",
            "type": "string[]",
            "label": "Category/leaf slugs it belongs to, e.g. [\"email\",\"sms\"]"
          },
          {
            "field": "primary_use_cases",
            "type": "string[]",
            "label": "What it's used for"
          },
          {
            "field": "supported_actions",
            "type": "string[]",
            "label": "Concrete API actions/capabilities"
          },
          {
            "field": "supported_regions",
            "type": "string[]",
            "label": "Countries/regions/data-residency"
          },
          {
            "field": "supported_languages",
            "type": "string[]",
            "label": "Human/spoken languages supported"
          },
          {
            "field": "input_types",
            "type": "string[]",
            "label": "Accepted input types/formats"
          },
          {
            "field": "output_types",
            "type": "string[]",
            "label": "Produced output types/formats"
          },
          {
            "field": "webhooks_supported",
            "type": "bool",
            "label": "Supports webhooks?"
          },
          {
            "field": "sandbox_available",
            "type": "bool",
            "label": "Dedicated sandbox/test mode?"
          },
          {
            "field": "sdk_languages",
            "type": "string[]",
            "label": "Languages with an official SDK"
          },
          {
            "field": "mcp_server_available",
            "type": "bool",
            "label": "Official MCP server?"
          },
          {
            "field": "pricing_model",
            "type": "enum",
            "label": "Pricing model",
            "values": [
              "usage_based",
              "subscription",
              "seat_based",
              "hybrid",
              "contact_sales"
            ]
          },
          {
            "field": "has_published_pricing",
            "type": "bool",
            "label": "Concrete prices published publicly?"
          },
          {
            "field": "free_tier_available",
            "type": "bool",
            "label": "Recurring/perpetual free tier (not a trial)?"
          },
          {
            "field": "free_tier_details",
            "type": "string",
            "label": "What the free tier includes"
          },
          {
            "field": "minimum_commitment",
            "type": "string",
            "label": "Any stated minimum spend/commitment"
          },
          {
            "field": "self_serve_signup",
            "type": "bool",
            "label": "Get an API key without talking to sales?"
          },
          {
            "field": "requires_sales_call",
            "type": "bool",
            "label": "Does going live require talking to sales?"
          },
          {
            "field": "enterprise_plan_available",
            "type": "bool",
            "label": "Named enterprise tier?"
          },
          {
            "field": "starting_price_usd",
            "type": "number",
            "label": "Lowest published paid entry price (USD number)"
          },
          {
            "field": "price_basis",
            "type": "string",
            "label": "Unit the starting price is per, e.g. '1,000 emails'"
          },
          {
            "field": "free_tier_limit",
            "type": "string",
            "label": "Free-tier ceiling in literal terms"
          },
          {
            "field": "price_points",
            "type": "object[]",
            "label": "Structured prices: [{plan,item,amount_usd,amount_percent,per,source_url}]"
          },
          {
            "field": "soc2",
            "type": "enum",
            "label": "SOC 2 status",
            "values": [
              "type_2",
              "type_1",
              "in_progress",
              "none",
              "unknown"
            ]
          },
          {
            "field": "hipaa",
            "type": "bool",
            "label": "HIPAA (e.g. BAA available)?"
          },
          {
            "field": "gdpr",
            "type": "bool",
            "label": "GDPR compliance stated?"
          },
          {
            "field": "iso_27001",
            "type": "bool",
            "label": "ISO 27001 certified?"
          },
          {
            "field": "pci_dss",
            "type": "bool",
            "label": "PCI DSS compliant?"
          },
          {
            "field": "sla_published",
            "type": "bool",
            "label": "Published SLA / uptime commitment?"
          },
          {
            "field": "documented_rate_limits",
            "type": "string",
            "label": "Documented rate limits, quoted"
          },
          {
            "field": "known_restrictions",
            "type": "string[]",
            "label": "Notable documented restrictions/limits"
          },
          {
            "field": "auth_methods",
            "type": "string[]",
            "label": "Auth methods",
            "values": [
              "api_key",
              "oauth2",
              "jwt",
              "basic",
              "hmac_signature",
              "mtls",
              "session"
            ]
          },
          {
            "field": "api_style",
            "type": "enum",
            "label": "Primary API style",
            "values": [
              "rest",
              "graphql",
              "grpc",
              "soap",
              "websocket"
            ]
          },
          {
            "field": "base_url",
            "type": "string",
            "label": "API root/base URL"
          },
          {
            "field": "api_version",
            "type": "string",
            "label": "Current API version string"
          },
          {
            "field": "quickstart_url",
            "type": "string",
            "label": "Quickstart / hello-world URL"
          },
          {
            "field": "docs_url",
            "type": "string",
            "label": "Developer docs URL"
          },
          {
            "field": "api_reference_url",
            "type": "string",
            "label": "API reference URL"
          },
          {
            "field": "openapi_spec_url",
            "type": "string",
            "label": "OpenAPI spec URL"
          },
          {
            "field": "changelog_url",
            "type": "string",
            "label": "Changelog URL"
          },
          {
            "field": "status_page_url",
            "type": "string",
            "label": "Status page URL"
          },
          {
            "field": "notable_customers",
            "type": "string[]",
            "label": "Named public customers"
          },
          {
            "field": "launched_at",
            "type": "string",
            "label": "Launch date (ISO date or year)"
          }
        ]
      },
      {
        "action": "token",
        "label": "Optional - raise your rate limit",
        "method": "GET",
        "url": "https://apio.sh/api/feedback/token"
      }
    ]
  }
}