{
  "name": "Google Cloud Speech-to-Text",
  "slug": "google-speech-to-text",
  "website_url": "https://cloud.google.com/speech-to-text",
  "vendor_description": "\"Accurate voice typing and transcription powered by Gemini.\"",
  "categories": [
    "speech-to-text"
  ],
  "summary": "Google Cloud Speech-to-Text is a REST API from Google Cloud that converts audio to text, supporting synchronous, batch, and streaming transcription across 190+ language-region variants and 12 endpoint locations (global, multi-region, and regional). It covers call center transcription, live captioning with WebVTT and SRT output, speaker diarization, and multi-speaker meeting transcription. Pricing starts at $0.016 per minute with a free tier of 60 minutes per month, self-serve signup, and no sales call required. The service is in scope for Google Cloud's SOC 2 Type 2, ISO 27001, and PCI DSS attestations, supports HIPAA (under a BAA) and GDPR compliance, and ships official SDKs for Python, Node.js, Java, Go, C#, PHP, Ruby, and C++.",
  "capabilities": {
    "supported_actions": [
      "transcribe_synchronous",
      "transcribe_batch",
      "transcribe_streaming",
      "speaker_diarization",
      "automatic_punctuation",
      "spoken_punctuation",
      "spoken_emoji",
      "profanity_filtering",
      "word_timestamps",
      "word_confidence_scores",
      "language_detection",
      "model_adaptation",
      "custom_vocabulary_phrase_sets",
      "custom_classes",
      "srt_caption_generation",
      "webvtt_caption_generation",
      "recognizer_management",
      "dynamic_batch_recognition"
    ],
    "supported_regions": [
      "global",
      "us (US North America multi-region)",
      "eu (Europe multi-region)",
      "europe-west1",
      "europe-west2",
      "europe-west3",
      "europe-west4",
      "us-central1",
      "asia-southeast1",
      "asia-northeast1",
      "asia-south1",
      "northamerica-northeast1"
    ],
    "supported_languages": [
      "190+ language-region variants (BCP-47 codes) including: Afrikaans (af-ZA), Albanian (sq-AL), Amharic (am-ET), Arabic (20+ regional variants: ar-AE, ar-BH, ar-DZ, ar-EG, ar-IL, ar-IQ, ar-JO, ar-KW, ar-LB, ar-LY, ar-MA, ar-MR, ar-OM, ar-PS, ar-QA, ar-SA, ar-SY, ar-TN, ar-YE), Armenian (hy-AM), Assamese (as-IN), Azerbaijani (az-AZ), Bangla/Bengali (bn-BD, bn-IN), Basque (eu-ES), Bosnian (bs-BA), Bulgarian (bg-BG), Burmese (my-MM), Catalan (ca-ES), Chinese Cantonese (yue-Hant-HK), Chinese Mandarin (zh, zh-TW), Croatian (hr-HR), Czech (cs-CZ), Danish (da-DK), Dutch (nl-BE, nl-NL), English (en-AU, en-CA, en-GB, en-GH, en-HK, en-IE, en-IN, en-KE, en-NG, en-NZ, en-PH, en-PK, en-SG, en-TZ, en-US, en-ZA), Estonian (et-EE), Filipino (fil-PH), Finnish (fi-FI), French (fr-BE, fr-CA, fr-CH, fr-FR), Galician (gl-ES), Georgian (ka-GE), German (de-AT, de-CH, de-DE), Greek (el-GR), Gujarati (gu-IN), Hausa (ha-NG), Hebrew (iw-IL), Hindi (hi-IN), Hungarian (hu-HU), Icelandic (is-IS), Indonesian (id-ID), Italian (it-CH, it-IT), Japanese (ja-JP), Javanese (jv-ID), Kannada (kn-IN), Kazakh (kk-KZ), Khmer (km-KH), Korean (ko-KR), Lao (lo-LA), Latvian (lv-LV), Lithuanian (lt-LT), Macedonian (mk-MK), Malay (ms-MY), Malayalam (ml-IN), Marathi (mr-IN), Mongolian (mn-MN), Nepali (ne-NP), Norwegian (nb-NO), Pashto (ps-AF), Persian (fa-IR), Polish (pl-PL), Portuguese (pt-BR, pt-PT), Punjabi (pa-Guru-IN), Romanian (ro-RO), Russian (ru-RU), Serbian (sr-RS), Sinhala (si-LK), Slovak (sk-SK), Slovenian (sl-SI), Somali (so-SO), Spanish (es-AR, es-BO, es-CL, es-CO, es-CR, es-CU, es-DO, es-EC, es-ES, es-GT, es-HN, es-MX, es-NI, es-PA, es-PE, es-PR, es-PY, es-SV, es-US, es-UY, es-VE), Sundanese (su-ID), Swahili (sw-KE, sw-TZ), Swedish (sv-SE), Tamil (ta-IN, ta-LK, ta-MY, ta-SG), Telugu (te-IN), Thai (th-TH), Turkish (tr-TR), Ukrainian (uk-UA), Urdu (ur-IN, ur-PK), Uzbek (uz-UZ), Vietnamese (vi-VN), Xhosa (xh-ZA), Yoruba (yo-NG), Zulu (zu-ZA)"
    ],
    "input_types": [
      "audio/flac (FLAC)",
      "audio/l16 (LINEAR16 PCM)",
      "audio/mulaw (MULAW / μ-law)",
      "audio/mpeg (MP3)",
      "audio/amr (AMR narrowband, 8000 Hz)",
      "audio/amr-wb (AMR-WB wideband, 16000 Hz)",
      "audio/ogg; codecs=opus (OGG_OPUS)",
      "audio/speex (SPEEX_WITH_HEADER_BYTE, 16000 Hz)",
      "video/webm; codecs=opus (WEBM_OPUS)",
      "WAV (with LINEAR16 or MULAW encoding)",
      "Cloud Storage URI (gs://)",
      "local file upload (≤10 MB)",
      "live streaming via gRPC (bidirectional stream)"
    ],
    "output_types": [
      "JSON (transcription results with confidence scores)",
      "plain text transcript",
      "word-level timestamps",
      "word confidence scores",
      "speaker diarization tags",
      "SRT captions",
      "WebVTT captions",
      "Cloud Storage file output (TranscriptOutputConfig)"
    ],
    "webhooks_supported": false,
    "sandbox_available": false,
    "sdk_languages": [
      "Python",
      "Node.js",
      "Java",
      "Go",
      "C#",
      "PHP",
      "Ruby",
      "C++"
    ],
    "mcp_server_available": false
  },
  "integration": {
    "api_style": "rest",
    "base_url": "https://speech.googleapis.com",
    "api_version": "v2",
    "versioning_scheme": "url",
    "stability": "ga",
    "deprecation_policy_url": "https://cloud.google.com/terms/deprecation",
    "auth_methods": [
      "oauth2",
      "api_key"
    ],
    "auth_docs_url": "https://cloud.google.com/speech-to-text/docs/authentication",
    "idempotency_supported": null,
    "error_format": "vendor-specific (Google API error JSON: {error: {code, message, status}})",
    "webhook_signing": null,
    "webhook_events_url": null,
    "rate_limit_requests": 300,
    "rate_limit_window": "minute",
    "sdk_packages": [
      {
        "package": "google-cloud-speech",
        "language": "Python",
        "official": true,
        "repo_url": "https://github.com/googleapis/python-speech"
      },
      {
        "package": "@google-cloud/speech",
        "language": "Node.js",
        "official": true,
        "repo_url": "https://github.com/googleapis/nodejs-speech"
      },
      {
        "package": "com.google.cloud:google-cloud-speech",
        "language": "Java",
        "official": true,
        "repo_url": "https://github.com/googleapis/java-speech"
      },
      {
        "package": "cloud.google.com/go/speech/apiv2",
        "language": "Go",
        "official": true,
        "repo_url": "https://github.com/googleapis/google-cloud-go"
      },
      {
        "package": "Google.Cloud.Speech.V2",
        "language": "C#",
        "official": true,
        "repo_url": "https://github.com/googleapis/google-cloud-dotnet"
      },
      {
        "package": "google/cloud/speech",
        "language": "PHP",
        "official": true,
        "repo_url": "https://github.com/googleapis/google-cloud-php"
      },
      {
        "package": "google-cloud-speech",
        "language": "Ruby",
        "official": true,
        "repo_url": "https://github.com/GoogleCloudPlatform/google-cloud-ruby"
      },
      {
        "package": "google-cloud-cpp speech",
        "language": "C++",
        "official": true,
        "repo_url": "https://github.com/googleapis/google-cloud-cpp"
      }
    ],
    "mcp_url": null,
    "quickstart_url": "https://docs.cloud.google.com/speech-to-text/docs/quickstarts/transcribe-client-libraries"
  },
  "pricing": {
    "pricing_model": "usage_based",
    "has_published_pricing": true,
    "starting_price_usd": "0.0160",
    "price_basis": "minute",
    "free_tier_available": true,
    "free_tier_limit": "60 minutes/month",
    "free_tier_details": "60 minutes of audio per month free (recurring monthly allowance); applies to both streaming and batch recognition across V1 and V2 APIs.",
    "minimum_commitment": null,
    "self_serve_signup": true,
    "requires_sales_call": false,
    "requires_verification": false,
    "enterprise_plan_available": true,
    "price_points": [
      {
        "plan": "V2 API – Standard (unlogged)",
        "item": "Recognition – 0 to 500,000 min/month",
        "amount_usd": "0.0160",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Standard (unlogged)",
        "item": "Recognition – 500,000 to 1,000,000 min/month",
        "amount_usd": "0.0100",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Standard (unlogged)",
        "item": "Recognition – 1,000,000 to 2,000,000 min/month",
        "amount_usd": "0.0080",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Standard (unlogged)",
        "item": "Recognition – 2,000,000+ min/month",
        "amount_usd": "0.0040",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Standard (logged / data-logging opt-in)",
        "item": "Recognition (Logged) – 0 to 500,000 min/month",
        "amount_usd": "0.0120",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Standard (logged / data-logging opt-in)",
        "item": "Recognition (Logged) – 2,000,000+ min/month",
        "amount_usd": "0.0030",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Dynamic Batch",
        "item": "Dynamic Batch Recognition (unlogged)",
        "amount_usd": "0.0030",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Dynamic Batch",
        "item": "Dynamic Batch Recognition (logged)",
        "amount_usd": "0.0023",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V2 API – Free tier",
        "item": "Monthly free allowance (all recognition types)",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "minute (first 60 min/month)",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V1 API – with data logging",
        "item": "Speech recognition with data logging",
        "amount_usd": "0.0160",
        "amount_percent": null,
        "per": "minute (above 60 free min/month)",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V1 API – without data logging",
        "item": "Speech recognition without data logging",
        "amount_usd": "0.0240",
        "amount_percent": null,
        "per": "minute (above 60 free min/month)",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V1 API – Medical (with data logging)",
        "item": "Medical dictation",
        "amount_usd": "0.0780",
        "amount_percent": null,
        "per": "minute (above 60 free min/month)",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      },
      {
        "plan": "V1 API – Medical (with data logging)",
        "item": "Medical conversation",
        "amount_usd": "0.0780",
        "amount_percent": null,
        "per": "minute (above 60 free min/month)",
        "currency": "USD",
        "source_url": "https://cloud.google.com/speech-to-text/pricing"
      }
    ]
  },
  "compliance": {
    "soc2": "type_2",
    "hipaa": true,
    "gdpr": true,
    "iso_27001": true,
    "pci_dss": true,
    "sla_published": true,
    "sla_url": "https://cloud.google.com/speech-to-text/sla",
    "data_retention_policy_url": "https://docs.cloud.google.com/speech-to-text/docs/v1/data-usage-faq",
    "documented_rate_limits": "V2 API: Resource requests 100/60s; Operation requests 150/60s; Synchronous recognition 300/60s; Batch recognition 150/60s (all per region). V1 API: 900 recognition requests per 60 seconds per project (global). Daily audio processing limit: 480 hours per day. Synchronous audio max: ~1 min. Streaming session max: ~5 min. Async audio max: ~480 min. Local file max: 10 MB.",
    "known_restrictions": [
      "Synchronous recognition limited to ~1 minute of audio",
      "Streaming sessions limited to ~5 minutes; session must be restarted for longer audio",
      "Asynchronous audio over ~1 minute must be referenced via a Cloud Storage URI (gs://)",
      "Local file upload limit: 10 MB per request; no file-size limit for audio referenced via Cloud Storage URIs (audio duration limits still apply)",
      "Multi-channel audio billed per channel (stereo = 2x rate)",
      "Maximum 5,000 phrases per adaptation request; 100,000 total characters; 100 characters per phrase",
      "900 recognition requests per 60 seconds per project on V1 (soft quota, adjustable)",
      "480 hours of audio per day (daily quota; resets at midnight Pacific Time, PST/PDT)",
      "Custom speech model training is an allowlist-only feature",
      "No native webhook/push-notification for async job completion; polling or Cloud Storage triggers required",
      "HIPAA users must not opt into the data logging program",
      "Medical models (medical_conversation, medical_dictation) are V1 API only"
    ]
  },
  "developer": {
    "docs_url": "https://docs.cloud.google.com/",
    "api_reference_url": null,
    "openapi_spec_url": null,
    "postman_collection_url": null,
    "changelog_url": null,
    "status_page_url": "https://status.cloud.google.com",
    "llms_txt_url": null,
    "markdown_docs_url": null,
    "rendering": "static"
  },
  "adoption": {
    "launched_at": "2016-01-01",
    "ga_date": "2017-04-18",
    "github_stars": null,
    "github_stars_at": null,
    "notable_customers": [
      "HubSpot",
      "InteractiveTel",
      "Embodied",
      "iGenius",
      "LogMeIn"
    ]
  },
  "scores": {
    "agent_friendliness": 20,
    "pricing_transparency": 100,
    "setup_speed": 85,
    "docs_quality": 15,
    "procurement_friction": 100,
    "trust_readiness": 100,
    "best_for": [
      "Prototypes and side projects - free to start, no sales call",
      "Regulated or enterprise workloads - compliance attestations and an enterprise plan",
      "Teams needing broad API coverage out of the box"
    ],
    "avoid_if": []
  },
  "sources": [
    {
      "field": "vendor_description",
      "url": "https://cloud.google.com/speech-to-text",
      "excerpt": "Accurate voice typing and transcription powered by Gemini.",
      "confidence": "high"
    },
    {
      "field": "categories",
      "url": "https://cloud.google.com/text-to-speech/pricing",
      "excerpt": "Review pricing for Text-to-Speech | Google Cloud — Text-to-Speech is a separate Google Cloud product with separate pricing.",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/speech-to-text-supported-languages",
      "excerpt": "Cloud Speech-to-Text V2 supports 190+ language variants across multiple regions and models. Language is specified within a recognition request's languageCodes parameter.",
      "confidence": "high"
    },
    {
      "field": "free_tier_available",
      "url": "https://brasstranscripts.com/blog/google-cloud-speech-to-text-pricing-2025-gcp-integration-costs",
      "excerpt": "60 minutes/month ongoing free tier for Speech-to-Text",
      "confidence": "high"
    },
    {
      "field": "pricing_model",
      "url": "https://cloud.google.com/blog/products/ai-machine-learning/google-cloud-speech-to-text-v2-api",
      "excerpt": "Standard (Real-time/Batch): $0.016 per minute (down from $0.024)",
      "confidence": "high"
    },
    {
      "field": "categories",
      "url": "https://cloud.google.com/speech-to-text",
      "excerpt": "Accurate voice typing and transcription powered by Gemini. Speech-to-Text API. Transcribe audio to text with a simple API call.",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/speech-to-text-supported-languages",
      "excerpt": "This page lists all languages supported by Cloud Speech-to-Text.",
      "confidence": "high"
    },
    {
      "field": "free_tier_available",
      "url": "https://cloud.google.com/speech-to-text/pricing",
      "excerpt": "All users can send up to 60 minutes of audio to Cloud Speech-to-Text for free each month.",
      "confidence": "high"
    },
    {
      "field": "pricing_model",
      "url": "https://cloud.google.com/speech-to-text/pricing",
      "excerpt": "Speech-to-Text is priced based on the amount of audio successfully processed by the service each month, measured in increments of one second.",
      "confidence": "high"
    },
    {
      "field": "has_published_pricing",
      "url": "https://cloud.google.com/speech-to-text/pricing",
      "excerpt": "Google has lowered the cost of real-time and batch transcription from $0.024 per minute to $0.016 per minute.",
      "confidence": "high"
    },
    {
      "field": "soc2",
      "url": "https://cloud.google.com/security/compliance/services-in-scope",
      "excerpt": "SOC 1, 2, 3 Reports ... Speech recognition and transcription across 125 languages",
      "confidence": "high"
    },
    {
      "field": "hipaa",
      "url": "https://cloud.google.com/security/compliance/hipaa",
      "excerpt": "If you are using Cloud Speech-to-Text, and you have entered into a BAA with Google covering any PHI obligations under HIPAA, then you should not opt into the data logging program.",
      "confidence": "high"
    },
    {
      "field": "iso_27001",
      "url": "https://cloud.google.com/security/compliance/services-in-scope",
      "excerpt": "ISO 27001, 27017, 27018 ... Speech-to-Text",
      "confidence": "high"
    },
    {
      "field": "pci_dss",
      "url": "https://cloud.google.com/security/compliance/services-in-scope",
      "excerpt": "PCI DSS Certification ... Speech recognition and transcription across 125 languages",
      "confidence": "high"
    },
    {
      "field": "sla_published",
      "url": "https://cloud.google.com/speech-to-text/sla",
      "excerpt": "Google Cloud Speech-to-Text provides a monthly uptime percentage of >= 99.9%. If Google does not meet the SLO, and if the Customer meets its obligations under this SLA, the Customer will be eligible to receive Financial Credits.",
      "confidence": "high"
    },
    {
      "field": "sandbox_available",
      "url": "https://cloud.google.com/speech-to-text/pricing",
      "excerpt": "All users can send up to 60 minutes of audio to Cloud Speech-to-Text for free each month. — this is a live-environment free tier, not a dedicated sandbox environment.",
      "confidence": "high"
    },
    {
      "field": "has_published_pricing",
      "url": "https://cloud.google.com/blog/products/ai-machine-learning/google-cloud-speech-to-text-v2-api",
      "excerpt": "Standard volume tiers allow costs as low as $0.004 per minute",
      "confidence": "high"
    },
    {
      "field": "soc2",
      "url": "https://cloud.google.com/security/compliance/soc-2",
      "excerpt": "Below are Google Cloud services that are in scope for SOC 2.",
      "confidence": "high"
    },
    {
      "field": "hipaa",
      "url": "https://cloud.google.com/terms/hipaa-baa",
      "excerpt": "The Google Cloud BAA covers Google Cloud's entire infrastructure (all regions, all zones, all network paths, all points of presence), and the services listed below.",
      "confidence": "high"
    },
    {
      "field": "iso_27001",
      "url": "https://cloud.google.com/security/compliance/iso-27001",
      "excerpt": "Google Cloud is ISO/IEC 27001:2022 compliant",
      "confidence": "high"
    },
    {
      "field": "gdpr",
      "url": "https://cloud.google.com/security/compliance",
      "excerpt": "Google Cloud supports GDPR compliance requirements.",
      "confidence": "high"
    },
    {
      "field": "webhooks_supported",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/overview",
      "excerpt": "Asynchronous requests use long-running operations that require periodic polling for results rather than push-based notifications.",
      "confidence": "high"
    },
    {
      "field": "supported_actions",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/concepts",
      "excerpt": "Transcribe long audio files ... Transcribe streaming audio ... Detect different speakers ... Automatically detect spoken language ... Enable automatic punctuation ... Enable spoken punctuation and spoken emoji ... Enable profanity filtering ... Generate WebVTT & SRT Captions ... Improve transcription with model adaptation",
      "confidence": "high"
    },
    {
      "field": "sdk_languages",
      "url": "https://github.com/googleapis/google-cloud-cpp",
      "excerpt": "google-cloud-cpp speech — official C++ client library for Google Cloud APIs including Speech-to-Text",
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/v1/quotas",
      "excerpt": "Recognition requests: 900 per 60 seconds ... Adaptation resource requests: 10 per 60 seconds ... 480 hours of audio per day",
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://costbench.com/software/ai-transcription-apis/google-speech-to-text/",
      "excerpt": "Multi-channel audio is billed per channel, effectively doubling stereo recordings to $0.032/min",
      "confidence": "high"
    },
    {
      "field": "supported_regions",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/locations",
      "excerpt": "In Cloud Speech-to-Text API V2, there are different availabilities in different regions. To understand the availabilities, use the Locations API.",
      "confidence": "medium"
    },
    {
      "field": "base_url",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/reference/rest",
      "excerpt": "Base URL: https://speech.googleapis.com",
      "confidence": "high"
    },
    {
      "field": "versioning_scheme",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/reference/rest",
      "excerpt": "Uses semantic versioning with stability indicators (v1=stable, v1p1beta1=beta, v2=current). Converts audio to text by applying powerful neural network models.",
      "confidence": "high"
    },
    {
      "field": "auth_methods",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/authentication",
      "excerpt": "To authenticate calls to Google Cloud APIs, client libraries support Application Default Credentials (ADC); the libraries look for credentials in a set of defined locations and use those credentials to authenticate requests to the API.",
      "confidence": "high"
    },
    {
      "field": "auth_docs_url",
      "url": "https://cloud.google.com/speech-to-text/docs/authentication",
      "excerpt": "Authenticate to Cloud STT | Cloud Speech-to-Text | Google Cloud Documentation",
      "confidence": "high"
    },
    {
      "field": "quickstart_url",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/quickstarts/transcribe-client-libraries",
      "excerpt": "Transcribe speech to text by using client libraries | Cloud Speech-to-Text | Google Cloud Documentation",
      "confidence": "high"
    },
    {
      "field": "rate_limit_window",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/quotas",
      "excerpt": "Resource requests: 100 per 60 seconds; Operation requests: 150 per 60 seconds; Synchronous recognition: 300 per 60 seconds; Batch recognition: 150 per 60 seconds",
      "confidence": "high"
    },
    {
      "field": "price_basis",
      "url": "https://cloud.google.com/speech-to-text/pricing",
      "excerpt": "Speech-to-Text is priced based on the amount of audio successfully processed by the service each month, measured in increments of one second.",
      "confidence": "high"
    },
    {
      "field": "sla_url",
      "url": "https://cloud.google.com/speech-to-text/sla",
      "excerpt": "Speech-to-Text Service Level Agreement (SLA) | Google Cloud",
      "confidence": "high"
    },
    {
      "field": "ga_date",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/release-notes",
      "excerpt": "First GA Release: April 18, 2017 — Release of Cloud Speech-to-Text v1.",
      "confidence": "high"
    },
    {
      "field": "notable_customers",
      "url": "https://cloud.google.com/blog/products/ai-machine-learning/learn-how-google-cloud-customers-use-speech-ai-in-innovative-ways",
      "excerpt": "InteractiveTel uses the Speech API to transcribe phone calls for automobile dealers; HubSpot uses the Speech-to-Text API as part of their Conversation Intelligence products; Embodied uses the Speech API for Moxie, an interactive robot for children's social-emotional learning.",
      "confidence": "high"
    },
    {
      "field": "deprecation_policy_url",
      "url": "https://cloud.google.com/terms/deprecation",
      "excerpt": "Google Cloud Platform Services Subject to Deprecation | Google Cloud",
      "confidence": "high"
    },
    {
      "field": "api_style",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/speech-to-text-requests",
      "excerpt": "Streaming Recognition (gRPC only) performs recognition on audio data provided within a gRPC bi-directional stream. The service uses REST for batch/sync and gRPC for streaming; primary documented interface is REST.",
      "confidence": "high"
    },
    {
      "field": "sdk_languages",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/libraries",
      "excerpt": "Client libraries make it easier to access Google Cloud APIs from a supported language ... C# ... Go ... Java ... Node.js ... PHP ... Python ... Ruby",
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/quotas",
      "excerpt": "Resource requests: 100 per 60 seconds; Operation requests: 150 per 60 seconds; Synchronous recognition: 300 per 60 seconds; Batch recognition: 150 per 60 seconds",
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://docs.cloud.google.com/speech-to-text/quotas",
      "excerpt": "Synchronous: ~1 Minute ... Asynchronous: ~480 Minutes (audio over ~1 minute requires Cloud Storage URI) ... Streaming: ~5 Minutes ... Local files: 10 MB maximum per request",
      "confidence": "high"
    },
    {
      "field": "mcp_server_available",
      "url": "https://docs.cloud.google.com/mcp/supported-products",
      "excerpt": "Google Cloud Speech-to-Text is not listed as a supported product for Google Cloud MCP servers.",
      "confidence": "high"
    },
    {
      "field": "supported_regions",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/speech-to-text-supported-languages",
      "excerpt": "asia-northeast1, asia-south1, asia-southeast1, eu, europe-west2, europe-west3, europe-west4, global, northamerica-northeast1, us, us-central1",
      "confidence": "medium"
    },
    {
      "field": "api_version",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/reference/rest",
      "excerpt": "The service provides three API versions: v2 (current/stable), v1p1beta1 (beta), v1 (legacy)",
      "confidence": "high"
    },
    {
      "field": "stability",
      "url": "https://cloud.google.com/blog/products/ai-machine-learning/google-cloud-speech-to-text-v2-api",
      "excerpt": "August 9, 2023 - Speech-to-Text V2 API and Chirp reached General Availability",
      "confidence": "high"
    },
    {
      "field": "auth_methods",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/authentication",
      "excerpt": "Like any principal, a service account can authenticate itself to Google, obtain an OAuth 2.0 access token, and call Google APIs.",
      "confidence": "high"
    },
    {
      "field": "sdk_packages",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/libraries",
      "excerpt": "Python: google-cloud-speech | pip install --upgrade google-cloud-speech | github.com/googleapis/python-speech; Node.js: @google-cloud/speech | npm install @google-cloud/speech | github.com/googleapis/nodejs-speech; Java: google-cloud-speech | com.google.cloud:google-cloud-speech:4.88.0 | github.com/googleapis/java-speech",
      "confidence": "high"
    },
    {
      "field": "rate_limit_requests",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/quotas",
      "excerpt": "Synchronous recognition: 300 per 60 seconds (per region)",
      "confidence": "high"
    },
    {
      "field": "starting_price_usd",
      "url": "https://cloud.google.com/blog/products/ai-machine-learning/google-cloud-speech-to-text-v2-api",
      "excerpt": "Standard (Real-time/Batch): $0.016 per minute (down from $0.024)",
      "confidence": "high"
    },
    {
      "field": "free_tier_limit",
      "url": "https://cloud.google.com/speech-to-text/pricing",
      "excerpt": "All users can send up to 60 minutes of audio to Cloud Speech-to-Text for free each month.",
      "confidence": "high"
    },
    {
      "field": "data_retention_policy_url",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/v1/data-usage-faq",
      "excerpt": "Without opt-in to data logging, Google does not use any of your content for any purpose except to provide you with the Cloud Speech-to-Text API service. Input audio data is not stored by the Cloud Speech-to-Text API service (async transcripts retained approximately 5 days).",
      "confidence": "high"
    },
    {
      "field": "launched_at",
      "url": "https://www.infoq.com/news/2017/05/Google-Cloud-Speech-API/",
      "excerpt": "The API was launched, in open beta, last summer (referring to summer 2016)",
      "confidence": "medium"
    },
    {
      "field": "error_format",
      "url": "https://docs.cloud.google.com/speech-to-text/docs/error-messages",
      "excerpt": "{\"error\": {\"code\": 403, \"message\": \"The request is missing a valid API key.\", \"status\": \"PERMISSION_DENIED\"}}",
      "confidence": "high"
    },
    {
      "field": "mcp_url",
      "url": "https://docs.cloud.google.com/mcp/supported-products",
      "excerpt": "No Speech-to-Text MCP server listed in the 50+ Google Cloud MCP servers available.",
      "confidence": "high"
    }
  ],
  "fields_not_found": [
    "exact V1 medical model per-minute pricing (could not be confirmed from the live pricing page; page rendering issues prevented full table extraction)",
    "complete static list of all V2 supported regions (Google directs to Locations API)",
    "SLA uptime percentage (could not be confirmed from the live SLA page; page truncated; 99.9% widely cited)",
    "idempotency_supported",
    "webhook_signing",
    "webhook_events_url",
    "mcp_url"
  ],
  "source_confidence": "high",
  "last_verified_at": "2026-06-21T00:00:00.000Z",
  "contribute": {
    "note": "This data is crowd-editable. Suggest corrections or leave a review via these endpoints - no auth required, requests are rate-limited, and every submission is reviewed before it goes live. For a field edit, {field} is any key in this response and a citation is required.",
    "endpoints": [
      {
        "action": "review",
        "label": "Leave a review or comment",
        "method": "POST",
        "url": "https://apio.sh/api/feedback/google-speech-to-text",
        "example_body": {
          "kind": "review",
          "rating": 5,
          "body": "Your experience with this API…"
        }
      },
      {
        "action": "field_edit",
        "label": "Suggest a correction to a field (cite a source)",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/google-speech-to-text/{field}",
        "example_body": {
          "value": "corrected value",
          "citations": [
            {
              "url": "https://source.example/page",
              "excerpt": "supporting quote"
            }
          ],
          "note": "what changed and why"
        }
      },
      {
        "action": "new_api",
        "label": "Suggest a new API to add (only name is required - send as much as you can cite)",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/api",
        "example_body": {
          "value": {
            "name": "Acme Email API",
            "website_url": "https://acme.example",
            "vendor_name": "Acme",
            "categories": [
              "email"
            ],
            "pricing_model": "usage_based",
            "has_published_pricing": true,
            "free_tier_available": true,
            "price_points": [
              {
                "plan": "Pay as you go",
                "item": "1,000 emails",
                "amount_usd": 1,
                "per": "1,000 emails",
                "source_url": "https://acme.example/pricing"
              }
            ],
            "soc2": "type_2",
            "docs_url": "https://docs.acme.example"
          },
          "citations": [
            {
              "url": "https://acme.example/pricing",
              "excerpt": "$1 per 1,000 emails"
            }
          ]
        },
        "value_schema": [
          {
            "field": "name",
            "type": "string",
            "label": "Product name (the only required field)"
          },
          {
            "field": "website_url",
            "type": "string",
            "label": "Marketing website URL"
          },
          {
            "field": "vendor_name",
            "type": "string",
            "label": "Company/vendor name behind the product"
          },
          {
            "field": "vendor_description",
            "type": "string",
            "label": "One-line description, quoted from the vendor"
          },
          {
            "field": "categories",
            "type": "string[]",
            "label": "Category/leaf slugs it belongs to, e.g. [\"email\",\"sms\"]"
          },
          {
            "field": "primary_use_cases",
            "type": "string[]",
            "label": "What it's used for"
          },
          {
            "field": "supported_actions",
            "type": "string[]",
            "label": "Concrete API actions/capabilities"
          },
          {
            "field": "supported_regions",
            "type": "string[]",
            "label": "Countries/regions/data-residency"
          },
          {
            "field": "supported_languages",
            "type": "string[]",
            "label": "Human/spoken languages supported"
          },
          {
            "field": "input_types",
            "type": "string[]",
            "label": "Accepted input types/formats"
          },
          {
            "field": "output_types",
            "type": "string[]",
            "label": "Produced output types/formats"
          },
          {
            "field": "webhooks_supported",
            "type": "bool",
            "label": "Supports webhooks?"
          },
          {
            "field": "sandbox_available",
            "type": "bool",
            "label": "Dedicated sandbox/test mode?"
          },
          {
            "field": "sdk_languages",
            "type": "string[]",
            "label": "Languages with an official SDK"
          },
          {
            "field": "mcp_server_available",
            "type": "bool",
            "label": "Official MCP server?"
          },
          {
            "field": "pricing_model",
            "type": "enum",
            "label": "Pricing model",
            "values": [
              "usage_based",
              "subscription",
              "seat_based",
              "hybrid",
              "contact_sales"
            ]
          },
          {
            "field": "has_published_pricing",
            "type": "bool",
            "label": "Concrete prices published publicly?"
          },
          {
            "field": "free_tier_available",
            "type": "bool",
            "label": "Recurring/perpetual free tier (not a trial)?"
          },
          {
            "field": "free_tier_details",
            "type": "string",
            "label": "What the free tier includes"
          },
          {
            "field": "minimum_commitment",
            "type": "string",
            "label": "Any stated minimum spend/commitment"
          },
          {
            "field": "self_serve_signup",
            "type": "bool",
            "label": "Get an API key without talking to sales?"
          },
          {
            "field": "requires_sales_call",
            "type": "bool",
            "label": "Does going live require sales?"
          },
          {
            "field": "enterprise_plan_available",
            "type": "bool",
            "label": "Named enterprise tier?"
          },
          {
            "field": "starting_price_usd",
            "type": "number",
            "label": "Lowest published paid entry price (USD number)"
          },
          {
            "field": "price_basis",
            "type": "string",
            "label": "Unit the starting price is per, e.g. '1,000 emails'"
          },
          {
            "field": "free_tier_limit",
            "type": "string",
            "label": "Free-tier ceiling in literal terms"
          },
          {
            "field": "price_points",
            "type": "object[]",
            "label": "Structured prices: [{plan,item,amount_usd,amount_percent,per,source_url}]"
          },
          {
            "field": "soc2",
            "type": "enum",
            "label": "SOC 2 status",
            "values": [
              "type_2",
              "type_1",
              "in_progress",
              "none",
              "unknown"
            ]
          },
          {
            "field": "hipaa",
            "type": "bool",
            "label": "HIPAA (e.g. BAA available)?"
          },
          {
            "field": "gdpr",
            "type": "bool",
            "label": "GDPR compliance stated?"
          },
          {
            "field": "iso_27001",
            "type": "bool",
            "label": "ISO 27001 certified?"
          },
          {
            "field": "pci_dss",
            "type": "bool",
            "label": "PCI DSS compliant?"
          },
          {
            "field": "sla_published",
            "type": "bool",
            "label": "Published SLA / uptime commitment?"
          },
          {
            "field": "documented_rate_limits",
            "type": "string",
            "label": "Documented rate limits, quoted"
          },
          {
            "field": "known_restrictions",
            "type": "string[]",
            "label": "Notable documented restrictions/limits"
          },
          {
            "field": "auth_methods",
            "type": "string[]",
            "label": "Auth methods",
            "values": [
              "api_key",
              "oauth2",
              "jwt",
              "basic",
              "hmac_signature",
              "mtls",
              "session"
            ]
          },
          {
            "field": "api_style",
            "type": "enum",
            "label": "Primary API style",
            "values": [
              "rest",
              "graphql",
              "grpc",
              "soap",
              "websocket"
            ]
          },
          {
            "field": "base_url",
            "type": "string",
            "label": "API root/base URL"
          },
          {
            "field": "api_version",
            "type": "string",
            "label": "Current API version string"
          },
          {
            "field": "quickstart_url",
            "type": "string",
            "label": "Quickstart / hello-world URL"
          },
          {
            "field": "docs_url",
            "type": "string",
            "label": "Developer docs URL"
          },
          {
            "field": "api_reference_url",
            "type": "string",
            "label": "API reference URL"
          },
          {
            "field": "openapi_spec_url",
            "type": "string",
            "label": "OpenAPI spec URL"
          },
          {
            "field": "changelog_url",
            "type": "string",
            "label": "Changelog URL"
          },
          {
            "field": "status_page_url",
            "type": "string",
            "label": "Status page URL"
          },
          {
            "field": "notable_customers",
            "type": "string[]",
            "label": "Named public customers"
          },
          {
            "field": "launched_at",
            "type": "string",
            "label": "Launch date (ISO date or year)"
          }
        ]
      },
      {
        "action": "token",
        "label": "Optional - raise your rate limit",
        "method": "GET",
        "url": "https://apio.sh/api/feedback/token"
      }
    ]
  }
}