{
  "name": "OpenAI Speech-to-Text",
  "slug": "openai-transcribe",
  "website_url": "https://platform.openai.com/docs/guides/speech-to-text",
  "vendor_description": "\"The Audio API provides two speech-to-text endpoints, transcriptions and translations, based on our state-of-the-art open source large-v2 Whisper model.\"",
  "categories": [
    "speech-to-text"
  ],
  "summary": "OpenAI Speech-to-Text is a REST API offering batch, streaming, and real-time audio transcription, speaker diarization, language detection, and translation to English, built on Whisper and newer gpt-4o-based models. It is priced at $0.003 per minute on a self-serve, pay-as-you-go basis with no sales call required, and an enterprise plan is available. The API ships official SDKs for Python, Node.js, Java, Go, Ruby, and .NET, and holds SOC 2 Type II, HIPAA, GDPR, ISO 27001, and PCI DSS certifications.",
  "capabilities": {
    "supported_actions": [
      "transcribe_batch",
      "transcribe_streaming",
      "transcribe_realtime",
      "translation_to_english",
      "speaker_diarization",
      "word_timestamps",
      "segment_timestamps",
      "language_detection",
      "prompting_for_accuracy",
      "logprobs_confidence_scoring",
      "voice_activity_detection"
    ],
    "supported_regions": [],
    "supported_languages": [
      "99+ languages including Afrikaans, Arabic, Armenian, Azerbaijani, Basque, Belarusian, Bosnian, Breton, Bulgarian, Catalan, Chinese, Croatian, Czech, Danish, Dutch, English, Estonian, Faroese, Finnish, French, Galician, German, Greek, Gujarati, Haitian Creole, Hawaiian, Hebrew, Hindi, Hungarian, Icelandic, Indonesian, Italian, Japanese, Javanese, Kannada, Kazakh, Khmer, Korean, Lao, Latin, Latvian, Lingala, Lithuanian, Luxembourgish, Macedonian, Malagasy, Malay, Malayalam, Maltese, Maori, Marathi, Mongolian, Myanmar, Nepali, Norwegian, Nynorsk, Occitan, Pashto, Persian, Polish, Portuguese, Punjabi, Romanian, Russian, Sanskrit, Serbian, Shona, Sindhi, Sinhala, Slovak, Slovenian, Somali, Spanish, Sundanese, Swahili, Swedish, Tagalog, Tajik, Tamil, Tatar, Telugu, Thai, Tibetan, Turkish, Turkmen, Ukrainian, Urdu, Uzbek, Vietnamese, Welsh, Yiddish, Yoruba"
    ],
    "input_types": [
      "audio/mp3",
      "audio/mp4",
      "audio/mpeg",
      "audio/mpga",
      "audio/m4a",
      "audio/wav",
      "audio/webm",
      "WebSocket (realtime streaming)",
      "WebRTC (realtime browser)"
    ],
    "output_types": [
      "JSON",
      "plain text",
      "SRT",
      "VTT",
      "verbose JSON",
      "diarized JSON",
      "word timestamps",
      "segment timestamps",
      "streaming transcript deltas"
    ],
    "webhooks_supported": false,
    "sandbox_available": false,
    "sdk_languages": [
      "Python",
      "Node.js",
      "Java",
      "Go",
      "Ruby",
      ".NET"
    ],
    "mcp_server_available": true
  },
  "integration": {
    "api_style": "rest",
    "base_url": "https://api.openai.com/v1",
    "api_version": "v1",
    "versioning_scheme": "url",
    "stability": "ga",
    "deprecation_policy_url": "https://developers.openai.com/api/docs/deprecations",
    "auth_methods": [
      "api_key"
    ],
    "auth_docs_url": "https://developers.openai.com/api/docs/quickstart",
    "idempotency_supported": null,
    "error_format": "vendor-specific",
    "webhook_signing": "hmac_sha256",
    "webhook_events_url": "https://developers.openai.com/api/docs/guides/webhooks",
    "rate_limit_requests": 500,
    "rate_limit_window": "minute",
    "sdk_packages": [
      {
        "package": "openai",
        "language": "Python",
        "official": true,
        "repo_url": "https://github.com/openai/openai-python"
      },
      {
        "package": "openai",
        "language": "Node.js",
        "official": true,
        "repo_url": "https://github.com/openai/openai-node"
      },
      {
        "package": "com.openai:openai-java",
        "language": "Java",
        "official": true,
        "repo_url": "https://github.com/openai/openai-java"
      },
      {
        "package": "github.com/openai/openai-go",
        "language": "Go",
        "official": true,
        "repo_url": "https://github.com/openai/openai-go"
      },
      {
        "package": "openai",
        "language": "Ruby",
        "official": true,
        "repo_url": "https://github.com/openai/openai-ruby"
      },
      {
        "package": "OpenAI",
        "language": ".NET",
        "official": true,
        "repo_url": null
      }
    ],
    "mcp_url": "https://developers.openai.com/mcp",
    "quickstart_url": "https://developers.openai.com/api/docs/guides/speech-to-text"
  },
  "pricing": {
    "pricing_model": "usage_based",
    "has_published_pricing": true,
    "starting_price_usd": "0.0030",
    "price_basis": "minute",
    "free_tier_available": false,
    "free_tier_limit": null,
    "free_tier_details": null,
    "minimum_commitment": null,
    "self_serve_signup": true,
    "requires_sales_call": false,
    "requires_verification": false,
    "enterprise_plan_available": true,
    "price_points": [
      {
        "plan": null,
        "item": "whisper-1 transcription",
        "amount_usd": "0.0060",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/models/whisper-1"
      },
      {
        "plan": null,
        "item": "gpt-4o-transcribe audio input",
        "amount_usd": "2.5000",
        "amount_percent": null,
        "per": "1M tokens",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/pricing"
      },
      {
        "plan": null,
        "item": "gpt-4o-transcribe text output",
        "amount_usd": "10.0000",
        "amount_percent": null,
        "per": "1M tokens",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/pricing"
      },
      {
        "plan": null,
        "item": "gpt-4o-transcribe estimated cost",
        "amount_usd": "0.0060",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/pricing"
      },
      {
        "plan": null,
        "item": "gpt-4o-mini-transcribe audio input (snapshots: gpt-4o-mini-transcribe-2025-12-15, gpt-4o-mini-transcribe-2025-03-20)",
        "amount_usd": "1.2500",
        "amount_percent": null,
        "per": "1M tokens",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/models/gpt-4o-mini-transcribe"
      },
      {
        "plan": null,
        "item": "gpt-4o-mini-transcribe text output",
        "amount_usd": "5.0000",
        "amount_percent": null,
        "per": "1M tokens",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/models/gpt-4o-mini-transcribe"
      },
      {
        "plan": null,
        "item": "gpt-4o-mini-transcribe estimated cost",
        "amount_usd": "0.0030",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/pricing"
      },
      {
        "plan": null,
        "item": "gpt-4o-transcribe-diarize audio input (speaker diarization)",
        "amount_usd": "2.5000",
        "amount_percent": null,
        "per": "1M tokens",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/models/gpt-4o-transcribe-diarize"
      },
      {
        "plan": null,
        "item": "gpt-4o-transcribe-diarize text output (speaker diarization)",
        "amount_usd": "10.0000",
        "amount_percent": null,
        "per": "1M tokens",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/models/gpt-4o-transcribe-diarize"
      },
      {
        "plan": null,
        "item": "gpt-4o-transcribe-diarize estimated cost (speaker diarization)",
        "amount_usd": "0.0060",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://costgoat.com/pricing/openai-transcription"
      },
      {
        "plan": null,
        "item": "gpt-realtime-whisper streaming transcription (audio duration)",
        "amount_usd": "0.0170",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/models/gpt-realtime-whisper"
      },
      {
        "plan": null,
        "item": "gpt-realtime-translate streaming speech translation (audio duration)",
        "amount_usd": "0.0340",
        "amount_percent": null,
        "per": "minute",
        "currency": "USD",
        "source_url": "https://developers.openai.com/api/docs/pricing"
      }
    ]
  },
  "compliance": {
    "soc2": "type_2",
    "hipaa": true,
    "gdpr": true,
    "iso_27001": true,
    "pci_dss": true,
    "sla_published": true,
    "sla_url": "https://openai.com/api-scale-tier/",
    "data_retention_policy_url": "https://developers.openai.com/api/docs/guides/your-data",
    "documented_rate_limits": "whisper-1: Free 3 RPM / 200 RPD; Tier 1: 500 RPM; Tier 2: 2,500 RPM; Tier 3: 5,000 RPM; Tier 4: 7,500 RPM; Tier 5: 10,000 RPM. gpt-4o-transcribe / gpt-4o-transcribe-diarize: Tier 1: 500 RPM / 10K TPM; Tier 2: 2,000 RPM / 100K TPM; Tier 3: 5,000 RPM / 400K TPM; Tier 4: 10,000 RPM / 2M TPM; Tier 5: 10,000 RPM / 6M TPM. gpt-4o-mini-transcribe: Tier 1: 500 RPM / 50K TPM; Tier 2: 2,000 RPM / 150K TPM; Tier 3: 5,000 RPM / 600K TPM; Tier 4: 10,000 RPM / 2M TPM; Tier 5: 10,000 RPM / 8M TPM. gpt-realtime-whisper: Tier 1: 100 min/min; Tier 2: 350 min/min; Tier 3: 650 min/min; Tier 4: 1,000 min/min; Tier 5: 1,300 min/min.",
    "known_restrictions": [
      "Maximum file upload size: 25 MB",
      "Translation endpoint outputs English only (whisper-1 only; not available on gpt-4o-transcribe models)",
      "Speaker diarization (gpt-4o-transcribe-diarize) requires chunking_strategy for audio longer than 30 seconds",
      "gpt-4o-transcribe-diarize does not support prompts, logprobs, or timestamp_granularities[]",
      "Prompt steering not supported for gpt-realtime-whisper in realtime sessions",
      "Context window: 16,000 tokens; max output: 2,000 tokens (gpt-4o-transcribe models)",
      "gpt-4o-transcribe and gpt-4o-mini-transcribe output JSON or plain text only (not SRT/VTT)"
    ]
  },
  "developer": {
    "docs_url": "https://developers.openai.com/api/docs",
    "api_reference_url": "https://platform.openai.com/api/reference/overview",
    "openapi_spec_url": null,
    "postman_collection_url": null,
    "changelog_url": null,
    "status_page_url": null,
    "llms_txt_url": null,
    "markdown_docs_url": "https://platform.openai.com/docs/guides/speech-to-text.md",
    "rendering": "static"
  },
  "adoption": {
    "launched_at": "2023-03-01",
    "ga_date": "2025-04-01",
    "github_stars": null,
    "github_stars_at": null,
    "notable_customers": [
      "Speak"
    ]
  },
  "scores": {
    "agent_friendliness": 50,
    "pricing_transparency": 85,
    "setup_speed": 60,
    "docs_quality": 50,
    "procurement_friction": 85,
    "trust_readiness": 100,
    "best_for": [
      "Regulated or enterprise workloads - compliance attestations and an enterprise plan",
      "AI agents and automation - an agent-ready surface (MCP / llms.txt)",
      "Teams needing broad API coverage out of the box"
    ],
    "avoid_if": [
      "You want to try it free before paying"
    ]
  },
  "sources": [
    {
      "field": "vendor_description",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "The Audio API provides two speech-to-text endpoints, transcriptions and translations, based on our state-of-the-art open source large-v2 Whisper model.",
      "confidence": "high"
    },
    {
      "field": "supported_actions",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "Supported models: gpt-4o-transcribe, gpt-4o-mini-transcribe, gpt-4o-transcribe-diarize, whisper-1. Speaker Diarization: Identifies and labels different speakers in audio. Word-Level Timestamps: Precise timing for individual words. Translation: Transcribe and translate audio into English.",
      "confidence": "high"
    },
    {
      "field": "supported_actions",
      "url": "https://developers.openai.com/api/docs/guides/realtime-transcription",
      "excerpt": "gpt-realtime-whisper is an alternative for live transcription... supports streaming transcript deltas as audio arrives, tunable latency via the delay parameter, voice activity detection (VAD) support.",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "Over 99 languages including major languages like English, Spanish, French, German, Mandarin, Japanese, and many others. The platform prioritizes languages with less than 50% word error rate.",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://github.com/openai/whisper",
      "excerpt": "Whisper supports transcription and translation for 99 languages. It was trained on 680,000 hours of supervised multilingual audio data.",
      "confidence": "high"
    },
    {
      "field": "input_types",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "Input Formats: MP3, MP4, MPEG, MPGA, M4A, WAV, WebM. File Size Limit: 25 MB maximum.",
      "confidence": "high"
    },
    {
      "field": "input_types",
      "url": "https://developers.openai.com/api/docs/guides/realtime-transcription",
      "excerpt": "gpt-realtime-whisper is the primary model for live transcription... Supports WebSocket (server-side pipelines) or WebRTC (browser audio).",
      "confidence": "high"
    },
    {
      "field": "output_types",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "Output Formats: whisper-1: JSON, text, SRT, verbose_json, VTT; gpt-4o-transcribe/mini: JSON, text; gpt-4o-transcribe-diarize: JSON, text, diarized_json.",
      "confidence": "high"
    },
    {
      "field": "pricing_model",
      "url": "https://developers.openai.com/api/docs/models/whisper-1",
      "excerpt": "Cost per minute: $0.006 for transcription.",
      "confidence": "high"
    },
    {
      "field": "free_tier_available",
      "url": "https://developers.openai.com/api/docs/models/whisper-1",
      "excerpt": "Free: 3 requests per minute (RPM), 200 daily requests — rate-limited access tied to the trial credit, not a recurring free-minutes allowance.",
      "confidence": "high"
    },
    {
      "field": "iso_27001",
      "url": "https://trust.openai.com/",
      "excerpt": "ISO/IEC 27001:2022 certified. Also holds ISO/IEC 27017:2015 and ISO/IEC 27018:2019 certifications.",
      "confidence": "high"
    },
    {
      "field": "hipaa",
      "url": "https://help.openai.com/en/articles/8660679-how-can-i-get-a-business-associate-agreement-baa-with-openai",
      "excerpt": "OpenAI is able to sign Business Associate Agreements (BAA) in support of customers' compliance with the Health Insurance Portability and Accountability Act (HIPAA). The API platform can be a great fit for any covered entity or business associate looking to process protected health information.",
      "confidence": "high"
    },
    {
      "field": "sla_published",
      "url": "https://openai.com/api-scale-tier/",
      "excerpt": "Scale Tier traffic offers a 99.9% uptime SLA and prioritized compute.",
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://developers.openai.com/api/docs/models/gpt-realtime-whisper",
      "excerpt": "Tier 1: 100 minutes/minute; Tier 2: 350 minutes/minute; Tier 3: 650 minutes/minute; Tier 4: 1,000 minutes/minute; Tier 5: 1,300 minutes/minute.",
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://developers.openai.com/api/docs/guides/realtime-transcription",
      "excerpt": "Prompt steering is not supported for gpt-realtime-whisper in GA Realtime sessions.",
      "confidence": "high"
    },
    {
      "field": "mcp_server_available",
      "url": "https://developers.openai.com/learn/docs-mcp",
      "excerpt": "OpenAI hosts a public Model Context Protocol (MCP) server for developer documentation on developers.openai.com. The server can be accessed at https://developers.openai.com/mcp with read-only access to OpenAI developer documentation.",
      "confidence": "high"
    },
    {
      "field": "webhooks_supported",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "No webhook functionality mentioned for transcription endpoints; streaming is handled via WebSocket/WebRTC delta events.",
      "confidence": "medium"
    },
    {
      "field": "base_url",
      "url": "https://developers.openai.com/api/docs/quickstart",
      "excerpt": "Base URL: `https://api.openai.com/v1`",
      "confidence": "high"
    },
    {
      "field": "api_style",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "REST-based with two primary endpoints: `/v1/audio/transcriptions` and `/v1/audio/translations`",
      "confidence": "high"
    },
    {
      "field": "deprecation_policy_url",
      "url": "https://developers.openai.com/api/docs/deprecations",
      "excerpt": "Deprecations | OpenAI API — the official page listing all API deprecations, along with recommended replacements.",
      "confidence": "high"
    },
    {
      "field": "mcp_url",
      "url": "https://developers.openai.com/learn/docs-mcp",
      "excerpt": "Official URL: `https://developers.openai.com/mcp` — This MCP server is documentation-only. It does not call the OpenAI API on your behalf.",
      "confidence": "high"
    },
    {
      "field": "error_format",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "Standard HTTP status codes with JSON error responses",
      "confidence": "medium"
    },
    {
      "field": "webhook_events_url",
      "url": "https://developers.openai.com/api/docs/guides/webhooks",
      "excerpt": "The documentation references 'the full list of webhook events' in the API reference but only explicitly mentions `response.completed`. The page indicates webhooks support events like batch completion, background response generation, and fine-tuning job completion.",
      "confidence": "high"
    },
    {
      "field": "data_retention_policy_url",
      "url": "https://developers.openai.com/api/docs/guides/your-data",
      "excerpt": "By default, abuse monitoring logs are generated for all API feature usage and retained for up to 30 days, unless longer retention is required by law.",
      "confidence": "high"
    },
    {
      "field": "starting_price_usd",
      "url": "https://developers.openai.com/api/docs/models/whisper-1",
      "excerpt": "Cost per minute of audio: $0.006",
      "confidence": "high"
    },
    {
      "field": "launched_at",
      "url": "https://openai.com/index/introducing-chatgpt-and-whisper-apis/",
      "excerpt": "On March 1st 2023, OpenAI announced that developers could access the OpenAI Whisper Speech-to-Text model via easy-to-use REST APIs.",
      "confidence": "high"
    },
    {
      "field": "notable_customers",
      "url": "https://openai.com/index/introducing-chatgpt-and-whisper-apis/",
      "excerpt": "Speak, an AI-powered language learning app focused on building the best path to spoken fluency, is the fastest-growing English app in South Korea, and is already using the Whisper API to power a new AI speaking companion product.",
      "confidence": "medium"
    },
    {
      "field": "sla_url",
      "url": "https://openai.com/api-scale-tier/",
      "excerpt": "Scale Tier traffic offers a 99.9% uptime SLA and prioritized compute — standard tier has no published SLA.",
      "confidence": "low"
    },
    {
      "field": "pricing_model",
      "url": "https://developers.openai.com/api/docs/pricing",
      "excerpt": "gpt-4o-transcribe: Input $2.50 / Output $10.00 per 1M tokens (~$0.006/min). gpt-4o-mini-transcribe: Input $1.25 / Output $5.00 per 1M tokens (~$0.003/min). gpt-realtime-whisper: $0.017 per minute. gpt-realtime-translate: $0.034 per minute.",
      "confidence": "high"
    },
    {
      "field": "has_published_pricing",
      "url": "https://developers.openai.com/api/docs/pricing",
      "excerpt": "gpt-4o-transcribe: Input $2.50 / Output $10.00 per 1M tokens (~$0.006/min). gpt-4o-mini-transcribe: Input $1.25 / Output $5.00 per 1M tokens (~$0.003/min).",
      "confidence": "high"
    },
    {
      "field": "soc2",
      "url": "https://trust.openai.com/",
      "excerpt": "Our products are covered in our SOC 2 Type 2 report and have been evaluated by an independent third-party auditor to confirm that our controls align with industry standards for security, confidentiality, privacy and availability.",
      "confidence": "high"
    },
    {
      "field": "gdpr",
      "url": "https://trust.openai.com/",
      "excerpt": "GDPR compliance documentation available. Data Processing Agreement provided.",
      "confidence": "high"
    },
    {
      "field": "pci_dss",
      "url": "https://trust.openai.com/",
      "excerpt": "PCI DSS v4.0.1 — listed as a compliance certification on the OpenAI trust page.",
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://developers.openai.com/api/docs/models/whisper-1",
      "excerpt": "Free: 3 RPM / 200 RPD; Tier 1: 500 RPM; Tier 2: 2,500 RPM; Tier 3: 5,000 RPM; Tier 4: 7,500 RPM; Tier 5: 10,000 RPM.",
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "File Size Limit: 25 MB maximum. gpt-4o-transcribe-diarize requires chunking_strategy when audio is longer than 30 seconds. Translation available only for whisper-1 model.",
      "confidence": "high"
    },
    {
      "field": "sdk_languages",
      "url": "https://developers.openai.com/api/docs/libraries",
      "excerpt": "OpenAI provides first-party support for: JavaScript/TypeScript, Python, C#/.NET (developed in collaboration with Microsoft), Java (currently in beta), Go (currently in beta), Ruby.",
      "confidence": "high"
    },
    {
      "field": "enterprise_plan_available",
      "url": "https://openai.com/api-scale-tier/",
      "excerpt": "Scale Tier traffic offers a 99.9% uptime SLA and prioritized compute. Available to Enterprise customers.",
      "confidence": "high"
    },
    {
      "field": "sandbox_available",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "No dedicated sandbox/test environment mentioned; developers use live API keys against production endpoints.",
      "confidence": "high"
    },
    {
      "field": "auth_methods",
      "url": "https://developers.openai.com/api/docs/quickstart",
      "excerpt": "Header format: `Authorization: Bearer $OPENAI_API_KEY`",
      "confidence": "high"
    },
    {
      "field": "versioning_scheme",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "Not explicitly versioned; uses `/v1/` endpoint structure",
      "confidence": "high"
    },
    {
      "field": "sdk_packages",
      "url": "https://developers.openai.com/api/docs/libraries",
      "excerpt": "JavaScript `openai` (npm) github.com/openai/openai-node; Python `openai` (pip) github.com/openai/openai-python; Java `com.openai:openai-java` github.com/openai/openai-java; Go `github.com/openai/openai-go`; Ruby `openai` gem github.com/openai/openai-ruby",
      "confidence": "high"
    },
    {
      "field": "quickstart_url",
      "url": "https://developers.openai.com/api/docs/guides/speech-to-text",
      "excerpt": "Available at `/api/docs/guides/speech-to-text`",
      "confidence": "high"
    },
    {
      "field": "webhook_signing",
      "url": "https://developers.openai.com/api/docs/guides/webhooks",
      "excerpt": "Webhooks use HMAC-based signatures following the Standard Webhooks specification... The signature format: `\"v1,<base64-encoded-signature>\"`",
      "confidence": "high"
    },
    {
      "field": "rate_limit_requests",
      "url": "https://developers.openai.com/api/docs/models/whisper-1",
      "excerpt": "Tier 1: 500 RPM (Requests/Min)",
      "confidence": "high"
    },
    {
      "field": "starting_price_usd",
      "url": "https://developers.openai.com/api/docs/pricing",
      "excerpt": "gpt-4o-mini-transcribe: $0.003/minute; gpt-4o-transcribe: $0.006/minute",
      "confidence": "high"
    },
    {
      "field": "price_basis",
      "url": "https://developers.openai.com/api/docs/models/whisper-1",
      "excerpt": "Cost per minute of audio: $0.006 — Billing basis: Tokens used (audio duration-based)",
      "confidence": "high"
    },
    {
      "field": "ga_date",
      "url": "https://developers.openai.com/api/docs/models/gpt-4o-transcribe",
      "excerpt": "gpt-4o-transcribe and gpt-4o-mini-transcribe became available for Global Deployment in April 2025",
      "confidence": "medium"
    },
    {
      "field": "requires_verification",
      "url": "https://help.openai.com/en/articles/10910291-api-organization-verification",
      "excerpt": "OpenAI released Verified Organization status, a new way for developers to unlock access to the most advanced models and capabilities on the OpenAI Platform... you can continue using OpenAI's platform with your existing access even without completing the new verification process",
      "confidence": "medium"
    }
  ],
  "fields_not_found": [
    "supported_regions (no explicit data residency regions listed for the STT API)",
    "gpt-4o-transcribe snapshot version (none documented; only gpt-4o-mini-transcribe has dated snapshots)",
    "gpt-realtime-translate exact supported languages",
    "idempotency_supported",
    "free_tier_limit",
    "ga_date_exact"
  ],
  "source_confidence": "high",
  "last_verified_at": "2026-06-21T00:00:00.000Z",
  "contribute": {
    "note": "This data is crowd-editable. Suggest corrections or leave a review via these endpoints - no auth required, requests are rate-limited, and every submission is reviewed before it goes live. For a field edit, {field} is any key in this response and a citation is required.",
    "endpoints": [
      {
        "action": "review",
        "label": "Leave a review or comment",
        "method": "POST",
        "url": "https://apio.sh/api/feedback/openai-transcribe",
        "example_body": {
          "kind": "review",
          "rating": 5,
          "body": "Your experience with this API…"
        }
      },
      {
        "action": "field_edit",
        "label": "Suggest a correction to a field (cite a source)",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/openai-transcribe/{field}",
        "example_body": {
          "value": "corrected value",
          "citations": [
            {
              "url": "https://source.example/page",
              "excerpt": "supporting quote"
            }
          ],
          "note": "what changed and why"
        }
      },
      {
        "action": "new_api",
        "label": "Suggest a new API to add (only name is required - send as much as you can cite)",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/api",
        "example_body": {
          "value": {
            "name": "Acme Email API",
            "website_url": "https://acme.example",
            "vendor_name": "Acme",
            "categories": [
              "email"
            ],
            "pricing_model": "usage_based",
            "has_published_pricing": true,
            "free_tier_available": true,
            "price_points": [
              {
                "plan": "Pay as you go",
                "item": "1,000 emails",
                "amount_usd": 1,
                "per": "1,000 emails",
                "source_url": "https://acme.example/pricing"
              }
            ],
            "soc2": "type_2",
            "docs_url": "https://docs.acme.example"
          },
          "citations": [
            {
              "url": "https://acme.example/pricing",
              "excerpt": "$1 per 1,000 emails"
            }
          ]
        },
        "value_schema": [
          {
            "field": "name",
            "type": "string",
            "label": "Product name (the only required field)"
          },
          {
            "field": "website_url",
            "type": "string",
            "label": "Marketing website URL"
          },
          {
            "field": "vendor_name",
            "type": "string",
            "label": "Company/vendor name behind the product"
          },
          {
            "field": "vendor_description",
            "type": "string",
            "label": "One-line description, quoted from the vendor"
          },
          {
            "field": "categories",
            "type": "string[]",
            "label": "Category/leaf slugs it belongs to, e.g. [\"email\",\"sms\"]"
          },
          {
            "field": "primary_use_cases",
            "type": "string[]",
            "label": "What it's used for"
          },
          {
            "field": "supported_actions",
            "type": "string[]",
            "label": "Concrete API actions/capabilities"
          },
          {
            "field": "supported_regions",
            "type": "string[]",
            "label": "Countries/regions/data-residency"
          },
          {
            "field": "supported_languages",
            "type": "string[]",
            "label": "Human/spoken languages supported"
          },
          {
            "field": "input_types",
            "type": "string[]",
            "label": "Accepted input types/formats"
          },
          {
            "field": "output_types",
            "type": "string[]",
            "label": "Produced output types/formats"
          },
          {
            "field": "webhooks_supported",
            "type": "bool",
            "label": "Supports webhooks?"
          },
          {
            "field": "sandbox_available",
            "type": "bool",
            "label": "Dedicated sandbox/test mode?"
          },
          {
            "field": "sdk_languages",
            "type": "string[]",
            "label": "Languages with an official SDK"
          },
          {
            "field": "mcp_server_available",
            "type": "bool",
            "label": "Official MCP server?"
          },
          {
            "field": "pricing_model",
            "type": "enum",
            "label": "Pricing model",
            "values": [
              "usage_based",
              "subscription",
              "seat_based",
              "hybrid",
              "contact_sales"
            ]
          },
          {
            "field": "has_published_pricing",
            "type": "bool",
            "label": "Concrete prices published publicly?"
          },
          {
            "field": "free_tier_available",
            "type": "bool",
            "label": "Recurring/perpetual free tier (not a trial)?"
          },
          {
            "field": "free_tier_details",
            "type": "string",
            "label": "What the free tier includes"
          },
          {
            "field": "minimum_commitment",
            "type": "string",
            "label": "Any stated minimum spend/commitment"
          },
          {
            "field": "self_serve_signup",
            "type": "bool",
            "label": "Get an API key without talking to sales?"
          },
          {
            "field": "requires_sales_call",
            "type": "bool",
            "label": "Does going live require sales?"
          },
          {
            "field": "enterprise_plan_available",
            "type": "bool",
            "label": "Named enterprise tier?"
          },
          {
            "field": "starting_price_usd",
            "type": "number",
            "label": "Lowest published paid entry price (USD number)"
          },
          {
            "field": "price_basis",
            "type": "string",
            "label": "Unit the starting price is per, e.g. '1,000 emails'"
          },
          {
            "field": "free_tier_limit",
            "type": "string",
            "label": "Free-tier ceiling in literal terms"
          },
          {
            "field": "price_points",
            "type": "object[]",
            "label": "Structured prices: [{plan,item,amount_usd,amount_percent,per,source_url}]"
          },
          {
            "field": "soc2",
            "type": "enum",
            "label": "SOC 2 status",
            "values": [
              "type_2",
              "type_1",
              "in_progress",
              "none",
              "unknown"
            ]
          },
          {
            "field": "hipaa",
            "type": "bool",
            "label": "HIPAA (e.g. BAA available)?"
          },
          {
            "field": "gdpr",
            "type": "bool",
            "label": "GDPR compliance stated?"
          },
          {
            "field": "iso_27001",
            "type": "bool",
            "label": "ISO 27001 certified?"
          },
          {
            "field": "pci_dss",
            "type": "bool",
            "label": "PCI DSS compliant?"
          },
          {
            "field": "sla_published",
            "type": "bool",
            "label": "Published SLA / uptime commitment?"
          },
          {
            "field": "documented_rate_limits",
            "type": "string",
            "label": "Documented rate limits, quoted"
          },
          {
            "field": "known_restrictions",
            "type": "string[]",
            "label": "Notable documented restrictions/limits"
          },
          {
            "field": "auth_methods",
            "type": "string[]",
            "label": "Auth methods",
            "values": [
              "api_key",
              "oauth2",
              "jwt",
              "basic",
              "hmac_signature",
              "mtls",
              "session"
            ]
          },
          {
            "field": "api_style",
            "type": "enum",
            "label": "Primary API style",
            "values": [
              "rest",
              "graphql",
              "grpc",
              "soap",
              "websocket"
            ]
          },
          {
            "field": "base_url",
            "type": "string",
            "label": "API root/base URL"
          },
          {
            "field": "api_version",
            "type": "string",
            "label": "Current API version string"
          },
          {
            "field": "quickstart_url",
            "type": "string",
            "label": "Quickstart / hello-world URL"
          },
          {
            "field": "docs_url",
            "type": "string",
            "label": "Developer docs URL"
          },
          {
            "field": "api_reference_url",
            "type": "string",
            "label": "API reference URL"
          },
          {
            "field": "openapi_spec_url",
            "type": "string",
            "label": "OpenAPI spec URL"
          },
          {
            "field": "changelog_url",
            "type": "string",
            "label": "Changelog URL"
          },
          {
            "field": "status_page_url",
            "type": "string",
            "label": "Status page URL"
          },
          {
            "field": "notable_customers",
            "type": "string[]",
            "label": "Named public customers"
          },
          {
            "field": "launched_at",
            "type": "string",
            "label": "Launch date (ISO date or year)"
          }
        ]
      },
      {
        "action": "token",
        "label": "Optional - raise your rate limit",
        "method": "GET",
        "url": "https://apio.sh/api/feedback/token"
      }
    ]
  }
}