{
  "name": "Amazon Textract",
  "slug": "aws-textract",
  "website_url": "https://aws.amazon.com/textract/",
  "vendor_description": "\"Automatically extract printed text, handwriting, layout elements, and data from any document\"",
  "categories": [
    "ocr"
  ],
  "summary": "Amazon Textract is an AWS document intelligence service that extracts printed text, handwriting, form fields, tables, and structured data from PDFs and images, targeting industries such as healthcare, financial services, and lending. Pricing is usage-based starting at $0.0015 per page, with a free tier of 1,000 pages per month for the first three months and no sales call required to get started. The service is available across 16 AWS regions including GovCloud, holds SOC 2 Type II, HIPAA, GDPR, ISO 27001, and PCI DSS certifications, and offers SDKs for seven languages.",
  "capabilities": {
    "supported_actions": [
      "DetectDocumentText",
      "AnalyzeDocument (Forms, Tables, Queries, Signatures, Layout, Custom Queries)",
      "AnalyzeExpense",
      "AnalyzeID",
      "StartDocumentTextDetection",
      "StartDocumentAnalysis",
      "StartExpenseAnalysis",
      "StartIDDocumentAnalysis",
      "GetDocumentTextDetection",
      "GetDocumentAnalysis",
      "GetExpenseAnalysis",
      "GetIDDocumentAnalysis",
      "StartLendingAnalysis",
      "GetLendingAnalysis",
      "GetLendingAnalysisSummary",
      "CreateAdapter",
      "CreateAdapterVersion",
      "DeleteAdapter",
      "DeleteAdapterVersion",
      "UpdateAdapter",
      "GetAdapter",
      "GetAdapterVersion",
      "ListAdapters",
      "ListAdapterVersions"
    ],
    "supported_regions": [
      "US East (N. Virginia) us-east-1",
      "US East (Ohio) us-east-2",
      "US West (N. California) us-west-1",
      "US West (Oregon) us-west-2",
      "Asia Pacific (Mumbai) ap-south-1",
      "Asia Pacific (Seoul) ap-northeast-2",
      "Asia Pacific (Singapore) ap-southeast-1",
      "Asia Pacific (Sydney) ap-southeast-2",
      "Canada (Central) ca-central-1",
      "Europe (Frankfurt) eu-central-1",
      "Europe (Ireland) eu-west-1",
      "Europe (London) eu-west-2",
      "Europe (Paris) eu-west-3",
      "Europe (Spain) eu-south-2",
      "AWS GovCloud (US-East) us-gov-east-1",
      "AWS GovCloud (US-West) us-gov-west-1"
    ],
    "supported_languages": [
      "English",
      "French",
      "German",
      "Italian",
      "Portuguese",
      "Spanish"
    ],
    "input_types": [
      "JPEG",
      "PNG",
      "PDF",
      "TIFF"
    ],
    "output_types": [
      "JSON"
    ],
    "webhooks_supported": true,
    "sandbox_available": false,
    "sdk_languages": [
      "Python",
      "JavaScript/Node.js",
      "Java",
      ".NET",
      "Go",
      "Ruby",
      "PHP"
    ],
    "mcp_server_available": false
  },
  "integration": {
    "api_style": "rest",
    "base_url": "https://textract.{region}.amazonaws.com",
    "api_version": "2018-06-27",
    "versioning_scheme": "header",
    "stability": "ga",
    "deprecation_policy_url": "https://docs.aws.amazon.com/general/latest/gr/service-lifecycle.html",
    "auth_methods": [
      "hmac_signature"
    ],
    "auth_docs_url": "https://docs.aws.amazon.com/textract/latest/dg/security-iam.html",
    "idempotency_supported": true,
    "error_format": "vendor-specific",
    "webhook_signing": null,
    "webhook_events_url": "https://docs.aws.amazon.com/textract/latest/dg/async-notification-payload.html",
    "rate_limit_requests": 25,
    "rate_limit_window": "second",
    "sdk_packages": [
      {
        "package": "boto3",
        "language": "Python",
        "official": true,
        "repo_url": "https://github.com/boto/boto3"
      },
      {
        "package": "@aws-sdk/client-textract",
        "language": "JavaScript/Node.js",
        "official": true,
        "repo_url": "https://github.com/aws/aws-sdk-js-v3"
      },
      {
        "package": "software.amazon.awssdk:textract",
        "language": "Java",
        "official": true,
        "repo_url": "https://github.com/aws/aws-sdk-java-v2"
      },
      {
        "package": "AWSSDK.Textract",
        "language": ".NET",
        "official": true,
        "repo_url": "https://github.com/aws/aws-sdk-net"
      },
      {
        "package": "github.com/aws/aws-sdk-go-v2/service/textract",
        "language": "Go",
        "official": true,
        "repo_url": "https://github.com/aws/aws-sdk-go-v2"
      },
      {
        "package": "aws-sdk-textract",
        "language": "Ruby",
        "official": true,
        "repo_url": "https://github.com/aws/aws-sdk-ruby"
      },
      {
        "package": "aws/aws-sdk-php",
        "language": "PHP",
        "official": true,
        "repo_url": "https://github.com/aws/aws-sdk-php"
      }
    ],
    "mcp_url": null,
    "quickstart_url": "https://docs.aws.amazon.com/textract/latest/dg/getting-started.html"
  },
  "pricing": {
    "pricing_model": "usage_based",
    "has_published_pricing": true,
    "starting_price_usd": "0.0015",
    "price_basis": "page",
    "free_tier_available": false,
    "free_tier_limit": "1,000 pages/month for Detect Document Text (first 3 months)",
    "free_tier_details": "3-month time-limited trial for new AWS customers only: Detect Document Text 1,000 pages/month; Analyze Document (Signatures) 1,000 pages/month; Analyze Document (Forms/Tables/Layout/Queries) 100 pages/month; Analyze Expense 100 pages/month; Analyze ID 100 pages/month; Analyze Lending 2,000 pages/month. Not a perpetual free tier.",
    "minimum_commitment": null,
    "self_serve_signup": true,
    "requires_sales_call": false,
    "requires_verification": false,
    "enterprise_plan_available": true,
    "price_points": [
      {
        "plan": "Trial (3-month, new AWS customers only)",
        "item": "Detect Document Text API — 1,000 pages/month",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "month",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Trial (3-month, new AWS customers only)",
        "item": "Analyze Document API (Signatures only) — 1,000 pages/month",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "month",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Trial (3-month, new AWS customers only)",
        "item": "Analyze Document API (Forms, Tables, Layout, Queries) — 100 pages/month each",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "month",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Trial (3-month, new AWS customers only)",
        "item": "Analyze Expense API — 100 pages/month",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "month",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Trial (3-month, new AWS customers only)",
        "item": "Analyze ID API — 100 pages/month",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "month",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Trial (3-month, new AWS customers only)",
        "item": "Analyze Lending API — 2,000 pages/month",
        "amount_usd": "0.0000",
        "amount_percent": null,
        "per": "month",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Detect Document Text API — first 1M pages",
        "amount_usd": "0.0015",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Detect Document Text API — after 1M pages",
        "amount_usd": "0.0006",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Forms) — first 1M pages",
        "amount_usd": "0.0500",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Forms) — after 1M pages",
        "amount_usd": "0.0400",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Tables) — first 1M pages",
        "amount_usd": "0.0150",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Tables) — after 1M pages",
        "amount_usd": "0.0100",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Queries) — first 1M pages",
        "amount_usd": "0.0150",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Tables + Queries) — first 1M pages",
        "amount_usd": "0.0200",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Tables + Queries) — after 1M pages",
        "amount_usd": "0.0150",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Forms + Tables + Queries) — first 1M pages",
        "amount_usd": "0.0700",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Forms + Tables + Queries) — after 1M pages",
        "amount_usd": "0.0550",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Signatures) — first 1M pages",
        "amount_usd": "0.0035",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Signatures) — after 1M pages",
        "amount_usd": "0.0014",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Custom Queries) — first 1M pages",
        "amount_usd": "0.0250",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Custom Queries) — after 1M pages",
        "amount_usd": "0.0150",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Forms + Custom Queries) — first 1M pages",
        "amount_usd": "0.0650",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Document API (Forms + Custom Queries) — after 1M pages",
        "amount_usd": "0.0500",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Expense API — first 1M pages",
        "amount_usd": "0.0100",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Expense API — after 1M pages",
        "amount_usd": "0.0080",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze ID API — first 100K pages",
        "amount_usd": "0.0250",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze ID API — after 100K pages",
        "amount_usd": "0.0100",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Lending API — first 1M pages (classified and extracted pages only)",
        "amount_usd": "0.0700",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      },
      {
        "plan": "Pay As You Go",
        "item": "Analyze Lending API — after 1M pages (classified and extracted pages only)",
        "amount_usd": "0.0550",
        "amount_percent": null,
        "per": "page",
        "currency": "USD",
        "source_url": "https://aws.amazon.com/textract/pricing/"
      }
    ]
  },
  "compliance": {
    "soc2": "type_2",
    "hipaa": true,
    "gdpr": true,
    "iso_27001": true,
    "pci_dss": true,
    "sla_published": true,
    "sla_url": "https://aws.amazon.com/textract/sla/",
    "data_retention_policy_url": "https://docs.aws.amazon.com/textract/latest/dg/data-protection.html",
    "documented_rate_limits": "Default TPS quotas vary by region and API. In US East (N. Virginia): DetectDocumentText sync=25 TPS, AnalyzeDocument sync=10 TPS, AnalyzeExpense sync=5 TPS, AnalyzeID sync=5 TPS; StartDocumentTextDetection async=15 TPS, StartDocumentAnalysis async=10 TPS, StartExpenseAnalysis async=5 TPS, StartLendingAnalysis async=5 TPS; Maximum concurrent async jobs=600 in us-east-1/us-west-2. Synchronous ops: max 15 queries per page; Asynchronous ops: max 30 queries per page. Limits are adjustable via AWS Service Quotas console.",
    "known_restrictions": [
      "Supported file formats: JPEG, PNG, PDF, TIFF only (no XFA-based PDFs)",
      "Sync operations: max 10 MB file size, PDF/TIFF limited to 1 page",
      "Async operations: PDF/TIFF max 500 MB and 3,000 pages; JPEG/PNG max 10 MB",
      "PDF max height/width: 40 inches and 9,000 points; cannot be password protected",
      "Max image resolution: 10,000 pixels on all sides",
      "Handwritten text recognition supported in English only",
      "Query feature (natural language) available in English documents only",
      "AnalyzeID supports US passports and US driver's licenses only",
      "Vertical text (e.g., Japanese, Chinese vertical layout) not supported",
      "Minimum text height: 15 pixels (equivalent to 8pt font at 150 DPI)",
      "Up to 15 queries per page (sync) and 30 queries per page (async)",
      "PCI DSS users must opt out of content use for service improvement via AWS Support",
      "Max 10 adapters per account; max 10 adapter versions per month; max 3 in-progress adapter training jobs",
      "Layout feature is free when used with the Tables feature"
    ]
  },
  "developer": {
    "docs_url": "https://docs.aws.amazon.com",
    "api_reference_url": null,
    "openapi_spec_url": null,
    "postman_collection_url": null,
    "changelog_url": null,
    "status_page_url": "https://status.aws.amazon.com",
    "llms_txt_url": "https://docs.aws.amazon.com/llms.txt",
    "markdown_docs_url": null,
    "rendering": "static"
  },
  "adoption": {
    "launched_at": "2018-11-28",
    "ga_date": "2019-05-29",
    "github_stars": null,
    "github_stars_at": null,
    "notable_customers": [
      "Change Healthcare",
      "Roche",
      "Elevance Health",
      "Pennymac",
      "Cox Automotive",
      "The Washington Post",
      "HelloSign",
      "PitchBook"
    ]
  },
  "scores": {
    "agent_friendliness": 35,
    "pricing_transparency": 85,
    "setup_speed": 60,
    "docs_quality": 25,
    "procurement_friction": 85,
    "trust_readiness": 100,
    "best_for": [
      "Regulated or enterprise workloads - compliance attestations and an enterprise plan",
      "AI agents and automation - an agent-ready surface (MCP / llms.txt)",
      "Teams needing broad API coverage out of the box"
    ],
    "avoid_if": [
      "You want to try it free before paying"
    ]
  },
  "sources": [
    {
      "field": "vendor_description",
      "url": "https://aws.amazon.com/textract/",
      "excerpt": "A machine learning (ML) service that automatically extracts text, handwriting, layout elements, and data from scanned documents.",
      "confidence": "high"
    },
    {
      "field": "vendor_description",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/what-is.html",
      "excerpt": "Amazon Textract helps you add document text detection and analysis to your applications.",
      "confidence": "high"
    },
    {
      "field": "primary_use_cases",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/what-is.html",
      "excerpt": "Process invoices and receipts with the AnalyzeExpense API. Process ID documents such as drivers licenses and passports issued by U.S. government, using the AnalyzeID API. Upload and process mortgage loan packages, through automatic routing of the the document pages to the appropriate Amazon Textract analysis operations using the Analyze Lending workflow.",
      "confidence": "high"
    },
    {
      "field": "primary_use_cases",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/what-is.html",
      "excerpt": "Creating an intelligent search index – Using Amazon Textract you can create libraries of text that is detected in image and PDF files. Using intelligent text extraction for natural language processing (NLP)",
      "confidence": "high"
    },
    {
      "field": "supported_actions",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_Operations.html",
      "excerpt": "The following actions are supported: AnalyzeDocument, AnalyzeExpense, AnalyzeID, CreateAdapter, CreateAdapterVersion, DeleteAdapter, DeleteAdapterVersion, DetectDocumentText, GetAdapter, GetAdapterVersion, GetDocumentAnalysis, GetDocumentTextDetection, GetExpenseAnalysis, GetLendingAnalysis, GetLendingAnalysisSummary, ListAdapters, ListAdapterVersions, StartDocumentAnalysis, StartDocumentTextDetection, StartExpenseAnalysis, StartLendingAnalysis, UpdateAdapter",
      "confidence": "high"
    },
    {
      "field": "supported_actions",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/what-is.html",
      "excerpt": "Extract text, forms, and tables from documents with structured data, using the Amazon Textract Document Analysis API. Specify and extract information from documents using the Queries feature within the Amazon Textract Analyze Document API.",
      "confidence": "high"
    },
    {
      "field": "supported_regions",
      "url": "https://docs.aws.amazon.com/general/latest/gr/textract.html",
      "excerpt": "US East (Ohio) us-east-2 ... US East (N. Virginia) us-east-1 ... US West (N. California) us-west-1 ... US West (Oregon) us-west-2 ... Asia Pacific (Mumbai) ap-south-1 ... Asia Pacific (Seoul) ap-northeast-2 ... Asia Pacific (Singapore) ap-southeast-1 ... Asia Pacific (Sydney) ap-southeast-2 ... Canada (Central) ca-central-1 ... Europe (Frankfurt) eu-central-1 ... Europe (Ireland) eu-west-1 ... Europe (London) eu-west-2 ... Europe (Paris) eu-west-3 ... Europe (Spain) eu-south-2 ... AWS GovCloud (US-East) us-gov-east-1 ... AWS GovCloud (US-West) us-gov-west-1",
      "confidence": "high"
    },
    {
      "field": "supported_regions",
      "url": "https://aws.amazon.com/textract/faqs/",
      "excerpt": "Amazon Textract operates in: US East (Northern Virginia), US East (Ohio), US West (Oregon), US West (N. California), AWS GovCloud (US-West), AWS GovCloud (US-East), Canada (Central), EU (Ireland), EU (London), EU (Frankfurt), EU (Paris), Asia Pacific (Singapore), Asia Pacific (Sydney), Asia Pacific (Seoul), and Asia Pacific (Mumbai).",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/limits-document.html",
      "excerpt": "Amazon Textract supports English, French, German, Italian, Portuguese, and Spanish text detection. Query detection is only available in English document detection.",
      "confidence": "high"
    },
    {
      "field": "supported_languages",
      "url": "https://aws.amazon.com/textract/faqs/",
      "excerpt": "The service handles \"printed text, forms and tables in English, German, French, Spanish, Italian and Portuguese.\" Handwriting detection, invoice/receipt processing, identity document analysis, and query features are \"in English only.\"",
      "confidence": "high"
    },
    {
      "field": "input_types",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/limits-document.html",
      "excerpt": "Operations support JPEG, PNG, PDF, and TIFF files. (JPEG 2000-encoded images within PDFs are supported). Textract does not support XFA based PDFs.",
      "confidence": "high"
    },
    {
      "field": "input_types",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_DetectDocumentText.html",
      "excerpt": "The input document must be in one of the following image formats: JPEG, PNG, PDF, or TIFF.",
      "confidence": "high"
    },
    {
      "field": "output_types",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_DetectDocumentText.html",
      "excerpt": "DetectDocumentText returns the detected text in an array of Block objects. ... If the action is successful, the service sends back an HTTP 200 response. The following data is returned in JSON format by the service.",
      "confidence": "high"
    },
    {
      "field": "webhooks_supported",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/async-notification-payload.html",
      "excerpt": "Amazon Textract sends the status of an analysis request to an Amazon Simple Notification Service (Amazon SNS) topic. To get the notification from an Amazon SNS topic, use an Amazon SQS queue or an AWS Lambda function.",
      "confidence": "high"
    },
    {
      "field": "sdk_languages",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/setup-awscli-sdk.html",
      "excerpt": "Download and install the AWS CLI and the AWS SDKs that you want to use. This guide provides examples for the AWS CLI, Java, and Python. For information about other AWS SDKs, see Tools for Amazon Web Services.",
      "confidence": "high"
    },
    {
      "field": "pricing_model",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/what-is.html",
      "excerpt": "Low cost – With Amazon Textract, you only pay for the documents you analyze. There are no minimum fees or upfront commitments.",
      "confidence": "high"
    },
    {
      "field": "free_tier_available",
      "url": "https://aws.amazon.com/textract/pricing/",
      "excerpt": "Free Tier (3 months for new AWS customers): Detect Document Text API: 1,000 pages/month; Analyze Document API: 100-1,000 pages/month (varies by feature); Analyze Expense API: 100 pages/month; Analyze ID API: 100 pages/month; Analyze Lending API: 2,000 pages/month",
      "confidence": "high"
    },
    {
      "field": "self_serve_signup",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/setting-up.html",
      "excerpt": "To get started with AWS, you need an AWS account. For information about creating an AWS account, see Getting started with an AWS account in the AWS Account Management Reference Guide.",
      "confidence": "high"
    },
    {
      "field": "enterprise_plan_available",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/what-is.html",
      "excerpt": "Low cost – With Amazon Textract, you only pay for the documents you analyze. There are no minimum fees or upfront commitments. You can get started for free, and save more as you grow with our tiered pricing model.",
      "confidence": "medium"
    },
    {
      "field": "hipaa",
      "url": "https://aws.amazon.com/compliance/hipaa-eligible-services-reference/",
      "excerpt": "Amazon Textract",
      "confidence": "high"
    },
    {
      "field": "gdpr",
      "url": "https://aws.amazon.com/compliance/gdpr-center/",
      "excerpt": "AWS customers can use all AWS services to process personal data (as defined in the GDPR) that is uploaded to the AWS services under their AWS accounts (customer data) in compliance with the GDPR.",
      "confidence": "medium"
    },
    {
      "field": "iso_27001",
      "url": "https://aws.amazon.com/compliance/iso-certified/",
      "excerpt": "Amazon Textract",
      "confidence": "high"
    },
    {
      "field": "pci_dss",
      "url": "https://aws.amazon.com/textract/faqs/",
      "excerpt": "The service is \"HIPAA eligible\" and \"compliant with PCI, ISO, and SOC.\"",
      "confidence": "medium"
    },
    {
      "field": "sla_published",
      "url": "https://aws.amazon.com/textract/sla/",
      "excerpt": "Availability is calculated for each 5-minute interval as the percentage of Requests processed that \"do not fail with Errors and relate solely to the provisioned Amazon Textract function.\"",
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://docs.aws.amazon.com/general/latest/gr/textract.html",
      "excerpt": "DetectDocumentText: US East (N. Virginia) 25 TPS, US West (Oregon) 25 TPS ... AnalyzeDocument: 10 TPS ... AnalyzeExpense: 5 TPS ... AnalyzeID: 5 TPS ... Maximum number of asynchronous jobs per account that can simultaneously exist: 600 (us-east-1, us-west-2)",
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/limits-document.html",
      "excerpt": "For synchronous operations, JPEG, PNG, PDF, and TIFF files have a limit of 10 MB in memory. PDF and TIFF files also have a limit of 1 page. For asynchronous operations ... PDF and TIFF files have a limit of 500 MB in memory and a limit of 3,000 pages.",
      "confidence": "high"
    },
    {
      "field": "auth_methods",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/security-iam.html",
      "excerpt": "For programmatic access, AWS provides an SDK and CLI to cryptographically sign requests. For more information, see AWS Signature Version 4 for API requests in the IAM User Guide.",
      "confidence": "high"
    },
    {
      "field": "api_style",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_DetectDocumentText.html",
      "excerpt": "The request accepts the following data in JSON format. ... If the action is successful, the service sends back an HTTP 200 response. The following data is returned in JSON format by the service.",
      "confidence": "high"
    },
    {
      "field": "base_url",
      "url": "https://docs.aws.amazon.com/general/latest/gr/textract.html",
      "excerpt": "US East (N. Virginia) | us-east-1 | textract.us-east-1.amazonaws.com ... US West (Oregon) | us-west-2 | textract.us-west-2.amazonaws.com | HTTPS",
      "confidence": "high"
    },
    {
      "field": "api_version",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_StartDocumentTextDetection.html",
      "excerpt": "AWS SDK for Go v2 ... SdkForGoV2/textract-2018-06-27/StartDocumentTextDetection ... AWS SDK for Java V2 ... SdkForJavaV2/textract-2018-06-27/StartDocumentTextDetection",
      "confidence": "high"
    },
    {
      "field": "idempotency_supported",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/api-async.html",
      "excerpt": "To prevent accidental duplication of analysis jobs, you can optionally provide an idempotent token, ClientRequestToken. If you supply a value for ClientRequestToken, the Start operation returns the same JobId for multiple identical calls to the Start operation.",
      "confidence": "high"
    },
    {
      "field": "error_format",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_DetectDocumentText.html",
      "excerpt": "AccessDeniedException — You aren't authorized to perform the action. HTTP Status Code: 400 ... BadDocumentException — Amazon Textract isn't able to read the document. HTTP Status Code: 400 ... ProvisionedThroughputExceededException — The number of requests exceeded your throughput limit. HTTP Status Code: 400",
      "confidence": "high"
    },
    {
      "field": "rate_limit_requests",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/limits-quotas-explained.html",
      "excerpt": "TPS quotas determine how often you can request that Textract process a new document. TPS quotas are unique to API, Synchronous or Asynchronous operations, and Region.",
      "confidence": "high"
    },
    {
      "field": "notable_customers",
      "url": "https://aws.amazon.com/textract/customers/",
      "excerpt": "Healthcare: Change Healthcare, Roche, Elevance Health ... Lending: Pennymac ... Software & Internet: Cox Automotive ... The Washington Post ... HelloSign ... PitchBook",
      "confidence": "high"
    },
    {
      "field": "webhooks_supported",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/api-async.html",
      "excerpt": "The completion status of the request is published to an Amazon Simple Notification Service (Amazon SNS) topic. To get the completion status from the Amazon SNS topic, you can use an Amazon Simple Queue Service (Amazon SQS) queue or an AWS Lambda function.",
      "confidence": "high"
    },
    {
      "field": "sdk_languages",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_DetectDocumentText.html",
      "excerpt": "AWS SDK for .NET V4 ... AWS SDK for Go v2 ... AWS SDK for Java V2 ... AWS SDK for JavaScript V3 ... AWS SDK for PHP V3 ... AWS SDK for Python ... AWS SDK for Ruby V3",
      "confidence": "high"
    },
    {
      "field": "pricing_model",
      "url": "https://aws.amazon.com/textract/pricing/",
      "excerpt": "Detect Document Text API — first 1M pages: $0.0015/page ... After 1M pages: $0.0006/page",
      "confidence": "high"
    },
    {
      "field": "has_published_pricing",
      "url": "https://aws.amazon.com/textract/pricing/",
      "excerpt": "Detect Document Text API — First 1M pages: $0.0015/page; After 1M pages: $0.0006/page ... Analyze Document API - Forms: $0.05/page (first 1M) ... Analyze Lending API: $0.07/page (first 1M), $0.055/page (after)",
      "confidence": "high"
    },
    {
      "field": "free_tier_available",
      "url": "https://aws.amazon.com/textract/faqs/",
      "excerpt": "New AWS customers receive three months of complimentary access including: Detect Document Text (1,000 pages/month), Analyze Document with Signatures (1,000 pages/month), Analyze Expense API (100 pages/month), Analyze ID API (100 pages/month), and Analyze Lending API (2,000 pages/month).",
      "confidence": "high"
    },
    {
      "field": "self_serve_signup",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/getting-started.html",
      "excerpt": "You can try the API by using the demonstration in the Amazon Textract console. For more information, see https://console.aws.amazon.com/textract/.",
      "confidence": "high"
    },
    {
      "field": "enterprise_plan_available",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/limits-quotas-explained.html",
      "excerpt": "When requesting an increase to a default quota, there are several recommended best practices to follow. ... Contact AWS Support if you find that your average number of concurrent requests can't be managed by an Amazon SQS queue.",
      "confidence": "medium"
    },
    {
      "field": "hipaa",
      "url": "https://aws.amazon.com/textract/faqs/",
      "excerpt": "The service is \"HIPAA eligible\" and \"compliant with PCI, ISO, and SOC.\"",
      "confidence": "high"
    },
    {
      "field": "gdpr",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/data-protection.html",
      "excerpt": "For information about data protection in Europe, see the AWS Shared Responsibility Model and GDPR blog post on the AWS Security Blog.",
      "confidence": "medium"
    },
    {
      "field": "iso_27001",
      "url": "https://aws.amazon.com/textract/faqs/",
      "excerpt": "The service is \"HIPAA eligible\" and \"compliant with PCI, ISO, and SOC.\"",
      "confidence": "high"
    },
    {
      "field": "soc2",
      "url": "https://aws.amazon.com/textract/faqs/",
      "excerpt": "The service is \"HIPAA eligible\" and \"compliant with PCI, ISO, and SOC.\"",
      "confidence": "medium"
    },
    {
      "field": "sla_published",
      "url": "https://aws.amazon.com/textract/sla/",
      "excerpt": "Service Credit Tiers: 99–99.9% uptime: 10% credit; Below 99% uptime: 25% credit; Below 95% uptime: 100% credit.",
      "confidence": "high"
    },
    {
      "field": "documented_rate_limits",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/limits-quotas-explained.html",
      "excerpt": "TPS quotas determine how often you can request that Textract process a new document. TPS quotas are unique to API, Synchronous or Asynchronous operations, and Region. ... Default quotas can be viewed or changed via the Service Quotas console.",
      "confidence": "high"
    },
    {
      "field": "known_restrictions",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/limits-document.html",
      "excerpt": "Amazon Textract supports images with a resolution less than or equal to 10000 pixels on all sides. ... Amazon Textract does not support vertical text (text written vertically, as is common in languages like Japanese and Chinese) ... The minimum height for text to be detected is 15 pixels. At 150 DPI, this would be the same as 8 point font. ... AnalyzeID only supports US passports, and US driver's licenses.",
      "confidence": "high"
    },
    {
      "field": "auth_methods",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/CommonParameters.html",
      "excerpt": "X-Amz-Algorithm — The hash algorithm that you used to create the request signature. Valid Values: AWS4-HMAC-SHA256",
      "confidence": "high"
    },
    {
      "field": "api_style",
      "url": "https://docs.aws.amazon.com/textract/latest/dg/data-protection.html",
      "excerpt": "Amazon Textract communicates exclusively through HTTPS endpoints, which are supported in all Regions supported by Amazon Textract",
      "confidence": "high"
    },
    {
      "field": "api_version",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_DetectDocumentText.html",
      "excerpt": "AWS Command Line Interface V2 ... textract-2018-06-27/DetectDocumentText ... AWS SDK for .NET V4 ... textract-2018-06-27/DetectDocumentText ... AWS SDK for Python ... boto3/textract-2018-06-27/DetectDocumentText",
      "confidence": "high"
    },
    {
      "field": "idempotency_supported",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_StartDocumentTextDetection.html",
      "excerpt": "ClientRequestToken — The idempotent token that's used to identify the start request. If you use the same token with multiple StartDocumentTextDetection requests, the same JobId is returned. Use ClientRequestToken to prevent the same job from being accidentally started more than once.",
      "confidence": "high"
    },
    {
      "field": "error_format",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/CommonErrors.html",
      "excerpt": "AccessDeniedException — You don't have permission to perform this action. Verify that your IAM policy includes the required permissions. HTTP Status Code: 403 ... ThrottlingException — Your request rate is too high. HTTP Status Code: 400",
      "confidence": "high"
    },
    {
      "field": "rate_limit_requests",
      "url": "https://docs.aws.amazon.com/general/latest/gr/textract.html",
      "excerpt": "DetectDocumentText | US East (N. Virginia) 25 | US West (Oregon) 25 | US East (Ohio) 10 | Europe (Ireland) 5 | Asia Pacific (Mumbai) 5 | Other Regions 1",
      "confidence": "high"
    },
    {
      "field": "starting_price_usd",
      "url": "https://aws.amazon.com/textract/pricing/",
      "excerpt": "Detect Document Text API — first 1M pages: $0.0015/page",
      "confidence": "high"
    },
    {
      "field": "launched_at",
      "url": "https://docs.aws.amazon.com/textract/latest/APIReference/API_DetectDocumentText.html",
      "excerpt": "AWS Command Line Interface V2 ... textract-2018-06-27/DetectDocumentText",
      "confidence": "medium"
    }
  ],
  "fields_not_found": [
    "mcp_url",
    "webhook_signing"
  ],
  "source_confidence": "high",
  "last_verified_at": "2026-06-14T00:00:00.000Z",
  "contribute": {
    "note": "This data is crowd-editable. Suggest corrections or leave a review via these endpoints - no auth required, requests are rate-limited, and every submission is reviewed before it goes live. For a field edit, {field} is any key in this response and a citation is required.",
    "endpoints": [
      {
        "action": "review",
        "label": "Leave a review or comment",
        "method": "POST",
        "url": "https://apio.sh/api/feedback/aws-textract",
        "example_body": {
          "kind": "review",
          "rating": 5,
          "body": "Your experience with this API…"
        }
      },
      {
        "action": "field_edit",
        "label": "Suggest a correction to a field (cite a source)",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/aws-textract/{field}",
        "example_body": {
          "value": "corrected value",
          "citations": [
            {
              "url": "https://source.example/page",
              "excerpt": "supporting quote"
            }
          ],
          "note": "what changed and why"
        }
      },
      {
        "action": "new_api",
        "label": "Suggest a new API to add",
        "method": "POST",
        "url": "https://apio.sh/api/suggest/api",
        "example_body": {
          "value": {
            "name": "Acme API",
            "website_url": "https://acme.example"
          },
          "citations": [
            {
              "url": "https://acme.example"
            }
          ]
        }
      },
      {
        "action": "token",
        "label": "Optional - raise your rate limit",
        "method": "GET",
        "url": "https://apio.sh/api/feedback/token"
      }
    ]
  }
}