<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>Amazon Textract &#8211; Noise</title>
	<atom:link href="https://noise.getoto.net/tag/amazon-textract/feed/" rel="self" type="application/rss+xml" />
	<link>https://noise.getoto.net</link>
	<description>The collective thoughts of the interwebz</description>
	<lastBuildDate>Wed, 26 Nov 2025 21:41:51 +0000</lastBuildDate>
	<language>en-US</language>
	<sy:updatePeriod>
	hourly	</sy:updatePeriod>
	<sy:updateFrequency>
	1	</sy:updateFrequency>
	<generator>https://wordpress.org/?v=6.8.2</generator>
	<item>
		<title>Orchestrating large-scale document processing with AWS Step Functions and Amazon Bedrock batch inference</title>
		<link>https://noise.getoto.net/2025/11/26/orchestrating-large-scale-document-processing-with-aws-step-functions-and-amazon-bedrock-batch-inference/</link>
		
		<dc:creator><![CDATA[Brian Zambrano]]></dc:creator>
		<pubDate>Wed, 26 Nov 2025 21:41:51 +0000</pubDate>
				<category><![CDATA[Amazon Bedrock]]></category>
		<category><![CDATA[Amazon Bedrock Knowledge Bases]]></category>
		<category><![CDATA[Amazon Nova]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[AWS Step Functions]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=ac0487467809cf2e10f0c351e2451f28</guid>

					<description><![CDATA[Organizations often have large volumes of documents containing valuable information that remains locked away and unsearchable. This solution addresses the need for a 
<strong>scalable, automated text extraction and knowledge base pipeline</strong> that transforms static document collections into intelligent, searchable repositories for generative AI applications.]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>How to enhance Amazon Macie data discovery capabilities using Amazon Textract</title>
		<link>https://noise.getoto.net/2025/01/06/how-to-enhance-amazon-macie-data-discovery-capabilities-using-amazon-textract/</link>
		
		<dc:creator><![CDATA[ZhiWei Huang]]></dc:creator>
		<pubDate>Mon, 06 Jan 2025 17:02:27 +0000</pubDate>
				<category><![CDATA[Amazon Macie]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[Intermediate (200)]]></category>
		<category><![CDATA[Security Blog]]></category>
		<category><![CDATA[Security, Identity & Compliance]]></category>
		<category><![CDATA[Technical How-to]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=7bae91274d83792338582902e3a752e9</guid>

					<description><![CDATA[Amazon Macie is a managed service that uses machine learning (ML) and deterministic pattern matching to help discover sensitive data that’s stored in Amazon Simple Storage Service (Amazon S3) buckets. Macie can detect sensitive data in many different formats, including commonly used compression and archive formats. However, Macie doesn’t support the discovery of sensitive data […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Top Architecture Blog Posts of 2023</title>
		<link>https://noise.getoto.net/2024/02/29/top-architecture-blog-posts-of-2023/</link>
		
		<dc:creator><![CDATA[Andrea Courtright]]></dc:creator>
		<pubDate>Wed, 28 Feb 2024 23:47:51 +0000</pubDate>
				<category><![CDATA[Amazon API Gateway]]></category>
		<category><![CDATA[Amazon CloudFront]]></category>
		<category><![CDATA[Amazon CloudWatch]]></category>
		<category><![CDATA[Amazon Comprehend]]></category>
		<category><![CDATA[Amazon Elastic Container Service]]></category>
		<category><![CDATA[Amazon Elastic Kubernetes Service]]></category>
		<category><![CDATA[Amazon EventBridge]]></category>
		<category><![CDATA[Amazon Machine Learning]]></category>
		<category><![CDATA[Amazon Managed Workflows for Apache Airflow (Amazon MWAA)]]></category>
		<category><![CDATA[Amazon OpenSearch Service]]></category>
		<category><![CDATA[Amazon Redshift]]></category>
		<category><![CDATA[Amazon Route 53]]></category>
		<category><![CDATA[Amazon Sagemaker]]></category>
		<category><![CDATA[Amazon Simple Queue Service (SQS)]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[announcements]]></category>
		<category><![CDATA[Architecture]]></category>
		<category><![CDATA[artificial intelligence]]></category>
		<category><![CDATA[AWS Glue]]></category>
		<category><![CDATA[AWS Lambda]]></category>
		<category><![CDATA[AWS Managed Services]]></category>
		<category><![CDATA[AWS Step Functions]]></category>
		<category><![CDATA[AWS Well-Architected Framework]]></category>
		<category><![CDATA[AWS Well-Architected Tool]]></category>
		<category><![CDATA[communication]]></category>
		<category><![CDATA[container]]></category>
		<category><![CDATA[data architecture]]></category>
		<category><![CDATA[Disaster Recovery]]></category>
		<category><![CDATA[Disaster Recovery with AWS Managed Services series]]></category>
		<category><![CDATA[event driven architecture]]></category>
		<category><![CDATA[fault injection]]></category>
		<category><![CDATA[Let's Architect]]></category>
		<category><![CDATA[microservices]]></category>
		<category><![CDATA[NLP]]></category>
		<category><![CDATA[python]]></category>
		<category><![CDATA[RDS for PostgreSQL]]></category>
		<category><![CDATA[Regions]]></category>
		<category><![CDATA[Resiliency]]></category>
		<category><![CDATA[SaaS]]></category>
		<category><![CDATA[serverless]]></category>
		<category><![CDATA[Solutions Architecture]]></category>
		<category><![CDATA[Top 10]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=ef51f99168ffdac5341350134f7083e4</guid>

					<description><![CDATA[2023 was a rollercoaster year in tech, and we at the AWS Architecture Blog feel so fortunate to have shared in the excitement. As we move into 2024 and all of the new technologies we could see, we want to take a moment to highlight the brightest stars from 2023. As always, thanks to our […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Unstructured data management and governance using AWS AI/ML and analytics services</title>
		<link>https://noise.getoto.net/2023/10/25/unstructured-data-management-and-governance-using-aws-ai-ml-and-analytics-services/</link>
		
		<dc:creator><![CDATA[Sakti Mishra]]></dc:creator>
		<pubDate>Wed, 25 Oct 2023 18:52:03 +0000</pubDate>
				<category><![CDATA[Amazon Athena]]></category>
		<category><![CDATA[Amazon Bedrock]]></category>
		<category><![CDATA[Amazon Comprehend]]></category>
		<category><![CDATA[Amazon DataZone]]></category>
		<category><![CDATA[Amazon Redshift]]></category>
		<category><![CDATA[Amazon Rekognition]]></category>
		<category><![CDATA[Amazon Sagemaker]]></category>
		<category><![CDATA[Amazon Simple Storage Service (S3)]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[Amazon Transcribe]]></category>
		<category><![CDATA[Analytics]]></category>
		<category><![CDATA[Architecture]]></category>
		<category><![CDATA[artificial intelligence]]></category>
		<category><![CDATA[AWS Big Data]]></category>
		<category><![CDATA[AWS Glue]]></category>
		<category><![CDATA[AWS Lambda]]></category>
		<category><![CDATA[AWS Step Functions]]></category>
		<category><![CDATA[generative AI]]></category>
		<category><![CDATA[Technical How-to]]></category>
		<category><![CDATA[Thought Leadership]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=e96bf1477afe89a67eaddc7493e3db63</guid>

					<description><![CDATA[In this post, we discuss how AWS can help you successfully address the challenges of extracting insights from unstructured data. We discuss various design patterns and architectures for extracting and cataloging valuable insights from unstructured data using AWS. Additionally, we show how to use AWS AI/ML services for analyzing unstructured data.]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Optimizing data with automated intelligent document processing solutions</title>
		<link>https://noise.getoto.net/2023/04/28/optimizing-data-with-automated-intelligent-document-processing-solutions/</link>
		
		<dc:creator><![CDATA[Deependra Shekhawat]]></dc:creator>
		<pubDate>Fri, 28 Apr 2023 13:36:54 +0000</pubDate>
				<category><![CDATA[Amazon Comprehend]]></category>
		<category><![CDATA[Amazon Machine Learning]]></category>
		<category><![CDATA[Amazon Sagemaker]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[Architecture]]></category>
		<category><![CDATA[artificial intelligence]]></category>
		<category><![CDATA[Customer Solutions]]></category>
		<category><![CDATA[data architecture]]></category>
		<category><![CDATA[NLP]]></category>
		<category><![CDATA[python]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=29c250a292fd32beba2786f8fdcebb66</guid>

					<description><![CDATA[Many organizations struggle to effectively manage and derive insights from the large amount of unstructured data locked in emails, PDFs, images, scanned documents, and more. The variety of formats, document layouts, and text makes it difficult for any standard Optical Character Recognition (OCR) to extract key insights from these data sources. To help organizations overcome […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Classifying and Extracting Mortgage Loan Data with Amazon Textract</title>
		<link>https://noise.getoto.net/2022/11/28/classifying-and-extracting-mortgage-loan-data-with-amazon-textract/</link>
		
		<dc:creator><![CDATA[Steve Roberts]]></dc:creator>
		<pubDate>Mon, 28 Nov 2022 05:10:34 +0000</pubDate>
				<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[announcements]]></category>
		<category><![CDATA[AWS re:Invent]]></category>
		<category><![CDATA[launch]]></category>
		<category><![CDATA[news]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=8cb2012cbfe776750cf74ea829a1ee24</guid>

					<description><![CDATA[Mortgage loan applications, at least in the United States, comprise around 500 or more pages of diverse documents. In order for applications to be reviewed, all these documents need to be classified, and the data on each form extracted. This isn’t as easy as it might sound! Besides different data structures in each document, the […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>AWS Week in Review – November 7, 2022</title>
		<link>https://noise.getoto.net/2022/11/07/aws-week-in-review-november-7-2022/</link>
		
		<dc:creator><![CDATA[Jeff Barr]]></dc:creator>
		<pubDate>Mon, 07 Nov 2022 19:13:15 +0000</pubDate>
				<category><![CDATA[Amazon Braket]]></category>
		<category><![CDATA[Amazon EC2]]></category>
		<category><![CDATA[Amazon MemoryDB for Redis]]></category>
		<category><![CDATA[Amazon Simple Notification Service (SNS)]]></category>
		<category><![CDATA[Amazon Simple Storage Service (S3)]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[announcements]]></category>
		<category><![CDATA[AWS CloudFormation]]></category>
		<category><![CDATA[AWS Outposts]]></category>
		<category><![CDATA[AWS re:Invent]]></category>
		<category><![CDATA[Events]]></category>
		<category><![CDATA[Internet of Things]]></category>
		<category><![CDATA[launch]]></category>
		<category><![CDATA[news]]></category>
		<category><![CDATA[open source]]></category>
		<category><![CDATA[Week in Review]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=f6335f5cb6eda737d5830938e87ed86f</guid>

					<description><![CDATA[With three weeks to go until AWS re:Invent opens in Las Vegas, the AWS News Blog Team is hard at work creating blog posts to share the latest launches and previews with you. As usual, we have a strong mix of new services, new features, and a surprise or two. Last Week’s Launches Here are […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Automate your Data Extraction for Oil Well Data with Amazon Textract</title>
		<link>https://noise.getoto.net/2022/02/24/automate-your-data-extraction-for-oil-well-data-with-amazon-textract/</link>
		
		<dc:creator><![CDATA[Ashutosh Pateriya]]></dc:creator>
		<pubDate>Thu, 24 Feb 2022 17:49:55 +0000</pubDate>
				<category><![CDATA[Amazon Comprehend]]></category>
		<category><![CDATA[Amazon Simple Notification Service (SNS)]]></category>
		<category><![CDATA[Amazon Simple Queue Service (SQS)]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[Architecture]]></category>
		<category><![CDATA[AWS Lambda]]></category>
		<category><![CDATA[Energy (Oil & Gas)]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=3585ef68df248f79b1eaf5891cc528c5</guid>

					<description><![CDATA[Traditionally, many businesses archive physical formats of their business documents. These can be invoices, sales memos, purchase orders, vendor-related documents, and inventory documents. As more and more businesses are moving towards digitizing their business processes, it is becoming challenging to effectively manage these documents and perform business analytics on them. For example, in the Oil […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>17 additional AWS services authorized for DoD workloads in the AWS GovCloud Regions</title>
		<link>https://noise.getoto.net/2021/09/09/17-additional-aws-services-authorized-for-dod-workloads-in-the-aws-govcloud-regions/</link>
		
		<dc:creator><![CDATA[Tyler Harding]]></dc:creator>
		<pubDate>Wed, 08 Sep 2021 23:33:22 +0000</pubDate>
				<category><![CDATA[Amazon Cognito]]></category>
		<category><![CDATA[Amazon EKS]]></category>
		<category><![CDATA[Amazon Pinpoint]]></category>
		<category><![CDATA[Amazon SES]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[announcements]]></category>
		<category><![CDATA[AWS Backup]]></category>
		<category><![CDATA[AWS Budgets]]></category>
		<category><![CDATA[AWS CodePipeline]]></category>
		<category><![CDATA[AWS Cost & Usage Report]]></category>
		<category><![CDATA[AWS Cost Explorer]]></category>
		<category><![CDATA[AWS Fargate]]></category>
		<category><![CDATA[AWS License Manager]]></category>
		<category><![CDATA[AWS Marketplace]]></category>
		<category><![CDATA[AWS Personal Health Dashboard]]></category>
		<category><![CDATA[AWS Security Hub]]></category>
		<category><![CDATA[AWS Systems Manager]]></category>
		<category><![CDATA[AWS X-Ray]]></category>
		<category><![CDATA[DoD IL 4]]></category>
		<category><![CDATA[DoD IL 5]]></category>
		<category><![CDATA[Federal]]></category>
		<category><![CDATA[FedRAMP]]></category>
		<category><![CDATA[Foundational (100)]]></category>
		<category><![CDATA[Government]]></category>
		<category><![CDATA[NIST SP 800-53]]></category>
		<category><![CDATA[P-ATO]]></category>
		<category><![CDATA[Public Sector]]></category>
		<category><![CDATA[Security Blog]]></category>
		<category><![CDATA[Security, Identity & Compliance]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=1869cbf7b90f6bd21fe39fad4f4c875f</guid>

					<description><![CDATA[I’m pleased to announce that the Defense Information Systems Agency (DISA) has authorized 17 additional Amazon Web Services (AWS) services and features in the AWS GovCloud (US) Regions, bringing the total to 105 services and major features that are authorized for use by the U.S. Department of Defense (DoD). AWS now offers additional services to […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Amazon Textract Updates: Up to 32% Price Reduction in 8 AWS Regions and Up to 50% Reduction in Asynchronous Job Processing Times</title>
		<link>https://noise.getoto.net/2021/08/26/amazon-textract-updates-up-to-32-price-reduction-in-8-aws-regions-and-up-to-50-reduction-in-asynchronous-job-processing-times/</link>
		
		<dc:creator><![CDATA[Channy Yun]]></dc:creator>
		<pubDate>Thu, 26 Aug 2021 16:03:49 +0000</pubDate>
				<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[Price Reduction]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=91c1d5e74e2918a59d9b2e4cbc4084d1</guid>

					<description><![CDATA[Introduced at AWS re:Invent 2018, Amazon Textract is a machine learning service that automatically extracts text, handwriting and data from scanned documents that goes beyond simple optical character recognition (OCR) to identify, understand, and extract data from forms and tables. In the past few months, we introduced specialized support for processing invoices and receipts and […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Automate Document Processing in Logistics using AI</title>
		<link>https://noise.getoto.net/2021/08/19/automate-document-processing-in-logistics-using-ai/</link>
		
		<dc:creator><![CDATA[Manikanth Pasumarti]]></dc:creator>
		<pubDate>Wed, 18 Aug 2021 23:04:05 +0000</pubDate>
				<category><![CDATA[Amazon Comprehend]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[Architecture]]></category>
		<category><![CDATA[artificial intelligence]]></category>
		<category><![CDATA[AWS Step Functions]]></category>
		<category><![CDATA[Document Processing]]></category>
		<category><![CDATA[Intermediate (200)]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=d00617c49d44023b108a552fde5ea802</guid>

					<description><![CDATA[Multi-modal transportation is one of the biggest developments in the logistics industry. There has been a successful collaboration across different transportation partners in supply chain freight forwarding for many decades. But there’s still a considerable overhead of paperwork processing for each leg of the trip. Tens of billions of documents are processed in ocean freight […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>CohnReznick Automates Claim Validation Workflow Using AWS AI Services</title>
		<link>https://noise.getoto.net/2021/07/23/cohnreznick-automates-claim-validation-workflow-using-aws-ai-services/</link>
		
		<dc:creator><![CDATA[Rajeswari Malladi]]></dc:creator>
		<pubDate>Fri, 23 Jul 2021 15:56:16 +0000</pubDate>
				<category><![CDATA[Amazon Augmented AI]]></category>
		<category><![CDATA[Amazon Comprehend]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[Architecture]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=a4bf5f1cf480717634e9216188d85942</guid>

					<description><![CDATA[This post was co-written by Winn Oo and Brendan Byam of CohnReznick and Rajeswari Malladi and Shanthan Kesharaju CohnReznick is a leading advisory, assurance, and tax firm serving clients around the world. CohnReznick’s government and public sector practice provides claims audit and verification services for state agencies. This process begins with recipients submitting documentation as […]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Getting started with RPA using AWS Step Functions and Amazon Textract</title>
		<link>https://noise.getoto.net/2020/11/16/getting-started-with-rpa-using-aws-step-functions-and-amazon-textract/</link>
		
		<dc:creator><![CDATA[James Beswick]]></dc:creator>
		<pubDate>Mon, 16 Nov 2020 15:26:19 +0000</pubDate>
				<category><![CDATA[Amazon Simple Notification Service (SNS)]]></category>
		<category><![CDATA[Amazon Simple Queue Service (SQS)]]></category>
		<category><![CDATA[Amazon Simple Storage Services (S3)]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[AWS Step Functions]]></category>
		<category><![CDATA[serverless]]></category>
		<category><![CDATA[Technical How-to]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=3ae9190ac19571383ceb2888a05c6f6a</guid>

					<description><![CDATA[This post is courtesy of Joe Tringali, Solutions Architect. Many organizations are using robotic process automation (RPA) to automate workflow, back-office processes that are labor-intensive. RPA, as software bots, can often handle many of these activities. Often RPA workflows contain repetitive manual tasks that must be done by humans, such as viewing invoices to find [&#8230;]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
		<item>
		<title>Building a serverless document scanner using Amazon Textract and AWS Amplify</title>
		<link>https://noise.getoto.net/2020/09/03/building-a-serverless-document-scanner-using-amazon-textract-and-aws-amplify/</link>
		
		<dc:creator><![CDATA[Moheeb Zara]]></dc:creator>
		<pubDate>Thu, 03 Sep 2020 20:12:17 +0000</pubDate>
				<category><![CDATA[Amazon API Gateway]]></category>
		<category><![CDATA[Amazon Cognito]]></category>
		<category><![CDATA[Amazon DynamoDB]]></category>
		<category><![CDATA[Amazon Simple Storage Services (S3)]]></category>
		<category><![CDATA[Amazon Textract]]></category>
		<category><![CDATA[AWS Amplify]]></category>
		<category><![CDATA[AWS Lambda]]></category>
		<category><![CDATA[AWS Serverless Application Model]]></category>
		<category><![CDATA[AWS Serverless Application Repository]]></category>
		<category><![CDATA[DynamoDB]]></category>
		<category><![CDATA[serverless]]></category>
		<category><![CDATA[Uncategorized]]></category>
		<guid isPermaLink="false">http://noise.getoto.net/?guid=e05e69a38244b7183e350dda2f583cee</guid>

					<description><![CDATA[This guide demonstrates creating and deploying a production ready document scanning application. It allows users to manage projects, upload images, and generate a PDF from detected text. The sample can be used as a template for building expense tracking applications, handling forms and legal documents, or for digitizing books and notes. The frontend application is [&#8230;]]]></description>
		
		
		<enclosure url="" length="0" type="" />

			</item>
	</channel>
</rss>

<!--
Performance optimized by W3 Total Cache. Learn more: https://www.boldgrid.com/w3-total-cache/

Object Caching 80/434 objects using Memcached
Page Caching using Disk: Enhanced 
Lazy Loading (feed)
Database Caching using Memcached

Served from: noise.getoto.net @ 2025-12-07 14:53:30 by W3 Total Cache
-->