<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<!-- Channel-level metadata for this author feed; atom:link is the feed's own (self) URL. -->
	<title>Vara Bonthu – Noise</title>
	<atom:link href="https://noise.getoto.net/author/vara-bonthu/feed/" rel="self" type="application/rss+xml" />
	<link>https://noise.getoto.net</link>
	<description>The collective thoughts of the interwebz</description>
	<lastBuildDate>Wed, 14 Sep 2022 15:44:27 +0000</lastBuildDate>
	<language>en-US</language>
	<!-- Syndication hints are kept on one line: whitespace inside these elements is text content. -->
	<sy:updatePeriod>hourly</sy:updatePeriod>
	<sy:updateFrequency>1</sy:updateFrequency>
	<generator>https://wordpress.org/?v=6.8.2</generator>
	<item>
		<title>Run Apache Spark with Amazon EMR on EKS backed by Amazon FSx for Lustre storage</title>
		<link>https://noise.getoto.net/2022/09/14/run-apache-spark-with-amazon-emr-on-eks-backed-by-amazon-fsx-for-lustre-storage/</link>
		<dc:creator><![CDATA[Vara Bonthu]]></dc:creator>
		<pubDate>Wed, 14 Sep 2022 15:44:27 +0000</pubDate>
		<category><![CDATA[Amazon EMR]]></category>
		<category><![CDATA[Amazon FSx for Lustre]]></category>
		<category><![CDATA[Analytics]]></category>
		<!-- Opaque identifier (isPermaLink="false"); it is not a navigable URL and must stay stable. -->
		<guid isPermaLink="false">http://noise.getoto.net/?guid=caa3b71b6728bd17ef9719eb1b9f0421</guid>
		<description><![CDATA[Traditionally, Spark workloads have been run on a dedicated setup like a Hadoop stack with YARN or MESOS as a resource manager. Starting from Apache Spark 2.3, Spark added support for Kubernetes as a resource manager. The new Kubernetes scheduler natively supports the submission of Spark jobs to a Kubernetes cluster. Spark on Kubernetes provides […]]]></description>
		<!-- No <enclosure>: this entry supplies no media URL, and RSS 2.0 requires non-empty url, length and type. -->
	</item>
		<item>
			<title>Building a serverless data quality and analysis framework with Deequ and AWS Glue</title>
			<link>https://noise.getoto.net/2020/12/29/building-a-serverless-data-quality-and-analysis-framework-with-deequ-and-aws-glue/</link>
			<dc:creator><![CDATA[Vara Bonthu]]></dc:creator>
			<pubDate>Tue, 29 Dec 2020 17:33:00 +0000</pubDate>
			<category><![CDATA[AWS Big Data]]></category>
			<category><![CDATA[AWS Glue]]></category>
			<!-- Opaque identifier (isPermaLink="false"); it is not a navigable URL and must stay stable. -->
			<guid isPermaLink="false">http://noise.getoto.net/?guid=efd98b5d899469206311b55a6bdf0f24</guid>
			<!-- The ellipsis is a literal character: numeric references are not expanded by the XML parser inside CDATA. -->
			<description><![CDATA[With ever-increasing amounts of data at their disposal, large organizations struggle to cope with not only the volume but also the quality of the data they manage. Indeed, alongside volume and velocity, veracity is an equally critical issue in data analysis, often seen as a precondition to analyzing data and guaranteeing its value. High-quality data […]]]></description>
			<!-- No <enclosure>: this entry supplies no media URL, and RSS 2.0 requires non-empty url, length and type. -->
		</item>
	</channel>
</rss>

<!--
Performance optimized by W3 Total Cache. Learn more: https://www.boldgrid.com/w3-total-cache/

Object Caching 42/44 objects using Memcached
Page Caching using Disk: Enhanced 
Lazy Loading (feed)
Database Caching using Memcached

Served from: noise.getoto.net @ 2026-02-09 19:47:02 by W3 Total Cache
-->