<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>Apache Spark - Wikitechy</title>
	<atom:link href="https://www.wikitechy.com/interview-questions/category/apache-spark/feed/" rel="self" type="application/rss+xml" />
	<link>https://www.wikitechy.com/interview-questions/category/apache-spark/</link>
	<description>Interview Questions</description>
	<lastBuildDate>Tue, 14 Sep 2021 10:04:46 +0000</lastBuildDate>
	<language>en-US</language>
	<sy:updatePeriod>
	hourly	</sy:updatePeriod>
	<sy:updateFrequency>
	1	</sy:updateFrequency>
	<generator>https://wordpress.org/?v=6.9.4</generator>

<image>
	<url>https://www.wikitechy.com/interview-questions/wp-content/uploads/2025/10/cropped-wikitechy-icon-32x32.png</url>
	<title>Apache Spark - Wikitechy</title>
	<link>https://www.wikitechy.com/interview-questions/category/apache-spark/</link>
	<width>32</width>
	<height>32</height>
</image> 
	<item>
		<title>What is Shark ?</title>
		<link>https://www.wikitechy.com/interview-questions/apache-spark/what-is-shark/</link>
					<comments>https://www.wikitechy.com/interview-questions/apache-spark/what-is-shark/#respond</comments>
		
		<dc:creator><![CDATA[Editor]]></dc:creator>
		<pubDate>Mon, 12 Jul 2021 16:16:52 +0000</pubDate>
				<category><![CDATA[Apache Spark]]></category>
		<category><![CDATA[Accenture interview questions and answers]]></category>
		<category><![CDATA[Altimetrik India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[apache analytics software]]></category>
		<category><![CDATA[apache hadoop and spark]]></category>
		<category><![CDATA[apache hadoop vs apache spark]]></category>
		<category><![CDATA[apache hadoop vs spark]]></category>
		<category><![CDATA[apache hive]]></category>
		<category><![CDATA[apache hive spark]]></category>
		<category><![CDATA[apache hive vs spark]]></category>
		<category><![CDATA[apache shark]]></category>
		<category><![CDATA[apache spark]]></category>
		<category><![CDATA[apache spark analytics]]></category>
		<category><![CDATA[apache spark and hadoop]]></category>
		<category><![CDATA[apache spark architecture]]></category>
		<category><![CDATA[apache spark big data]]></category>
		<category><![CDATA[apache spark cassandra]]></category>
		<category><![CDATA[apache spark cloudapache spark cost]]></category>
		<category><![CDATA[apache spark distribution]]></category>
		<category><![CDATA[apache spark engine]]></category>
		<category><![CDATA[apache spark framework]]></category>
		<category><![CDATA[apache spark hadoop]]></category>
		<category><![CDATA[apache spark hdfs]]></category>
		<category><![CDATA[apache spark hive]]></category>
		<category><![CDATA[apache spark in memory]]></category>
		<category><![CDATA[apache spark in memory database]]></category>
		<category><![CDATA[apache spark libraries]]></category>
		<category><![CDATA[apache spark open source]]></category>
		<category><![CDATA[apache spark or hadoop]]></category>
		<category><![CDATA[apache spark orgapache spark projects]]></category>
		<category><![CDATA[apache spark sql]]></category>
		<category><![CDATA[apache spark tools]]></category>
		<category><![CDATA[apache spark use cases]]></category>
		<category><![CDATA[apache spark vs apache hadoop]]></category>
		<category><![CDATA[apache spark vs hadoop]]></category>
		<category><![CDATA[apache spark vs hive]]></category>
		<category><![CDATA[Big Data for Big Sharks]]></category>
		<category><![CDATA[Capgemini interview questions and answers]]></category>
		<category><![CDATA[CASTING NETWORKS INDIA PVT LIMITED interview questions and answers]]></category>
		<category><![CDATA[CGI Group Inc interview questions and answers]]></category>
		<category><![CDATA[Collabera Technologies interview questions and answers]]></category>
		<category><![CDATA[Dell International Services India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Flipkart interview questions and answers]]></category>
		<category><![CDATA[Genpact interview questions and answers]]></category>
		<category><![CDATA[Hive on Spark]]></category>
		<category><![CDATA[IBM interview questions and answers]]></category>
		<category><![CDATA[JPMorgan Chase & Co interview questions and answers]]></category>
		<category><![CDATA[L&T Infotech interview questions and answers]]></category>
		<category><![CDATA[Mindtree interview questions and answers]]></category>
		<category><![CDATA[Oracle Corporation interview questions and answers]]></category>
		<category><![CDATA[Prokarma Softech Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[R Systems interview questions and answers]]></category>
		<category><![CDATA[RBS India Development Centre Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Reliance Industries Ltd interview questions and answers]]></category>
		<category><![CDATA[Sapient Consulting Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Shark]]></category>
		<category><![CDATA[Shark - SQL on Spark]]></category>
		<category><![CDATA[Shark and Spark SQL]]></category>
		<category><![CDATA[shark in spark]]></category>
		<category><![CDATA[shark spark drone]]></category>
		<category><![CDATA[shark vs spark]]></category>
		<category><![CDATA[Spark and shark]]></category>
		<category><![CDATA[spark shark fish hunt]]></category>
		<category><![CDATA[spark sql]]></category>
		<category><![CDATA[spark vs shark]]></category>
		<category><![CDATA[Synechron Te interview questions and answers]]></category>
		<category><![CDATA[Tata Consultancy Service interview questions and answers]]></category>
		<category><![CDATA[Tech Mahindra interview questions and answers]]></category>
		<category><![CDATA[the future of SQL on Apache]]></category>
		<category><![CDATA[Trigent Software interview questions and answers]]></category>
		<category><![CDATA[UnitedHealth Group interview questions and answers]]></category>
		<category><![CDATA[Virtusa Consulting Services Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Wells Fargo interview questions and answers]]></category>
		<category><![CDATA[What is Apache Shark?]]></category>
		<category><![CDATA[Wipro Infotech interview questions and answers]]></category>
		<category><![CDATA[Xoriant Solutions Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Yodlee Infotech Pvt Ltd interview questions and answers]]></category>
		<guid isPermaLink="false">https://www.wikitechy.com/interview-questions/?p=254</guid>

					<description><![CDATA[Answer : Shark is a tool, developed for people who are from...]]></description>
										<content:encoded><![CDATA[<div class="TextHeading">
<div class="hddn">
<h2 id="what-is-shark" class="color-pink" style="text-align: justify;">What is Shark ?</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li>Shark is a tool, developed for people who are from a database background &#8211; to access Scala MLlib capabilities through a Hive-like <a href="https://www.wikitechy.com/tutorials/sql/" target="_blank" rel="noopener">SQL</a> interface.</li>
<li>Shark tool helps data users run Hive on <a href="https://forums.wikitechy.com/qa-tag/apache-spark/" target="_blank" rel="noopener">Spark</a> &#8211; offering compatibility with Hive metastore, queries and data.</li>
<li>Like Hive, Spark queries are written using a SQL-like language called HiveQL, which Spark translates into Spark Directed Acyclic Graphs (DAGs) that are executed on the Hadoop cluster.</li>
<li>More complex queries are supported through User Defined Functions (UDFs) that can be written in <a href="https://www.wikitechy.com/tutorials/java/" target="_blank" rel="noopener">Java</a> and referenced by a HiveQL query.</li>
</ul>
</div>
</div>
<div class="text-center row" style="text-align: justify;"></div>
<div class="ImageContent">
<div class="hddn"><img decoding="async" class="img-responsive center-block aligncenter" src="https://cdn.wikitechy.com/interview-questions/apache-spark/what-is-shark.jpg" alt="What is Shark" /></div>
</div>
]]></content:encoded>
					
					<wfw:commentRss>https://www.wikitechy.com/interview-questions/apache-spark/what-is-shark/feed/</wfw:commentRss>
			<slash:comments>0</slash:comments>
		
		
			</item>
		<item>
		<title>What is the difference between Spark and Hadoop MapReduce ?</title>
		<link>https://www.wikitechy.com/interview-questions/apache-spark/what-is-the-difference-between-spark-and-hadoop-mapreduce/</link>
					<comments>https://www.wikitechy.com/interview-questions/apache-spark/what-is-the-difference-between-spark-and-hadoop-mapreduce/#respond</comments>
		
		<dc:creator><![CDATA[Editor]]></dc:creator>
		<pubDate>Mon, 12 Jul 2021 16:09:43 +0000</pubDate>
				<category><![CDATA[Apache Spark]]></category>
		<category><![CDATA[Accenture interview questions and answers]]></category>
		<category><![CDATA[Altimetrik India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[big data vs hadoop difference]]></category>
		<category><![CDATA[can you explain the difference between hadoop and spark]]></category>
		<category><![CDATA[Capgemini interview questions and answers]]></category>
		<category><![CDATA[cassandra hadoop difference]]></category>
		<category><![CDATA[CASTING NETWORKS INDIA PVT LIMITED interview questions and answers]]></category>
		<category><![CDATA[CGI Group Inc interview questions and answers]]></category>
		<category><![CDATA[Collabera Technologies interview questions and answers]]></category>
		<category><![CDATA[Dell International Services India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[difference between apache spark and hadoop]]></category>
		<category><![CDATA[difference between apache spark and storm]]></category>
		<category><![CDATA[difference between apache storm and spark]]></category>
		<category><![CDATA[difference between big data and hadoop]]></category>
		<category><![CDATA[difference between cloudera and hadoop]]></category>
		<category><![CDATA[difference between hadoop and cassandra]]></category>
		<category><![CDATA[difference between hadoop and cloud computing]]></category>
		<category><![CDATA[difference between hadoop and cloudera]]></category>
		<category><![CDATA[difference between hadoop and data warehouse]]></category>
		<category><![CDATA[difference between hadoop and hbase]]></category>
		<category><![CDATA[difference between hadoop and hdfs]]></category>
		<category><![CDATA[difference between hadoop and hdfs commands]]></category>
		<category><![CDATA[difference between hadoop and hive]]></category>
		<category><![CDATA[difference between hadoop and mapreduce]]></category>
		<category><![CDATA[difference between hadoop and spark]]></category>
		<category><![CDATA[difference between hadoop and sql]]></category>
		<category><![CDATA[difference between hdfs and mapreduce]]></category>
		<category><![CDATA[difference between hive and hadoop]]></category>
		<category><![CDATA[difference between hive and hbase]]></category>
		<category><![CDATA[difference between hive and spark]]></category>
		<category><![CDATA[difference between mapreduce and spark]]></category>
		<category><![CDATA[difference between mapreduce and yarn]]></category>
		<category><![CDATA[difference between node and cluster in hadoop]]></category>
		<category><![CDATA[difference between spark and mapreduce]]></category>
		<category><![CDATA[difference between spark and scala]]></category>
		<category><![CDATA[difference between sql and hadoop]]></category>
		<category><![CDATA[Flipkart interview questions and answers]]></category>
		<category><![CDATA[Genpact interview questions and answers]]></category>
		<category><![CDATA[hadoop and spark difference]]></category>
		<category><![CDATA[hadoop spark difference]]></category>
		<category><![CDATA[IBM interview questions and answers]]></category>
		<category><![CDATA[JPMorgan Chase & Co interview questions and answers]]></category>
		<category><![CDATA[L&T Infotech interview questions and answers]]></category>
		<category><![CDATA[mapreduce vs spark differences]]></category>
		<category><![CDATA[Mindtree interview questions and answers]]></category>
		<category><![CDATA[Oracle Corporation interview questions and answers]]></category>
		<category><![CDATA[Prokarma Softech Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[R Systems interview questions and answers]]></category>
		<category><![CDATA[RBS India Development Centre Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Reliance Industries Ltd interview questions and answers]]></category>
		<category><![CDATA[Sapient Consulting Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Synechron Te interview questions and answers]]></category>
		<category><![CDATA[Tata Consultancy Service interview questions and answers]]></category>
		<category><![CDATA[Tech Mahindra interview questions and answers]]></category>
		<category><![CDATA[Trigent Software interview questions and answers]]></category>
		<category><![CDATA[UnitedHealth Group interview questions and answers]]></category>
		<category><![CDATA[Virtusa Consulting Services Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Wells Fargo interview questions and answers]]></category>
		<category><![CDATA[what is difference between hadoop and bigdata]]></category>
		<category><![CDATA[what is the difference between big data and hadoop]]></category>
		<category><![CDATA[what is the difference between hadoop and mapreduce]]></category>
		<category><![CDATA[what is the difference between hadoop and spark]]></category>
		<category><![CDATA[what is the difference between spark and hadoop]]></category>
		<category><![CDATA[What is the difference between Spark and Hadoop MapReduce]]></category>
		<category><![CDATA[what is the relationship between hadoop and spark]]></category>
		<category><![CDATA[Wipro Infotech interview questions and answers]]></category>
		<category><![CDATA[Xoriant Solutions Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Yodlee Infotech Pvt Ltd interview questions and answers]]></category>
		<guid isPermaLink="false">https://www.wikitechy.com/interview-questions/?p=252</guid>

					<description><![CDATA[Answer : Apache Spark is an open-source distributed cluster-computing...]]></description>
										<content:encoded><![CDATA[<div class="TextHeading">
<div class="hddn">
<h2 id="what-is-apache-spark" class="color-pink" style="text-align: justify;"><span style="font-family: inherit; font-size: 2rem;">What is Apache Spark</span></h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li>Apache Spark is an open-source distributed cluster-computing framework.</li>
<li>Spark is a data processing engine developed to provide faster and easier-to-use analytics than Hadoop MapReduce.</li>
<li>Before the Apache Software Foundation took possession of Spark, it was under the control of the University of California, Berkeley’s AMPLab.</li>
</ul>
</div>
</div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="what-is-apache-hadoop" class="color-purple">What is Apache Hadoop</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li>Apache Hadoop is an open-source framework written in Java that allows us to store and process Big Data in a distributed environment, across various clusters of computers using simple programming constructs.</li>
<li>To do this, Hadoop uses an algorithm called MapReduce, which divides the task into small parts and assigns them to a set of computers.</li>
<li>Hadoop also has its own file system, Hadoop Distributed File System (HDFS), which is based on the Google File System (GFS).</li>
<li>HDFS is designed to run on low-cost hardware.</li>
</ul>
</div>
</div>
<div class="ImageContent">
<div class="hddn"><img decoding="async" class="img-responsive center-block aligncenter" src="https://cdn.wikitechy.com/interview-questions/apache-spark/apache-hadoop-vs-apache-spark.png" alt=" " /></div>
<div>
<div class="hddn" style="text-align: justify;">
<table class="table-bordered table-striped table table-responsive">
<tbody>
<tr>
<th>CRITERIA</th>
<th>SPARK</th>
<th>HADOOP MAPREDUCE</th>
</tr>
<tr>
<td class="text-leftalign">Memory</td>
<td class="text-leftalign">Lets you save data in memory with<br />
the use of RDDs.</td>
<td class="text-leftalign">Does not leverage the memory of the hadoop cluster to maximum.</td>
</tr>
<tr>
<td class="text-leftalign">Disk usage</td>
<td class="text-leftalign"><a href="https://forums.wikitechy.com/question-category/apache-spark/" target="_blank" rel="noopener">Spark</a> caches data in-memory<br />
and ensures low latency.</td>
<td class="text-leftalign">MapReduce is disk oriented.</td>
</tr>
<tr>
<td class="text-leftalign">Processing</td>
<td class="text-leftalign">Supports real-time processing through<br />
spark streaming.</td>
<td class="text-leftalign">Only batch processing is supported</td>
</tr>
<tr>
<td class="text-leftalign">Installation</td>
<td class="text-leftalign">Is not bound to Hadoop.</td>
<td class="text-leftalign">Is bound to <a href="https://forums.wikitechy.com/question-category/hadoop/" target="_blank" rel="noopener">hadoop</a>.</td>
</tr>
<tr>
<td class="text-leftalign">Storage</td>
<td class="text-leftalign">Leverages existing storage</td>
<td class="text-leftalign">HDFS</td>
</tr>
<tr>
<td class="text-leftalign">Speed</td>
<td class="text-leftalign">10 &#8211; 100X faster.</td>
<td class="text-leftalign">Fast.</td>
</tr>
<tr>
<td class="text-leftalign">Resource management</td>
<td class="text-leftalign">standalone</td>
<td class="text-leftalign">YARN</td>
</tr>
</tbody>
</table>
</div>
<div class="ImageContent">
<div class="hddn"><img decoding="async" class="img-responsive center-block aligncenter" src="https://cdn.wikitechy.com/interview-questions/apache-spark/hadoop-vs-spark.png" alt="Hadoop Vs Spark" /></div>
</div>
</div>
</div>
]]></content:encoded>
					
					<wfw:commentRss>https://www.wikitechy.com/interview-questions/apache-spark/what-is-the-difference-between-spark-and-hadoop-mapreduce/feed/</wfw:commentRss>
			<slash:comments>0</slash:comments>
		
		
			</item>
		<item>
		<title>What is RDD ?</title>
		<link>https://www.wikitechy.com/interview-questions/apache-spark/what-is-rdd/</link>
					<comments>https://www.wikitechy.com/interview-questions/apache-spark/what-is-rdd/#respond</comments>
		
		<dc:creator><![CDATA[Editor]]></dc:creator>
		<pubDate>Mon, 12 Jul 2021 15:56:56 +0000</pubDate>
				<category><![CDATA[Apache Spark]]></category>
		<category><![CDATA[Accenture interview questions and answers]]></category>
		<category><![CDATA[apache spark]]></category>
		<category><![CDATA[Applied Materials interview questions and answers]]></category>
		<category><![CDATA[Capgemini interview questions and answers]]></category>
		<category><![CDATA[CASTING NETWORKS INDIA PVT LIMITED interview questions and answers]]></category>
		<category><![CDATA[CGI Group Inc interview questions and answers]]></category>
		<category><![CDATA[characteristics of rdd]]></category>
		<category><![CDATA[Chetu interview questions and answers]]></category>
		<category><![CDATA[Ciena Corporation interview questions and answers]]></category>
		<category><![CDATA[Collabera Technologies interview questions and answers]]></category>
		<category><![CDATA[Dell International Services India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Flipkart interview questions and answers]]></category>
		<category><![CDATA[hat is rdd in apache spark]]></category>
		<category><![CDATA[IBM interview questions and answers]]></category>
		<category><![CDATA[Indecomm Global Services interview questions and answers]]></category>
		<category><![CDATA[Indiabulls Technology Solutions Ltd interview questions and answers]]></category>
		<category><![CDATA[Infosys Technologies interview questions and answers]]></category>
		<category><![CDATA[Mavenir interview questions and answers]]></category>
		<category><![CDATA[Mphasis interview questions and answers]]></category>
		<category><![CDATA[Nagarro Software Pvt. Ltd interview questions and answers]]></category>
		<category><![CDATA[NetApp interview questions and answers]]></category>
		<category><![CDATA[Opentext Technologies interview questions and answers]]></category>
		<category><![CDATA[Oracle Corporation interview questions and answers]]></category>
		<category><![CDATA[Persistent Systems interview questions and answers]]></category>
		<category><![CDATA[RBS India Development Centre Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[rdd basics]]></category>
		<category><![CDATA[rdd in memory]]></category>
		<category><![CDATA[rdd meaning]]></category>
		<category><![CDATA[rdd properties]]></category>
		<category><![CDATA[resilient distributed dataset]]></category>
		<category><![CDATA[rrd extension]]></category>
		<category><![CDATA[rrd file format]]></category>
		<category><![CDATA[rrd file viewer]]></category>
		<category><![CDATA[rrd server]]></category>
		<category><![CDATA[SAP Labs India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[spark dataframe]]></category>
		<category><![CDATA[spark hadoop file]]></category>
		<category><![CDATA[spark hadoop file example]]></category>
		<category><![CDATA[spark rdd]]></category>
		<category><![CDATA[spark rdd api]]></category>
		<category><![CDATA[spark rdd collect]]></category>
		<category><![CDATA[spark rdd explained]]></category>
		<category><![CDATA[spark rdd filter]]></category>
		<category><![CDATA[spark rdd functions]]></category>
		<category><![CDATA[spark rdd internals]]></category>
		<category><![CDATA[spark rdd join]]></category>
		<category><![CDATA[spark rdd last element]]></category>
		<category><![CDATA[spark rdd map]]></category>
		<category><![CDATA[spark rdd mean]]></category>
		<category><![CDATA[spark rdd operations]]></category>
		<category><![CDATA[spark rdd partition]]></category>
		<category><![CDATA[spark rdd persist]]></category>
		<category><![CDATA[spark rdd print]]></category>
		<category><![CDATA[spark rdd sample]]></category>
		<category><![CDATA[spark rdd to dataframe]]></category>
		<category><![CDATA[spark rdd to df]]></category>
		<category><![CDATA[spark rdd transformations]]></category>
		<category><![CDATA[spark rdd vs dataframe]]></category>
		<category><![CDATA[spark sql]]></category>
		<category><![CDATA[spark tutorial]]></category>
		<category><![CDATA[Tech Mahindra interview questions and answers]]></category>
		<category><![CDATA[types of operations that can be performed on rdd]]></category>
		<category><![CDATA[types of rdd]]></category>
		<category><![CDATA[types of spark rdd operations]]></category>
		<category><![CDATA[UnitedHealth Group interview questions and answers]]></category>
		<category><![CDATA[Virtusa Consulting Services Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Wells Fargo interview questions and answers]]></category>
		<category><![CDATA[what does rdd mean]]></category>
		<category><![CDATA[what does rdd mean in texting]]></category>
		<category><![CDATA[what is a spark rdd]]></category>
		<category><![CDATA[what is an rdd object]]></category>
		<category><![CDATA[what is an rddw]]></category>
		<category><![CDATA[what is rdd]]></category>
		<category><![CDATA[what is rdd in spark]]></category>
		<category><![CDATA[what is rdd in spark with example]]></category>
		<category><![CDATA[what is spark rdd]]></category>
		<category><![CDATA[WM Global Technology Services India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Xoriant Solutions Pvt Ltd interview questions and answers]]></category>
		<guid isPermaLink="false">https://www.wikitechy.com/interview-questions/?p=250</guid>

					<description><![CDATA[Answer : Resilient Distributed Datasets (RDD) is a fundamental data structure...]]></description>
										<content:encoded><![CDATA[<div class="TextHeading">
<div class="hddn">
<h2 id="what-is-rdd" class="color-pink" style="text-align: justify;">What is RDD ?</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li>Resilient Distributed Datasets (RDD) is a fundamental data structure of <a href="https://forums.wikitechy.com/qa-tag/apache-spark/" target="_blank" rel="noopener">Spark</a>. It is an immutable distributed collection of objects.</li>
<li>Each dataset in RDD is divided into logical partitions, which may be computed on different nodes of the cluster.</li>
<li>Formally, an RDD is a read-only, partitioned collection of records.</li>
<li>RDDs can be created through deterministic operations on either data on stable storage or other RDDs.</li>
<li>RDD is a fault-tolerant collection of elements that can be operated in parallel.</li>
</ul>
</div>
</div>
<div class="ImageContent">
<div class="hddn"><img decoding="async" class="img-responsive center-block aligncenter" src="https://cdn.wikitechy.com/interview-questions/apache-spark/what-is-rdd.png" alt="what is RDD" /></div>
</div>
]]></content:encoded>
					
					<wfw:commentRss>https://www.wikitechy.com/interview-questions/apache-spark/what-is-rdd/feed/</wfw:commentRss>
			<slash:comments>0</slash:comments>
		
		
			</item>
	</channel>
</rss>
