<?xml version="1.0" encoding="UTF-8"?><rss version="2.0"
	xmlns:content="http://purl.org/rss/1.0/modules/content/"
	xmlns:wfw="http://wellformedweb.org/CommentAPI/"
	xmlns:dc="http://purl.org/dc/elements/1.1/"
	xmlns:atom="http://www.w3.org/2005/Atom"
	xmlns:sy="http://purl.org/rss/1.0/modules/syndication/"
	xmlns:slash="http://purl.org/rss/1.0/modules/slash/"
	>

<channel>
	<title>difference between big data and hadoop - Wikitechy</title>
	<atom:link href="https://www.wikitechy.com/interview-questions/tag/difference-between-big-data-and-hadoop/feed/" rel="self" type="application/rss+xml" />
	<link>https://www.wikitechy.com/interview-questions/tag/difference-between-big-data-and-hadoop/</link>
	<description>Interview Questions</description>
	<lastBuildDate>Tue, 14 Sep 2021 10:01:41 +0000</lastBuildDate>
	<language>en-US</language>
	<sy:updatePeriod>
	hourly	</sy:updatePeriod>
	<sy:updateFrequency>
	1	</sy:updateFrequency>
	<generator>https://wordpress.org/?v=6.9</generator>

<image>
	<url>https://www.wikitechy.com/interview-questions/wp-content/uploads/2025/10/cropped-wikitechy-icon-32x32.png</url>
	<title>difference between big data and hadoop - Wikitechy</title>
	<link>https://www.wikitechy.com/interview-questions/tag/difference-between-big-data-and-hadoop/</link>
	<width>32</width>
	<height>32</height>
</image> 
	<item>
		<title>Difference between Hive and HBase ?</title>
		<link>https://www.wikitechy.com/interview-questions/big-data/difference-between-hive-and-hbase/</link>
					<comments>https://www.wikitechy.com/interview-questions/big-data/difference-between-hive-and-hbase/#respond</comments>
		
		<dc:creator><![CDATA[Editor]]></dc:creator>
		<pubDate>Mon, 12 Jul 2021 19:18:59 +0000</pubDate>
				<category><![CDATA[Big Data]]></category>
		<category><![CDATA[Accenture interview questions and answers]]></category>
		<category><![CDATA[AT&T interview questions and answers]]></category>
		<category><![CDATA[Atos interview questions and answers]]></category>
		<category><![CDATA[big data and hadoop difference]]></category>
		<category><![CDATA[big data vs hadoop difference]]></category>
		<category><![CDATA[Capgemini interview questions and answers]]></category>
		<category><![CDATA[CASTING NETWORKS INDIA PVT LIMITED interview questions and answers]]></category>
		<category><![CDATA[CGI Group Inc interview questions and answers]]></category>
		<category><![CDATA[Collabera Technologiesinterview questions and answers]]></category>
		<category><![CDATA[Dell International Services India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[difference between apache hadoop and cloudera hadoop]]></category>
		<category><![CDATA[difference between big data and hadoop]]></category>
		<category><![CDATA[difference between cassandra and hbase]]></category>
		<category><![CDATA[difference between hadoop and cassandra]]></category>
		<category><![CDATA[difference between hadoop and cloudera]]></category>
		<category><![CDATA[difference between hadoop and hbase]]></category>
		<category><![CDATA[difference between hadoop and hive]]></category>
		<category><![CDATA[difference between hadoop and mongodb]]></category>
		<category><![CDATA[difference between hadoop and nosql]]></category>
		<category><![CDATA[difference between hadoop and oracle]]></category>
		<category><![CDATA[difference between hadoop and spark]]></category>
		<category><![CDATA[difference between hadoop and sql]]></category>
		<category><![CDATA[difference between hbase and cassandra]]></category>
		<category><![CDATA[difference between hbase and hdfs]]></category>
		<category><![CDATA[difference between hbase and hive]]></category>
		<category><![CDATA[difference between hive and hadoop]]></category>
		<category><![CDATA[difference between hive and impala]]></category>
		<category><![CDATA[difference between hive and pig]]></category>
		<category><![CDATA[difference between hive and spark]]></category>
		<category><![CDATA[difference between hive and sql]]></category>
		<category><![CDATA[Difference between Hive vs HBase]]></category>
		<category><![CDATA[difference between hiveql and sql]]></category>
		<category><![CDATA[difference between impala and hive]]></category>
		<category><![CDATA[difference between mapreduce and spark]]></category>
		<category><![CDATA[difference between mongodb and hbase]]></category>
		<category><![CDATA[difference between pig and hive]]></category>
		<category><![CDATA[difference between spark and mapreduce]]></category>
		<category><![CDATA[difference between sql and hadoop]]></category>
		<category><![CDATA[difference between sql and hive]]></category>
		<category><![CDATA[Ernst & Young interview questions and answers]]></category>
		<category><![CDATA[Flipkart interview questions and answers]]></category>
		<category><![CDATA[Genpact interview questions and answers]]></category>
		<category><![CDATA[hadoop and spark difference]]></category>
		<category><![CDATA[hbase and hive difference]]></category>
		<category><![CDATA[hbase architecture]]></category>
		<category><![CDATA[hbase vs hdfs]]></category>
		<category><![CDATA[hbase vs hive vs cassandra]]></category>
		<category><![CDATA[hbase vs spark]]></category>
		<category><![CDATA[hdfs vs hbase vs hive]]></category>
		<category><![CDATA[hive and pig difference]]></category>
		<category><![CDATA[hive vs hbase vs impala]]></category>
		<category><![CDATA[hive vs hbase vs pig]]></category>
		<category><![CDATA[hive vs hbase vs spark]]></category>
		<category><![CDATA[hive vs pig]]></category>
		<category><![CDATA[IBM interview questions and answers]]></category>
		<category><![CDATA[Indecomm Global Services interview questions and answers]]></category>
		<category><![CDATA[L&T Infotech interview questions and answers]]></category>
		<category><![CDATA[Mindtree interview questions and answers]]></category>
		<category><![CDATA[NetApp interview questions and answers]]></category>
		<category><![CDATA[pig and hive difference]]></category>
		<category><![CDATA[R Systems interview questions and answers]]></category>
		<category><![CDATA[RBS India Development Centre Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[SAP Labs India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Tata Consultancy Service interview questions and answers]]></category>
		<category><![CDATA[Tech Mahindra interview questions and answers]]></category>
		<category><![CDATA[Trigent Software interview questions and answers]]></category>
		<category><![CDATA[UnitedHealth Group interview questions and answers]]></category>
		<category><![CDATA[Virtusa Consulting Services Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Wells Fargo interview questions and answers]]></category>
		<category><![CDATA[what is difference between hadoop and bigdata]]></category>
		<category><![CDATA[what is difference between hadoop and spark]]></category>
		<category><![CDATA[what is the difference between big data and hadoop]]></category>
		<category><![CDATA[What is the difference between HBase and Hive]]></category>
		<category><![CDATA[what is the difference between pig and hive in hadoop]]></category>
		<category><![CDATA[what is the difference between spark and hadoop]]></category>
		<category><![CDATA[Wipro Infotech interview questions and answers]]></category>
		<category><![CDATA[Wipro interview questions and answers]]></category>
		<category><![CDATA[Xoriant Solutions Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[ZS Associates interview questions and answers]]></category>
		<guid isPermaLink="false">https://www.wikitechy.com/interview-questions/?p=301</guid>

					<description><![CDATA[Answer : Hive is a datawarehousing package built on the top of Hadoop...]]></description>
										<content:encoded><![CDATA[<div class="TextHeading">
<div class="hddn">
<h2 id="difference-between-hive-and-hbase" class="color-pink" style="text-align: justify;">Difference between Hive and HBase ?</h2>
</div>
</div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="hive" class="color-purple">Hive</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li><a href="https://www.wikitechy.com/tutorials/sqoop/sqoop-create-hive-table" target="_blank" rel="noopener">Hive</a> is a data warehousing package built on top of Hadoop. It is mainly used for data analysis. It is generally targeted towards users already comfortable with Structured Query Language (SQL).</li>
<li>It is similar to <a href="https://www.wikitechy.com/tutorials/sql/" target="_blank" rel="noopener">SQL</a> and called Hive Query Language (HQL).</li>
<li>Hive manages and queries structured data. Moreover, Hive abstracts the complexity of Hadoop. However, it has the following limitations:
<ul>
<li>Not a full database.</li>
<li>Not a real time processing system.</li>
<li>Not SQL-92 compliant.</li>
<li>Does not provide row level insert, updates or deletes.</li>
<li>Doesn’t support transactions and limited sub-query support.</li>
<li>Query optimization in evolving stage.</li>
</ul>
</li>
</ul>
</div>
</div>
<div class="text-center row" style="text-align: justify;"></div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="hbase" class="color-purple">Hbase</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li><a href="https://www.wikitechy.com/tutorials/sqoop/sqoop-import-to-hbase" target="_blank" rel="noopener">HBase</a> is a column-oriented database management system that runs on top of Hadoop Distributed File System (HDFS).</li>
<li>It is well suited for sparse data sets, which are common in many Big Data use cases.</li>
<li>It is an open-source, distributed database developed by the Apache Software Foundation.</li>
<li>Initially, it was named Google Big Table, afterwards it was re-named as HBase and is primarily written in <a href="https://www.wikitechy.com/tutorials/java/" target="_blank" rel="noopener">Java</a>.</li>
<li>It can store massive amount of data from terabytes to petabytes.</li>
<li>It is built for low-latency operations and is used extensively for read and write operations.</li>
<li>It stores large amount of data in the form of tables.</li>
</ul>
</div>
</div>
<div class="ImageContent" style="text-align: justify;">
<div class="hddn"><img decoding="async" class="img-responsive center-block" src="https://cdn.wikitechy.com/interview-questions/hive/difference-between-hive-and-hbase.png" alt="Difference between HIVE and HBASE" /></div>
</div>
<div class="hddn">
<table class="table-bordered table-striped table table-responsive">
<tbody>
<tr style="text-align: justify;">
<th>HIVE</th>
<th>HBASE</th>
</tr>
<tr style="text-align: justify;">
<td class="text-leftalign">Hive is a query engine.</td>
<td class="text-leftalign">Data storage particularly for unstructured data.</td>
</tr>
<tr style="text-align: justify;">
<td class="text-leftalign">Mainly used for batch processing.</td>
<td class="text-leftalign">Extensively used for transactional processing.</td>
</tr>
<tr style="text-align: justify;">
<td class="text-leftalign">Not a real time processing.</td>
<td class="text-leftalign">Real-time processing.</td>
</tr>
<tr style="text-align: justify;">
<td class="text-leftalign">Only for analytical queries.</td>
<td class="text-leftalign">Real-time querying.</td>
</tr>
<tr style="text-align: justify;">
<td class="text-leftalign">Runs on the top of Hadoop.</td>
<td class="text-leftalign">Runs on the top of HDFS (Hadoop distributed file system).</td>
</tr>
<tr style="text-align: justify;">
<td class="text-leftalign">Apache Hive is not a database.</td>
<td class="text-leftalign">It is a NoSQL database.</td>
</tr>
<tr style="text-align: justify;">
<td class="text-leftalign">It has schema model.</td>
<td class="text-leftalign">It is free from schema model.</td>
</tr>
<tr>
<td class="text-leftalign" style="text-align: justify;">Made for high latency operations.</td>
<td class="text-leftalign" style="text-align: justify;">Made for low-latency operations.</td>
</tr>
</tbody>
</table>
</div>
]]></content:encoded>
					
					<wfw:commentRss>https://www.wikitechy.com/interview-questions/big-data/difference-between-hive-and-hbase/feed/</wfw:commentRss>
			<slash:comments>0</slash:comments>
		
		
			</item>
		<item>
		<title>Why Hadoop used for Big Data Analytics ?</title>
		<link>https://www.wikitechy.com/interview-questions/big-data/why-hadoop-used-for-big-data-analytics/</link>
					<comments>https://www.wikitechy.com/interview-questions/big-data/why-hadoop-used-for-big-data-analytics/#respond</comments>
		
		<dc:creator><![CDATA[Editor]]></dc:creator>
		<pubDate>Mon, 12 Jul 2021 17:16:29 +0000</pubDate>
				<category><![CDATA[Big Data]]></category>
		<category><![CDATA[Accenture interview questions and answers]]></category>
		<category><![CDATA[AT&T interview questions and answers]]></category>
		<category><![CDATA[Atos interview questions and answers]]></category>
		<category><![CDATA[big data analytics]]></category>
		<category><![CDATA[big data hadoop]]></category>
		<category><![CDATA[big data hadoop certification]]></category>
		<category><![CDATA[big data hadoop tutorial]]></category>
		<category><![CDATA[big data notes]]></category>
		<category><![CDATA[big data toolshow big data and hadoop are linked]]></category>
		<category><![CDATA[big data tutorial]]></category>
		<category><![CDATA[Capgemini interview questions and answers]]></category>
		<category><![CDATA[CASTING NETWORKS INDIA PVT LIMITED interview questions and answers]]></category>
		<category><![CDATA[CGI Group Inc interview questions and answers]]></category>
		<category><![CDATA[Collabera Technologiesinterview questions and answers]]></category>
		<category><![CDATA[Dell International Services India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[difference between big data and data science]]></category>
		<category><![CDATA[difference between big data and hadoop]]></category>
		<category><![CDATA[difference between hadoop and spark]]></category>
		<category><![CDATA[Ernst & Young interview questions and answers]]></category>
		<category><![CDATA[Flipkart interview questions and answers]]></category>
		<category><![CDATA[Genpact interview questions and answers]]></category>
		<category><![CDATA[hadoop architecture]]></category>
		<category><![CDATA[hadoop as big data solution]]></category>
		<category><![CDATA[hadoop database]]></category>
		<category><![CDATA[hadoop example]]></category>
		<category><![CDATA[hadoop modules]]></category>
		<category><![CDATA[hadoop storage]]></category>
		<category><![CDATA[IBM interview questions and answers]]></category>
		<category><![CDATA[Indecomm Global Services interview questions and answers]]></category>
		<category><![CDATA[L&T Infotech interview questions and answers]]></category>
		<category><![CDATA[Mindtree interview questions and answers]]></category>
		<category><![CDATA[NetApp interview questions and answers]]></category>
		<category><![CDATA[R Systems interview questions and answers]]></category>
		<category><![CDATA[RBS India Development Centre Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[SAP Labs India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Tata Consultancy Service interview questions and answers]]></category>
		<category><![CDATA[Tech Mahindra interview questions and answers]]></category>
		<category><![CDATA[Trigent Software interview questions and answers]]></category>
		<category><![CDATA[UnitedHealth Group interview questions and answers]]></category>
		<category><![CDATA[Virtusa Consulting Services Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Wells Fargo interview questions and answers]]></category>
		<category><![CDATA[what is big data]]></category>
		<category><![CDATA[what is hadoop used for]]></category>
		<category><![CDATA[Wipro Infotech interview questions and answers]]></category>
		<category><![CDATA[Wipro interview questions and answers]]></category>
		<category><![CDATA[Xoriant Solutions Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[ZS Associates interview questions and answers]]></category>
		<guid isPermaLink="false">https://www.wikitechy.com/interview-questions/?p=269</guid>

					<description><![CDATA[Answer : Big data analytics is the process of examining large data...]]></description>
										<content:encoded><![CDATA[<div class="TextHeading">
<div class="hddn">
<h2 id="why-hadoop-used-for-big-data-analytics" class="color-pink" style="text-align: justify;">Why Hadoop used for Big Data Analytics ?</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li><a href="https://www.wikitechy.com/interview-questions/hadoop/what-is-big-data/" target="_blank" rel="noopener">Big data</a> analytics is the process of examining large data sets to uncover hidden patterns, unknown correlations, market trends, customer preferences and other useful business information.</li>
<li>Hadoop is a framework to store and process big data. Hadoop is specifically designed to provide the distributed storage and parallel data processing that big data requires.</li>
</ul>
</div>
</div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="hadoop-is-the-best-solution-for-storing-and-processing-big-data-because" class="color-blue">Hadoop is the best solution for storing and processing big data because:</h2>
</div>
</div>
<p style="text-align: justify;">Hadoop stores huge files as they are (raw) without specifying any schema.</p>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li><b>High scalability</b> &#8211; We can add any number of nodes, hence enhancing performance dramatically.</li>
<li><b>High availability</b> &#8211; In <a href="https://www.wikitechy.com/interview-questions/apache-pig/what-is-the-advantages-of-pig-in-hadoop/" target="_blank" rel="noopener">Hadoop</a>, data is highly available despite hardware failure. If a machine or a few hardware components crash, we can still access the data from another path.</li>
<li><b>Reliable</b> &#8211; Data is reliably stored on the cluster despite machine failure.</li>
<li><b>Economic</b> &#8211; Hadoop runs on a cluster of commodity hardware which is not very expensive.</li>
</ul>
</div>
</div>
<div class="text-center row" style="text-align: justify;"></div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="what-is-hadoop" class="color-purple">What is Hadoop ?</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li><a href="https://www.wikitechy.com/interview-questions/apache-pig/what-is-the-difference-between-pig-hive-and-mapreduce" target="_blank" rel="noopener">Hadoop</a> is an open source project from Apache Software Foundation.</li>
<li>It provides a software framework for distributing and running applications on clusters of servers that is inspired by Google’s Map-Reduce programming model as well as its file system(GFS).</li>
<li>Hadoop was originally written for the nutch search engine project.</li>
<li>Hadoop is an open-source framework written in Java. It efficiently processes large volumes of data on a cluster of commodity hardware.</li>
<li>Hadoop can be set up on a single machine, but the real power of Hadoop comes with a cluster of machines; it can be scaled from a single machine to thousands of nodes. Hadoop consists of two key parts:
<ul>
<li>Hadoop Distributed File System (HDFS)</li>
<li>Map-Reduce.</li>
</ul>
</li>
</ul>
</div>
</div>
<div class="ImageContent" style="text-align: justify;">
<div class="hddn"><img decoding="async" class="img-responsive center-block aligncenter" src="https://cdn.wikitechy.com/interview-questions/hadoop/hadoop-overview.png" alt="Hadoop Overview" /></div>
</div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="hadoop-distributed-file-systemhdfs" class="color-blue">Hadoop Distributed File System(HDFS)</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li>HDFS is a highly fault tolerant, distributed, reliable, scalable file system for data storage.</li>
<li>HDFS stores multiple copies of data on different nodes; a file is split up into blocks (Default 64 MB) and stored across multiple machines.</li>
<li>A Hadoop cluster typically has a single namenode and a number of datanodes to form the HDFS cluster.</li>
</ul>
</div>
</div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="map-reduce" class="color-blue">Map-Reduce</h2>
</div>
</div>
<div class="Content">
<div class="hddn">
<ul>
<li style="text-align: justify;">Map-Reduce is a programming model designed for processing large volumes of data in parallel by dividing the work into a set of independent tasks.</li>
<li style="text-align: justify;">It is also a paradigm for distributed processing of large data set over a cluster of nodes.</li>
</ul>
</div>
</div>
]]></content:encoded>
					
					<wfw:commentRss>https://www.wikitechy.com/interview-questions/big-data/why-hadoop-used-for-big-data-analytics/feed/</wfw:commentRss>
			<slash:comments>0</slash:comments>
		
		
			</item>
		<item>
		<title>What is the difference between Spark and Hadoop MapReduce ?</title>
		<link>https://www.wikitechy.com/interview-questions/apache-spark/what-is-the-difference-between-spark-and-hadoop-mapreduce/</link>
					<comments>https://www.wikitechy.com/interview-questions/apache-spark/what-is-the-difference-between-spark-and-hadoop-mapreduce/#respond</comments>
		
		<dc:creator><![CDATA[Editor]]></dc:creator>
		<pubDate>Mon, 12 Jul 2021 16:09:43 +0000</pubDate>
				<category><![CDATA[Apache Spark]]></category>
		<category><![CDATA[Accenture interview questions and answers]]></category>
		<category><![CDATA[Altimetrik India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[big data vs hadoop difference]]></category>
		<category><![CDATA[can you explain the difference between hadoop and spark]]></category>
		<category><![CDATA[Capgemini interview questions and answers]]></category>
		<category><![CDATA[cassandra hadoop difference]]></category>
		<category><![CDATA[CASTING NETWORKS INDIA PVT LIMITED interview questions and answers]]></category>
		<category><![CDATA[CGI Group Inc interview questions and answers]]></category>
		<category><![CDATA[Collabera Technologies interview questions and answers]]></category>
		<category><![CDATA[Dell International Services India Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[difference between apache spark and hadoop]]></category>
		<category><![CDATA[difference between apache spark and storm]]></category>
		<category><![CDATA[difference between apache storm and spark]]></category>
		<category><![CDATA[difference between big data and hadoop]]></category>
		<category><![CDATA[difference between cloudera and hadoop]]></category>
		<category><![CDATA[difference between hadoop and cassandra]]></category>
		<category><![CDATA[difference between hadoop and cloud computing]]></category>
		<category><![CDATA[difference between hadoop and cloudera]]></category>
		<category><![CDATA[difference between hadoop and data warehouse]]></category>
		<category><![CDATA[difference between hadoop and hbase]]></category>
		<category><![CDATA[difference between hadoop and hdfs]]></category>
		<category><![CDATA[difference between hadoop and hdfs commands]]></category>
		<category><![CDATA[difference between hadoop and hive]]></category>
		<category><![CDATA[difference between hadoop and mapreduce]]></category>
		<category><![CDATA[difference between hadoop and spark]]></category>
		<category><![CDATA[difference between hadoop and sql]]></category>
		<category><![CDATA[difference between hdfs and mapreduce]]></category>
		<category><![CDATA[difference between hive and hadoop]]></category>
		<category><![CDATA[difference between hive and hbase]]></category>
		<category><![CDATA[difference between hive and spark]]></category>
		<category><![CDATA[difference between mapreduce and spark]]></category>
		<category><![CDATA[difference between mapreduce and yarn]]></category>
		<category><![CDATA[difference between node and cluster in hadoop]]></category>
		<category><![CDATA[difference between spark and mapreduce]]></category>
		<category><![CDATA[difference between spark and scala]]></category>
		<category><![CDATA[difference between sql and hadoop]]></category>
		<category><![CDATA[Flipkart interview questions and answers]]></category>
		<category><![CDATA[Genpact interview questions and answers]]></category>
		<category><![CDATA[hadoop and spark difference]]></category>
		<category><![CDATA[hadoop spark difference]]></category>
		<category><![CDATA[IBM interview questions and answers]]></category>
		<category><![CDATA[JPMorgan Chase & Co interview questions and answers]]></category>
		<category><![CDATA[L&T Infotech interview questions and answers]]></category>
		<category><![CDATA[mapreduce vs spark differences]]></category>
		<category><![CDATA[Mindtree interview questions and answers]]></category>
		<category><![CDATA[Oracle Corporation interview questions and answers]]></category>
		<category><![CDATA[Prokarma Softech Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[R Systems interview questions and answers]]></category>
		<category><![CDATA[RBS India Development Centre Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Reliance Industries Ltd interview questions and answers]]></category>
		<category><![CDATA[Sapient Consulting Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Synechron Te interview questions and answers]]></category>
		<category><![CDATA[Tata Consultancy Service interview questions and answers]]></category>
		<category><![CDATA[Tech Mahindra interview questions and answers]]></category>
		<category><![CDATA[Trigent Software interview questions and answers]]></category>
		<category><![CDATA[UnitedHealth Group interview questions and answers]]></category>
		<category><![CDATA[Virtusa Consulting Services Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Wells Fargo interview questions and answers]]></category>
		<category><![CDATA[what is difference between hadoop and bigdata]]></category>
		<category><![CDATA[what is the difference between big data and hadoop]]></category>
		<category><![CDATA[what is the difference between hadoop and mapreduce]]></category>
		<category><![CDATA[what is the difference between hadoop and spark]]></category>
		<category><![CDATA[what is the difference between spark and hadoop]]></category>
		<category><![CDATA[What is the difference between Spark and Hadoop MapReduce]]></category>
		<category><![CDATA[what is the relationship between hadoop and spark]]></category>
		<category><![CDATA[Wipro Infotech interview questions and answers]]></category>
		<category><![CDATA[Xoriant Solutions Pvt Ltd interview questions and answers]]></category>
		<category><![CDATA[Yodlee Infotech Pvt Ltd interview questions and answers]]></category>
		<guid isPermaLink="false">https://www.wikitechy.com/interview-questions/?p=252</guid>

					<description><![CDATA[Answer : Apache Spark is an open-source distributed cluster-computing...]]></description>
										<content:encoded><![CDATA[<div class="TextHeading">
<div class="hddn">
<h2 id="what-is-apache-spark" class="color-pink" style="text-align: justify;"><span style="font-family: inherit; font-size: 2rem;">What is Apache Spark</span></h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li>Apache Spark is an open-source distributed cluster-computing framework.</li>
<li>Spark is a data processing engine developed to provide faster and easier-to-use analytics than Hadoop MapReduce.</li>
<li>Before Apache Software Foundation took possession of Spark, it was under the control of University of California, Berkeley’s AMP Lab.</li>
</ul>
</div>
</div>
<div class="TextHeading" style="text-align: justify;">
<div class="hddn">
<h2 id="what-is-apache-hadoop" class="color-purple">What is Apache Hadoop</h2>
</div>
</div>
<div class="Content" style="text-align: justify;">
<div class="hddn">
<ul>
<li>Apache Hadoop is an open-source framework written in Java that allows us to store and process Big Data in a distributed environment, across various clusters of computers using simple programming constructs.</li>
<li>To do this, Hadoop uses an algorithm called MapReduce, which divides the task into small parts and assigns them to a set of computers.</li>
<li>Hadoop also has its own file system, Hadoop Distributed File System (HDFS), which is based on the Google File System (GFS).</li>
<li>HDFS is designed to run on low-cost hardware.</li>
</ul>
</div>
</div>
<div class="ImageContent">
<div class="hddn"><img decoding="async" class="img-responsive center-block aligncenter" src="https://cdn.wikitechy.com/interview-questions/apache-spark/apache-hadoop-vs-apache-spark.png" alt=" " /></div>
<div>
<div class="hddn" style="text-align: justify;">
<table class="table-bordered table-striped table table-responsive">
<tbody>
<tr>
<th>CRITERIA</th>
<th>SPARK</th>
<th>HADOOP MAPREDUCE</th>
</tr>
<tr>
<td class="text-leftalign">Memory</td>
<td class="text-leftalign">Lets you save data in memory with<br />
the use of RDDs.</td>
<td class="text-leftalign">Does not leverage the memory of the hadoop cluster to maximum.</td>
</tr>
<tr>
<td class="text-leftalign">Disk usage</td>
<td class="text-leftalign"><a href="https://forums.wikitechy.com/question-category/apache-spark/" target="_blank" rel="noopener">Spark</a> caches data in-memory<br />
and ensures low latency.</td>
<td class="text-leftalign">MapReduce is disk oriented.</td>
</tr>
<tr>
<td class="text-leftalign">Processing</td>
<td class="text-leftalign">Supports real-time processing through<br />
spark streaming.</td>
<td class="text-leftalign">Only batch processing is supported</td>
</tr>
<tr>
<td class="text-leftalign">Installation</td>
<td class="text-leftalign">Is not bound to Hadoop.</td>
<td class="text-leftalign">Is bound to <a href="https://forums.wikitechy.com/question-category/hadoop/" target="_blank" rel="noopener">hadoop</a>.</td>
</tr>
<tr>
<td class="text-leftalign">Storage</td>
<td class="text-leftalign">Leverages existing storage systems.</td>
<td class="text-leftalign">HDFS</td>
</tr>
<tr>
<td class="text-leftalign">Speed</td>
<td class="text-leftalign">10 &#8211; 100X faster.</td>
<td class="text-leftalign">Fast.</td>
</tr>
<tr>
<td class="text-leftalign">Resource management</td>
<td class="text-leftalign">standalone</td>
<td class="text-leftalign">YARN</td>
</tr>
</tbody>
</table>
</div>
<div class="ImageContent">
<div class="hddn"><img decoding="async" class="img-responsive center-block aligncenter" src="https://cdn.wikitechy.com/interview-questions/apache-spark/hadoop-vs-spark.png" alt="Hadoop Vs Spark" /></div>
</div>
</div>
</div>
]]></content:encoded>
					
					<wfw:commentRss>https://www.wikitechy.com/interview-questions/apache-spark/what-is-the-difference-between-spark-and-hadoop-mapreduce/feed/</wfw:commentRss>
			<slash:comments>0</slash:comments>
		
		
			</item>
	</channel>
</rss>
