<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Hive on Spark vs Impala in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/40857#M22068</link>
    <description>Can you please help me in this?&lt;BR /&gt;&lt;BR /&gt;&lt;A href="http://community.cloudera.com/t5/Advanced-Analytics-Apache-Spark/Pros-and-Cons-of-fetching-data-using-SparkSQL-vs-Hive-in-Spark/m-p/40855#U40855" target="_blank"&gt;http://community.cloudera.com/t5/Advanced-Analytics-Apache-Spark/Pros-and-Cons-of-fetching-data-using-SparkSQL-vs-Hive-in-Spark/m-p/40855#U40855&lt;/A&gt;</description>
    <pubDate>Mon, 16 May 2016 07:09:35 GMT</pubDate>
    <dc:creator>Raj2cool16</dc:creator>
    <dc:date>2016-05-16T07:09:35Z</dc:date>
    <item>
      <title>Hive on Spark vs Impala</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/38402#M22064</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;In CDH 5.6 there is Hive on Spark and Impala.&lt;/P&gt;&lt;P&gt;How should we choose between these 2 services? Are there any benchmarks that compare these 2 services?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you! &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 16 Sep 2022 10:07:33 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/38402#M22064</guid>
      <dc:creator>AlinaGHERMAN</dc:creator>
      <dc:date>2022-09-16T10:07:33Z</dc:date>
    </item>
    <item>
      <title>Re: Hive on Spark vs Impala</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/38427#M22065</link>
      <description>&lt;P&gt;Hi Alina,&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Although Hive-on-Spark will definitely provide improved performance over MR for batch processing applications (e.g., ETL), that performance is not going to approach the interactive "BI" experience provided by Impala.&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Here's some recent Impala performance testing results:&lt;BR /&gt;&lt;BR /&gt;&lt;A href="http://blog.cloudera.com/blog/2016/02/new-sql-benchmarks-apache-impala-incubating-2-3-uniquely-delivers-analytic-database-performance/" target="_blank"&gt;http://blog.cloudera.com/blog/2016/02/new-sql-benchmarks-apache-impala-incubating-2-3-uniquely-delivers-analytic-database-performance/&lt;/A&gt;&lt;/P&gt;
&lt;P&gt;&amp;nbsp;&lt;/P&gt;
&lt;P&gt;Although Hive-on-Spark is not included, one would expect it to perform at levels similar to that of Hive-on-Tez (although having the added advantage of supporting consolidation onto the Spark API).&lt;/P&gt;</description>
      <pubDate>Mon, 07 Mar 2016 22:04:39 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/38427#M22065</guid>
      <dc:creator>jkestelyn</dc:creator>
      <dc:date>2016-03-07T22:04:39Z</dc:date>
    </item>
    <item>
      <title>Re: Hive on Spark vs Impala</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/39852#M22066</link>
      <description>&lt;P&gt;What is Cloudera's take on usage for Impala vs Hive-on-Spark?&lt;/P&gt;&lt;P&gt;We would also like to know what the long-term implications of introducing Hive-on-Spark vs Impala are.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;It would definitely be very interesting to have a head-to-head comparison between Impala, Hive on Spark and Stinger for example. I wouldn't include sparkSQL in here because in my opinion sparkSQL serves a totally different purpose.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;/Izhar&lt;/P&gt;</description>
      <pubDate>Mon, 18 Apr 2016 08:38:58 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/39852#M22066</guid>
      <dc:creator>izhar</dc:creator>
      <dc:date>2016-04-18T08:38:58Z</dc:date>
    </item>
    <item>
      <title>Re: Hive on Spark vs Impala</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/39871#M22067</link>
      <description>&lt;P&gt;Was there anything in my answers to these questions higher in the thread unclear?&lt;/P&gt;</description>
      <pubDate>Mon, 18 Apr 2016 18:17:38 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/39871#M22067</guid>
      <dc:creator>jkestelyn</dc:creator>
      <dc:date>2016-04-18T18:17:38Z</dc:date>
    </item>
    <item>
      <title>Re: Hive on Spark vs Impala</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/40857#M22068</link>
      <description>Can you please help me in this?&lt;BR /&gt;&lt;BR /&gt;&lt;A href="http://community.cloudera.com/t5/Advanced-Analytics-Apache-Spark/Pros-and-Cons-of-fetching-data-using-SparkSQL-vs-Hive-in-Spark/m-p/40855#U40855" target="_blank"&gt;http://community.cloudera.com/t5/Advanced-Analytics-Apache-Spark/Pros-and-Cons-of-fetching-data-using-SparkSQL-vs-Hive-in-Spark/m-p/40855#U40855&lt;/A&gt;</description>
      <pubDate>Mon, 16 May 2016 07:09:35 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Hive-on-Spark-vs-Impala/m-p/40857#M22068</guid>
      <dc:creator>Raj2cool16</dc:creator>
      <dc:date>2016-05-16T07:09:35Z</dc:date>
    </item>
  </channel>
</rss>

