<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: HDFS caching to hive performance in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150522#M113024</link>
    <description>&lt;P&gt;HDFS caching helps, but only a bit: you save only the cost of moving bytes off disk, while you still pay the cost of de-serialization and don't get the benefits of JVM JIT, etc. So, with technologies like Hive LLAP (coming in hive-2) you will get significantly better performance because LLAP caches de-serialized vectors in memory-efficient formats (2 bits for certain integer ranges rather than 4 bytes), uses CPU-efficient filters (vectorized query processing via filters etc.), removes JVM startup cost for tasks (100s of ms), provides JIT-enhanced CPU performance, etc. Rather excited about it!&lt;/P&gt;</description>
    <pubDate>Sat, 02 Apr 2016 05:27:36 GMT</pubDate>
    <dc:creator>acm</dc:creator>
    <dc:date>2016-04-02T05:27:36Z</dc:date>
    <item>
      <title>HDFS caching to hive performance</title>
      <link>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150519#M113021</link>
      <description>&lt;P&gt;One of the customers is exploring ways to improve their Hive query performance, and they are wondering about HDFS caching. They wanted to check whether this is something we recommend.&lt;/P&gt;</description>
      <pubDate>Thu, 31 Mar 2016 08:45:55 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150519#M113021</guid>
      <dc:creator>hduraiswamy</dc:creator>
      <dc:date>2016-03-31T08:45:55Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS caching to hive performance</title>
      <link>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150520#M113022</link>
      <description>&lt;P&gt;HDFS memory as storage is in technical preview (link &lt;A href="https://docs.hortonworks.com/HDPDocuments/HDP2/HDP-2.3.0/bk_hdfs_admin_tools/content/ch08.html"&gt;here&lt;/A&gt;). I recommend reviewing the Hive performance tuning guide &lt;A href="http://docs.hortonworks.com/HDPDocuments/HDP2/HDP-2.4.0/bk_performance_tuning/content/ch_hive_hi_perf_best_practices.html"&gt;here&lt;/A&gt;.&lt;/P&gt;</description>
      <pubDate>Thu, 31 Mar 2016 08:50:32 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150520#M113022</guid>
      <dc:creator>sunile_manjee</dc:creator>
      <dc:date>2016-03-31T08:50:32Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS caching to hive performance</title>
      <link>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150521#M113023</link>
      <description>&lt;P&gt;Thanks.. exactly what I was looking for.&lt;/P&gt;</description>
      <pubDate>Thu, 31 Mar 2016 09:15:36 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150521#M113023</guid>
      <dc:creator>hduraiswamy</dc:creator>
      <dc:date>2016-03-31T09:15:36Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS caching to hive performance</title>
      <link>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150522#M113024</link>
      <description>&lt;P&gt;HDFS caching helps, but only a bit: you save only the cost of moving bytes off disk, while you still pay the cost of de-serialization and don't get the benefits of JVM JIT, etc. So, with technologies like Hive LLAP (coming in hive-2) you will get significantly better performance because LLAP caches de-serialized vectors in memory-efficient formats (2 bits for certain integer ranges rather than 4 bytes), uses CPU-efficient filters (vectorized query processing via filters etc.), removes JVM startup cost for tasks (100s of ms), provides JIT-enhanced CPU performance, etc. Rather excited about it!&lt;/P&gt;</description>
      <pubDate>Sat, 02 Apr 2016 05:27:36 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150522#M113024</guid>
      <dc:creator>acm</dc:creator>
      <dc:date>2016-04-02T05:27:36Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS caching to hive performance</title>
      <link>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150523#M113025</link>
      <description>&lt;P&gt;Thank you! I am excited about LLAP too. Do we yet have a timeline on which HDP release the new hive-2 will be packaged in?&lt;/P&gt;</description>
      <pubDate>Sun, 03 Apr 2016 06:52:03 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150523#M113025</guid>
      <dc:creator>hduraiswamy</dc:creator>
      <dc:date>2016-04-03T06:52:03Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS caching to hive performance</title>
      <link>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150524#M113026</link>
      <description>&lt;P&gt;Watch the Tim Hall townhall from this Friday.&lt;/P&gt;</description>
      <pubDate>Sun, 03 Apr 2016 06:57:36 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/HDFS-caching-to-hive-performance/m-p/150524#M113026</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2016-04-03T06:57:36Z</dc:date>
    </item>
  </channel>
</rss>

