<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question CBO for Hive over hbase in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149382#M32525</link>
    <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I have Hive running over an HBase table. Is it interesting in this case to analyze the table for the CBO? Or is it only interesting when you have Hive with ORC files?&lt;/P&gt;&lt;P&gt;Thanks in advance,&lt;/P&gt;&lt;P&gt;Michel&lt;/P&gt;</description>
    <pubDate>Tue, 21 Jun 2016 16:59:04 GMT</pubDate>
    <dc:creator>michelsumbul</dc:creator>
    <dc:date>2016-06-21T16:59:04Z</dc:date>
    <item>
      <title>CBO for Hive over hbase</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149382#M32525</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I have Hive running over an HBase table. Is it interesting in this case to analyze the table for the CBO? Or is it only interesting when you have Hive with ORC files?&lt;/P&gt;&lt;P&gt;Thanks in advance,&lt;/P&gt;&lt;P&gt;Michel&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2016 16:59:04 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149382#M32525</guid>
      <dc:creator>michelsumbul</dc:creator>
      <dc:date>2016-06-21T16:59:04Z</dc:date>
    </item>
    <item>
      <title>Re: CBO for Hive over hbase</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149383#M32526</link>
      <description>&lt;P&gt;Hello Michel&lt;/P&gt;&lt;P&gt;Right now the Hive plan calculation does not reach out to get HBase stats, so currently there is no added benefit from the HBase stats. That being said, these are questions that are being worked on in different initiatives, so this will likely change in the future.&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2016 17:03:03 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149383#M32526</guid>
      <dc:creator>nmaillard1</dc:creator>
      <dc:date>2016-06-21T17:03:03Z</dc:date>
    </item>
    <item>
      <title>Re: CBO for Hive over hbase</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149384#M32527</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/1390/michelsumbul.html" nodeid="1390"&gt;@Michel Sumbul&lt;/A&gt;&lt;/P&gt;&lt;P&gt;CBO is mainly for optimization decisions which reduce the cost of query execution and is independent of storage formats like ORC. Below are some of the decisions based on CBO:&lt;/P&gt;&lt;UL&gt;
&lt;LI&gt;How to order Join&lt;/LI&gt;&lt;LI&gt;What algorithm to use for a given Join&lt;/LI&gt;&lt;LI&gt;Should the intermediate result be persisted or should it be recomputed on operator failure.&lt;/LI&gt;&lt;LI&gt;The degree of parallelism at any operator (specifically number of reducers to use).&lt;/LI&gt;&lt;LI&gt;Semi Join selection&lt;/LI&gt;&lt;/UL&gt;&lt;P&gt;For details, please refer to the link below:&lt;/P&gt;&lt;P&gt;&lt;A href="https://cwiki.apache.org/confluence/display/Hive/Cost-based+optimization+in+Hive" target="_blank"&gt;https://cwiki.apache.org/confluence/display/Hive/Cost-based+optimization+in+Hive&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Thanks and Regards,&lt;/P&gt;&lt;P&gt;Sindhu&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2016 17:05:06 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149384#M32527</guid>
      <dc:creator>ssubhas</dc:creator>
      <dc:date>2016-06-21T17:05:06Z</dc:date>
    </item>
    <item>
      <title>Re: CBO for Hive over hbase</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149385#M32528</link>
      <description>&lt;P&gt;Thanks for the info.
Then what would be your best advice to improve the performance of Hive over HBase?&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2016 17:05:16 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149385#M32528</guid>
      <dc:creator>michelsumbul</dc:creator>
      <dc:date>2016-06-21T17:05:16Z</dc:date>
    </item>
    <item>
      <title>Re: CBO for Hive over hbase</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149386#M32529</link>
      <description>&lt;P&gt;Hive using MR-over-hbase-snapshots would be a viable solution.&lt;/P&gt;&lt;P&gt;Perform a snapshot in hbase, then use hive to directly read from the underlying HFiles.&lt;/P&gt;</description>
      <pubDate>Tue, 21 Jun 2016 20:25:24 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/CBO-for-Hive-over-hbase/m-p/149386#M32529</guid>
      <dc:creator>tyu</dc:creator>
      <dc:date>2016-06-21T20:25:24Z</dc:date>
    </item>
  </channel>
</rss>

