<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Hive Functions slow too much my query in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334310#M231710</link>
    <description>&lt;P&gt;Hello,&amp;nbsp; I'm new to the community and to Cloudera/big data in general.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am having issues with Hive performance. For example, I have a table of 600 records: when I use a select * it runs in 0.05 seconds, but if I use, for example, a count(*) or any function, it runs in about 17 seconds. Does anyone have any tips or tricks to check performance, or know which parameters to check/modify in order to improve this execution time?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;My environment is CDH 6.1.0 with Hive 2.1.1-cdh6.1.0&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you in advance&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Ulises Rangel&lt;/P&gt;</description>
    <pubDate>Thu, 20 Jan 2022 18:03:06 GMT</pubDate>
    <dc:creator>uliran</dc:creator>
    <dc:date>2022-01-20T18:03:06Z</dc:date>
    <item>
      <title>Hive Functions slow too much my query</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334310#M231710</link>
      <description>&lt;P&gt;Hello,&amp;nbsp; I'm new to the community and to Cloudera/big data in general.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I am having issues with Hive performance. For example, I have a table of 600 records: when I use a select * it runs in 0.05 seconds, but if I use, for example, a count(*) or any function, it runs in about 17 seconds. Does anyone have any tips or tricks to check performance, or know which parameters to check/modify in order to improve this execution time?&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;My environment is CDH 6.1.0 with Hive 2.1.1-cdh6.1.0&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thank you in advance&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Ulises Rangel&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 18:03:06 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334310#M231710</guid>
      <dc:creator>uliran</dc:creator>
      <dc:date>2022-01-20T18:03:06Z</dc:date>
    </item>
    <item>
      <title>Re: Hive Functions slow too much my query</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334314#M231711</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;SPAN&gt;Ulises,&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;This is expected.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;When you do&amp;nbsp;&lt;SPAN&gt;select *&amp;nbsp; without any complex aggregation / function, Hive can directly read the data from HDFS / files.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;But in the case of count, it needs to do computation, which involves creating a job and doing the required aggregation, which will take time.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 18:38:29 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334314#M231711</guid>
      <dc:creator>rpathak</dc:creator>
      <dc:date>2022-01-20T18:38:29Z</dc:date>
    </item>
    <item>
      <title>Re: Hive Functions slow too much my query</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334316#M231713</link>
      <description>&lt;P&gt;Thanks for the reply&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I know it is a normal thing to happen, but is there anything I could check in order to know if there is something wrong with my configuration?&amp;nbsp; Or maybe a job trace? I am a newbie in these topics.&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 18:55:43 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334316#M231713</guid>
      <dc:creator>uliran</dc:creator>
      <dc:date>2022-01-20T18:55:43Z</dc:date>
    </item>
    <item>
      <title>Re: Hive Functions slow too much my query</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334318#M231715</link>
      <description>&lt;P&gt;Yes, there are a lot of places to check, but without knowing what you are looking for you will be lost.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;You can start with what you see on screen / console where you run the query.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;In Beeline you see the Tez job summary, which has a lot of details to look at.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;An example of one of the tuning guides is below:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/t5/Community-Articles/Demystify-Apache-Tez-Memory-Tuning-Step-by-Step/ta-p/245279" target="_blank" rel="noopener"&gt;https://community.cloudera.com/t5/Community-Articles/Demystify-Apache-Tez-Memory-Tuning-Step-by-Step/ta-p/245279&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Update: I see you are using CDH 6, which does not have Tez.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;You can refer to the link below for CDH:&lt;BR /&gt;&lt;A href="https://docs.cloudera.com/documentation/enterprise/6/6.1/topics/admin_hive_tuning.html#concept_u51_lkv_cv" target="_blank"&gt;https://docs.cloudera.com/documentation/enterprise/6/6.1/topics/admin_hive_tuning.html#concept_u51_lkv_cv&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 19:27:29 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334318#M231715</guid>
      <dc:creator>rpathak</dc:creator>
      <dc:date>2022-01-20T19:27:29Z</dc:date>
    </item>
    <item>
      <title>Re: Hive Functions slow too much my query</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334319#M231716</link>
      <description>&lt;P&gt;Thanks&amp;nbsp; I will start from there&lt;/P&gt;</description>
      <pubDate>Thu, 20 Jan 2022 19:28:17 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Hive-Functions-slow-too-much-my-query/m-p/334319#M231716</guid>
      <dc:creator>uliran</dc:creator>
      <dc:date>2022-01-20T19:28:17Z</dc:date>
    </item>
  </channel>
</rss>

