<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Unexpected Spill to Disk Activity in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Unexpected-Spill-to-Disk-Activity/m-p/36703#M16434</link>
    <description>&lt;P&gt;You are most likely running into this bug with the aggregation: &lt;A href="https://issues.cloudera.org/browse/IMPALA-2352" target="_blank"&gt;https://issues.cloudera.org/browse/IMPALA-2352&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;We fixed it in CDH5.5/Impala 2.3 but the change wasn't backported because it was deemed too risky for a maintenance release.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Thu, 28 Jan 2016 00:09:05 GMT</pubDate>
    <dc:creator>Tim Armstrong</dc:creator>
    <dc:date>2016-01-28T00:09:05Z</dc:date>
    <item>
      <title>Unexpected Spill to Disk Activity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Unexpected-Spill-to-Disk-Activity/m-p/36661#M16433</link>
      <description>&lt;P&gt;&lt;SPAN&gt;Hi&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;DIV&gt;&lt;DIV&gt;&lt;DIV&gt;We are using CDH4.5.8 Impala 2.2. We are confused by some spill-to-disk activity and would like to understand why this is happening.&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;Here's a snippet of the profile. We had 128 GB of memory available for Impala (YARN and Admission Controller are disabled) and stats are available for all tables.&lt;/DIV&gt;&lt;DIV&gt;Scratch directories are set to one per disk (23 HDD in total). No mem_limit is set via query options either.&lt;/DIV&gt;&lt;DIV&gt;The 4-node cluster has 3 impalad instances running on 3 of the nodes, and the data nodes are co-located with the impalad instances.&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;&lt;DIV&gt;BlockMgr:&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- BlockWritesOutstanding: 0 (0)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- BlocksCreated: 279 (279)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- BlocksRecycled: 113 (113)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- BufferedPins: 2 (2)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- BytesWritten: 140.00 MB (146798191)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- MaxBlockSize: 8.00 MB (8388608)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- MemoryLimit: 128.93 GB (138436362240)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- PeakMemoryUsage: 654.59 MB (686391904)&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- TotalBufferWaitTime: 0ns&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- TotalEncryptionTime: 0ns&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- TotalIntegrityCheckTime: 
0ns&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;- TotalReadBlockTime: 122.868ms&lt;/DIV&gt;&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;We are just wondering why Impala spills data to disk when PeakMemoryUsage is only 654.59 MB?&lt;/DIV&gt;&lt;DIV&gt;We are looking for any potential explanations for this scenario.&lt;/DIV&gt;&lt;DIV&gt;Thanks&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;DIV&gt;Link to profile:&lt;/DIV&gt;&lt;DIV&gt;&lt;A href="https://my.syncplicity.com/share/bbkeaucyp3dnpsq/C2300_M1600_TPCDS_WFI_q98" target="_blank"&gt;https://my.syncplicity.com/share/bbkeaucyp3dnpsq/C2300_M1600_TPCDS_WFI_q98&lt;/A&gt;&lt;/DIV&gt;&lt;DIV&gt;password: 123456&lt;/DIV&gt;&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;&lt;/DIV&gt;&lt;/DIV&gt;</description>
      <pubDate>Fri, 16 Sep 2022 10:00:17 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Unexpected-Spill-to-Disk-Activity/m-p/36661#M16433</guid>
      <dc:creator>epstvxj</dc:creator>
      <dc:date>2022-09-16T10:00:17Z</dc:date>
    </item>
    <item>
      <title>Re: Unexpected Spill to Disk Activity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Unexpected-Spill-to-Disk-Activity/m-p/36703#M16434</link>
      <description>&lt;P&gt;You are most likely running into this bug with the aggregation: &lt;A href="https://issues.cloudera.org/browse/IMPALA-2352" target="_blank"&gt;https://issues.cloudera.org/browse/IMPALA-2352&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;We fixed it in CDH5.5/Impala 2.3 but the change wasn't backported because it was deemed too risky for a maintenance release.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 28 Jan 2016 00:09:05 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Unexpected-Spill-to-Disk-Activity/m-p/36703#M16434</guid>
      <dc:creator>Tim Armstrong</dc:creator>
      <dc:date>2016-01-28T00:09:05Z</dc:date>
    </item>
  </channel>
</rss>

