<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question HDFS- Non DFS space allocation/capacity in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169676#M25234</link>
    <description>&lt;P&gt;Hi all,&lt;/P&gt;&lt;P&gt;I have a query in relation to Space Allocation within HDFS. I am currently trying to run a large query in Hive (a wordsplit on a large file). However, I am unable to complete this due to running out of disk space.&lt;/P&gt;&lt;P&gt;I have deleted any unnecessary files from HDFS and have reduced my starting Disk Usage to 38%. &lt;/P&gt;&lt;P&gt;However, I am wondering what non DFS is as this appears to be taking up the majority of my disk space. &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="3447-yozy6.png" style="width: 476px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/20143iFCD4BBC85F689781/image-size/medium?v=v2&amp;amp;px=400" role="button" title="3447-yozy6.png" alt="3447-yozy6.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;How can I go about reducing the disk space that Non DFS takes up?&lt;/P&gt;&lt;P&gt;Any help is greatly appreciated.&lt;/P&gt;&lt;P&gt;Thanks in advance.&lt;/P&gt;</description>
    <pubDate>Sun, 18 Aug 2019 10:50:14 GMT</pubDate>
    <dc:creator>maeve_ryan226</dc:creator>
    <dc:date>2019-08-18T10:50:14Z</dc:date>
    <item>
      <title>HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169676#M25234</link>
      <description>&lt;P&gt;Hi all,&lt;/P&gt;&lt;P&gt;I have a query in relation to Space Allocation within HDFS. I am currently trying to run a large query in Hive (a wordsplit on a large file). However, I am unable to complete this due to running out of disk space.&lt;/P&gt;&lt;P&gt;I have deleted any unnecessary files from HDFS and have reduced my starting Disk Usage to 38%. &lt;/P&gt;&lt;P&gt;However, I am wondering what non DFS is as this appears to be taking up the majority of my disk space. &lt;/P&gt;&lt;P&gt;&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="3447-yozy6.png" style="width: 476px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/20143iFCD4BBC85F689781/image-size/medium?v=v2&amp;amp;px=400" role="button" title="3447-yozy6.png" alt="3447-yozy6.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;How can I go about reducing the disk space that Non DFS takes up?&lt;/P&gt;&lt;P&gt;Any help is greatly appreciated.&lt;/P&gt;&lt;P&gt;Thanks in advance.&lt;/P&gt;</description>
      <pubDate>Sun, 18 Aug 2019 10:50:14 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169676#M25234</guid>
      <dc:creator>maeve_ryan226</dc:creator>
      <dc:date>2019-08-18T10:50:14Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169677#M25235</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/3567/maeveryan226.html" nodeid="3567"&gt;@Maeve Ryan&lt;/A&gt; &lt;/P&gt;&lt;P&gt;You can decrease space for non-HDFS use by setting dfs.datanode.du.reserved to a low value. It's set per disk volume. You can also free it up by deleting any unwanted files from the datanode machine such as hadoop logs, any non hadoop related files (other information on the disk), etc. It cannot be done by using any hadoop commands.&lt;/P&gt;</description>
      <pubDate>Thu, 14 Apr 2016 22:41:50 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169677#M25235</guid>
      <dc:creator>jyadav</dc:creator>
      <dc:date>2016-04-14T22:41:50Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169678#M25236</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2528/jyadav.html" nodeid="2528"&gt;@Jitendra Yadav&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Thanks for the quick response! Are these things I can do on the Hortonworks console or do I need to ssh into the instance?&lt;/P&gt;&lt;P&gt;I am new to Hadoop so apologies if the above question seems elementary!&lt;/P&gt;</description>
      <pubDate>Thu, 14 Apr 2016 22:54:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169678#M25236</guid>
      <dc:creator>maeve_ryan226</dc:creator>
      <dc:date>2016-04-14T22:54:09Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169679#M25237</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/3567/maeveryan226.html" nodeid="3567"&gt;&lt;/A&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/3449-screen-shot-2016-04-14-at-50748-pm.png"&gt;&lt;/A&gt;@Maeve Ryan &lt;/P&gt;&lt;P&gt;I believe to delete the logs and other non hdfs data you need to log in to the machine and execute the rm command, but for setting up dfs.datanode.du.reserved property you can login to ambari and search for this property in HDFS &amp;gt; config section (please see attached screenshot). However I think the default value of dfs.datanode.du.reserved is sufficient in most cases. Regarding your job, what's the data size you are trying to process?&lt;/P&gt;</description>
      <pubDate>Thu, 14 Apr 2016 23:12:21 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169679#M25237</guid>
      <dc:creator>jyadav</dc:creator>
      <dc:date>2016-04-14T23:12:21Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169680#M25238</link>
      <description>&lt;P&gt;One thing to keep in mind is that your queries will fail if too many tasks fail. This can happen if one or some of your local dirs is on a small partition as well. Not sure about your cluster setup but sometimes ambari configures the local dirs simply by taking all available non root partitions and this can lead to these problems. I think it's hard to believe that your query fails because yarn runs out of disk space given the small amount of data you have in the system. I think it is likelier that one of the local dirs has been set in a small partition.&lt;/P&gt;&lt;P&gt;Check: yarn.nodemanager.local-dirs and see if one of the folders in there is in a small partition. You can simply change that and re-run your jobs.&lt;/P&gt;</description>
      <pubDate>Fri, 15 Apr 2016 01:28:16 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169680#M25238</guid>
      <dc:creator>bleonhardi</dc:creator>
      <dc:date>2016-04-15T01:28:16Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169681#M25239</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/3567/maeveryan226.html" nodeid="3567"&gt;@Maeve Ryan&lt;/A&gt; &lt;/P&gt;&lt;P&gt;Hi, please let me know if you are still stuck in this issue. Thanks&lt;/P&gt;</description>
      <pubDate>Fri, 15 Apr 2016 15:50:08 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169681#M25239</guid>
      <dc:creator>jyadav</dc:creator>
      <dc:date>2016-04-15T15:50:08Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169682#M25240</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/2528/jyadav.html" nodeid="2528"&gt;@Jitendra Yadav&lt;/A&gt;&lt;P&gt;Thanks very much for your help. This issue has been resolved.&lt;/P&gt;</description>
      <pubDate>Mon, 18 Apr 2016 01:58:06 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169682#M25240</guid>
      <dc:creator>maeve_ryan226</dc:creator>
      <dc:date>2016-04-18T01:58:06Z</dc:date>
    </item>
    <item>
      <title>Re: HDFS- Non DFS space allocation/capacity</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169683#M25241</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/168/bleonhardi.html" nodeid="168"&gt;@Benjamin Leonhardi&lt;/A&gt; -  This was indeed part of the reason. Thank you very much for your help!&lt;/P&gt;</description>
      <pubDate>Mon, 18 Apr 2016 01:59:00 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/HDFS-Non-DFS-space-allocation-capacity/m-p/169683#M25241</guid>
      <dc:creator>maeve_ryan226</dc:creator>
      <dc:date>2016-04-18T01:59:00Z</dc:date>
    </item>
  </channel>
</rss>

