<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Cleaning data HDFS in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/410665#M252883</link>
    <description>&lt;P&gt;Hi everyone, can you help me, please?&lt;/P&gt;&lt;P&gt;In my cluster, each node has 80% of its storage used. I want to clean up each node, but I am very worried that deleting data from the /hadoop/hdfs/data folder will affect the HDFS cluster. See below: capacity left is 1TB but capacity used is 2TB, yet I do not have table data in my cluster.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="rizalt_0-1750302119893.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/46117i2BA53AA1DC868B3A/image-size/medium?v=v2&amp;amp;px=400" role="button" title="rizalt_0-1750302119893.png" alt="rizalt_0-1750302119893.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;I do not have tables in my cluster, as shown below:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="rizalt_1-1750302397603.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/46118i244D1D39ED7DB1F1/image-size/medium?v=v2&amp;amp;px=400" role="button" title="rizalt_1-1750302397603.png" alt="rizalt_1-1750302397603.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Please give suggestions for this case. Can I remove files in the folder&amp;nbsp;/hadoop/hdfs/data? Please tell me step by step how to remove them.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Thu, 19 Jun 2025 03:11:55 GMT</pubDate>
    <dc:creator>rizalt</dc:creator>
    <dc:date>2025-06-19T03:11:55Z</dc:date>
    <item>
      <title>Cleaning data HDFS</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/410665#M252883</link>
      <description>&lt;P&gt;Hi everyone, can you help me, please?&lt;/P&gt;&lt;P&gt;In my cluster, each node has 80% of its storage used. I want to clean up each node, but I am very worried that deleting data from the /hadoop/hdfs/data folder will affect the HDFS cluster. See below: capacity left is 1TB but capacity used is 2TB, yet I do not have table data in my cluster.&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="rizalt_0-1750302119893.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/46117i2BA53AA1DC868B3A/image-size/medium?v=v2&amp;amp;px=400" role="button" title="rizalt_0-1750302119893.png" alt="rizalt_0-1750302119893.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;I do not have tables in my cluster, as shown below:&lt;/P&gt;&lt;P&gt;&lt;span class="lia-inline-image-display-wrapper lia-image-align-inline" image-alt="rizalt_1-1750302397603.png" style="width: 400px;"&gt;&lt;img src="https://community.cloudera.com/t5/image/serverpage/image-id/46118i244D1D39ED7DB1F1/image-size/medium?v=v2&amp;amp;px=400" role="button" title="rizalt_1-1750302397603.png" alt="rizalt_1-1750302397603.png" /&gt;&lt;/span&gt;&lt;/P&gt;&lt;P&gt;Please give suggestions for this case. Can I remove files in the folder&amp;nbsp;/hadoop/hdfs/data? Please tell me step by step how to remove them.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 19 Jun 2025 03:11:55 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/410665#M252883</guid>
      <dc:creator>rizalt</dc:creator>
      <dc:date>2025-06-19T03:11:55Z</dc:date>
    </item>
    <item>
      <title>Re: Cleaning data HDFS</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/411105#M252989</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109307"&gt;@rizalt&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks for posting your questions on Cloudera Community forum!&lt;BR /&gt;&lt;BR /&gt;If I understood well, your space usage is high although it seems you don't have any data in hdfs at all.&lt;BR /&gt;&lt;BR /&gt;For confirmation, could you please run this command against hdfs (make sure to have a Kerberos ticket if the cluster is kerberized):&lt;/P&gt;&lt;P&gt;hdfs dfs -du -h /&lt;/P&gt;&lt;P&gt;or show me from the browse directory page, the root folder.&lt;/P&gt;&lt;P&gt;Finally, to answer your immediate question, please don't remove any data from&amp;nbsp; /hadoop/hdfs/data.&amp;nbsp; It is preferred to remove things using the proper tools.&amp;nbsp; We will walk you through it once we get the above information.&lt;/P&gt;&lt;P&gt;Regards,&lt;/P&gt;&lt;P&gt;JR&lt;/P&gt;</description>
      <pubDate>Wed, 02 Jul 2025 19:58:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/411105#M252989</guid>
      <dc:creator>jromero</dc:creator>
      <dc:date>2025-07-02T19:58:09Z</dc:date>
    </item>
    <item>
      <title>Re: Cleaning data HDFS</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/411106#M252990</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109307"&gt;@rizalt&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Do not try to delete anything on&amp;nbsp;&lt;SPAN&gt;/hadoop/hdfs/data. From your query it seems you may have snapshots enabled which might be holding the blocks. Deleting the snapshots that belong to /warehouse/tablespace/managed/hive may help to recover the space. You may check if snapshots are enabled for /warehouse or its child directories using the below command.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;$ hdfs lsSnapshottableDir&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;If you find a snapshot for this directory, you may delete it from Cloudera Manager using the procedure specified in the below documentation.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;&lt;A href="https://docs.cloudera.com/runtime/7.3.1/data-protection/topics/hdfs-deleting-snapshots-cm.html" target="_blank" rel="noopener"&gt;https://docs.cloudera.com/runtime/7.3.1/data-protection/topics/hdfs-deleting-snapshots-cm.html&lt;/A&gt;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;While deleting the snapshots, start with the oldest and proceed to the newest.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Wed, 02 Jul 2025 20:11:01 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/411106#M252990</guid>
      <dc:creator>sathishkr</dc:creator>
      <dc:date>2025-07-02T20:11:01Z</dc:date>
    </item>
    <item>
      <title>Re: Cleaning data HDFS</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/411108#M252992</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/109307"&gt;@rizalt&lt;/a&gt;&amp;nbsp;,&lt;/P&gt;&lt;P&gt;From your report, you probably have snapshots enabled for this directory, so any delete in this directory will not be 100% effective unless the snapshot is also deleted.&lt;/P&gt;&lt;P&gt;Deleting the snapshot will make it impossible to recover data if necessary.&lt;/P&gt;&lt;P&gt;So, on the NameNode web UI page, in the "snapshot" tab, check your snapshots.&lt;/P&gt;</description>
      <pubDate>Wed, 02 Jul 2025 20:34:43 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cleaning-data-HDFS/m-p/411108#M252992</guid>
      <dc:creator>yagoaparecidoti</dc:creator>
      <dc:date>2025-07-02T20:34:43Z</dc:date>
    </item>
  </channel>
</rss>

