<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: URGENT: Distcp -update -delete is not deleting files in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/URGENT-Distcp-update-delete-is-not-deleting-files/m-p/388090#M246524</link>
    <description>&lt;P&gt;Hello, can you please share the distcp code you were using, with all the necessary parameters?&lt;BR /&gt;Also, did you try to run the same with debug logging to the console to understand more?&lt;/P&gt;&lt;P class="p1"&gt;&lt;STRONG&gt;HADOOP_ROOT_LOGGER=DEBUG,console&lt;/STRONG&gt;&lt;/P&gt;</description>
    <pubDate>Mon, 20 May 2024 06:36:33 GMT</pubDate>
    <dc:creator>Asfahan</dc:creator>
    <dc:date>2024-05-20T06:36:33Z</dc:date>
    <item>
      <title>URGENT: Distcp -update -delete is not deleting files</title>
      <link>https://community.cloudera.com/t5/Support-Questions/URGENT-Distcp-update-delete-is-not-deleting-files/m-p/372831#M241392</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;&lt;BR /&gt;We are on CDP 7.1.7 SP1 and, as per my understanding, when DistCp is executed with the below parameters, it does the following:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;1. update: this will update the files in the destination that have been modified at the source.&lt;/P&gt;&lt;P&gt;2. delete: this will delete the files that exist in the destination but not in the source.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Apart from the above, it will copy over any new files at the source that do not exist in the destination.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;While copy and update are happening, it does not delete the files but instead duplicates them, and hence the data count at the destination is double that of the source.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Kindly help urgently, as we are on the verge of initiating a heavy data copy.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;snm1523&lt;/P&gt;</description>
      <pubDate>Fri, 16 Jun 2023 18:11:20 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/URGENT-Distcp-update-delete-is-not-deleting-files/m-p/372831#M241392</guid>
      <dc:creator>snm1523</dc:creator>
      <dc:date>2023-06-16T18:11:20Z</dc:date>
    </item>
    <item>
      <title>Re: URGENT: Distcp -update -delete is not deleting files</title>
      <link>https://community.cloudera.com/t5/Support-Questions/URGENT-Distcp-update-delete-is-not-deleting-files/m-p/388090#M246524</link>
      <description>&lt;P&gt;Hello, can you please share the distcp code you were using, with all the necessary parameters?&lt;BR /&gt;Also, did you try to run the same with debug logging to the console to understand more?&lt;/P&gt;&lt;P class="p1"&gt;&lt;STRONG&gt;HADOOP_ROOT_LOGGER=DEBUG,console&lt;/STRONG&gt;&lt;/P&gt;</description>
      <pubDate>Mon, 20 May 2024 06:36:33 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/URGENT-Distcp-update-delete-is-not-deleting-files/m-p/388090#M246524</guid>
      <dc:creator>Asfahan</dc:creator>
      <dc:date>2024-05-20T06:36:33Z</dc:date>
    </item>
  </channel>
</rss>

