<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Migrating HDFS data in S3 in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403890#M252222</link>
    <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/124421"&gt;@Zubair123&lt;/a&gt;,&amp;nbsp;Did the response help resolve your query? If it did, kindly mark the relevant reply as the solution, as it will aid others in locating the answer more easily in the future.&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Tue, 11 Mar 2025 06:04:25 GMT</pubDate>
    <dc:creator>VidyaSargur</dc:creator>
    <dc:date>2025-03-11T06:04:25Z</dc:date>
    <item>
      <title>Migrating HDFS data in S3</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403416#M252061</link>
      <description>&lt;P&gt;Hi,&amp;nbsp;&lt;/P&gt;&lt;P&gt;Currently I have 1 TB of data in HDFS that I am trying to migrate to S3 using the command below. Whenever I run this command, the job runs very fast&amp;nbsp; for 3 hours and then slows down. I started the job last week and it is still running, very slowly. Is this expected behavior?&amp;nbsp;&amp;nbsp;&lt;/P&gt;&lt;P&gt;nohup hadoop distcp -Dfs.s3a.access.key="$AWS_ACCESS_KEY_ID" -Dfs.s3a.secret.key="$AWS_SECRET_ACCESS_KEY" -Dfs.s3a.fast.upload=true -Dfs.s3a.fast.buffer.size=1048576 -Dfs.s3a.multipart.size=10485760 -Dfs.s3a.multipart.threshold=10485760 -Dmapreduce.map.memory.mb=8192 -Dmapreduce.map.java.opts=-Xmx7360m -m=300 -bandwidth 400 -update hdfs:&amp;lt;....&amp;gt; s3a://&amp;lt;.......&amp;gt;&lt;/P&gt;</description>
      <pubDate>Mon, 03 Mar 2025 07:51:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403416#M252061</guid>
      <dc:creator>Zubair123</dc:creator>
      <dc:date>2025-03-03T07:51:09Z</dc:date>
    </item>
    <item>
      <title>Re: Migrating HDFS data in S3</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403485#M252082</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/124421"&gt;@Zubair123&lt;/a&gt;,&amp;nbsp;Welcome to our community! To help you get the best possible answer, I have tagged in our HDFS experts&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/82089"&gt;@willx&lt;/a&gt;&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/75213"&gt;@ChethanYM&lt;/a&gt;&amp;nbsp; who may be able to assist you further.&lt;BR /&gt;&lt;BR /&gt;Please feel free to provide any additional information or details about your query, and we hope that you will find a satisfactory solution to your question.&lt;/P&gt;</description>
      <pubDate>Tue, 04 Mar 2025 10:36:23 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403485#M252082</guid>
      <dc:creator>VidyaSargur</dc:creator>
      <dc:date>2025-03-04T10:36:23Z</dc:date>
    </item>
    <item>
      <title>Re: Migrating HDFS data in S3</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403518#M252092</link>
      <description>&lt;P&gt;You may want to collect the YARN application logs to understand what happened after 3 hours; for example, it may be a YARN resource issue or stuck containers.&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;1. Enable console debug logging, re-run distcp, and save the output&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;export HADOOP_ROOT_LOGGER=DEBUG,console&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;nohup hadoop distcp -Dfs.s3a.access.key="$AWS_ACCESS_KEY_ID" -Dfs.s3a.secret.key="$AWS_SECRET_ACCESS_KEY" -Dfs.s3a.fast.upload=true -Dfs.s3a.fast.buffer.size=1048576 -Dfs.s3a.multipart.size=10485760 -Dfs.s3a.multipart.threshold=10485760 -Dmapreduce.map.memory.mb=8192 -Dmapreduce.map.java.opts=-Xmx7360m -m=300 -bandwidth 400 -update [hdfs path] [s3a path] &amp;gt; distcp_console.out 2&amp;gt;&amp;amp;1 &amp;amp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;2. Collect the YARN application logs:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;yarn logs -applicationId [applicationID] &amp;gt; /tmp/distcp_application.out&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;3. If there are stuck YARN containers, collect a jstack of the container PID; refer to the post below&lt;/P&gt;&lt;P&gt;&lt;A href="https://my.cloudera.com/knowledge/How-to-collect-thread-dumps-for-stuck-YARN-containers-via-jstack?id=73696" target="_blank"&gt;https://my.cloudera.com/knowledge/How-to-collect-thread-dumps-for-stuck-YARN-containers-via-jstack?id=73696&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 04 Mar 2025 18:10:26 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403518#M252092</guid>
      <dc:creator>willx</dc:creator>
      <dc:date>2025-03-04T18:10:26Z</dc:date>
    </item>
    <item>
      <title>Re: Migrating HDFS data in S3</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403890#M252222</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/124421"&gt;@Zubair123&lt;/a&gt;,&amp;nbsp;Did the response help resolve your query? If it did, kindly mark the relevant reply as the solution, as it will aid others in locating the answer more easily in the future.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 11 Mar 2025 06:04:25 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403890#M252222</guid>
      <dc:creator>VidyaSargur</dc:creator>
      <dc:date>2025-03-11T06:04:25Z</dc:date>
    </item>
    <item>
      <title>Re: Migrating HDFS data in S3</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403938#M252241</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/82089"&gt;@willx&lt;/a&gt;&amp;nbsp;I really appreciate your response; it looks like I don't have access to the article.&lt;/P&gt;&lt;P&gt;&lt;A href="https://my.cloudera.com/knowledge/How-to-collect-thread-dumps-for-stuck-YARN-containers-via-jstack?id=73696" target="_blank" rel="noopener noreferrer"&gt;https://my.cloudera.com/knowledge/How-to-collect-thread-dumps-for-stuck-YARN-containers-via-jstack?i...&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Can you please share the solution? I would really appreciate the help.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Zubair.&lt;/P&gt;</description>
      <pubDate>Tue, 11 Mar 2025 17:23:07 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403938#M252241</guid>
      <dc:creator>Zubair123</dc:creator>
      <dc:date>2025-03-11T17:23:07Z</dc:date>
    </item>
    <item>
      <title>Re: Migrating HDFS data in S3</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403939#M252242</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/32119"&gt;@VidyaSargur&lt;/a&gt;&amp;nbsp;I don't have access to the article; I am waiting for the solution to be shared.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 11 Mar 2025 17:23:53 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/403939#M252242</guid>
      <dc:creator>Zubair123</dc:creator>
      <dc:date>2025-03-11T17:23:53Z</dc:date>
    </item>
    <item>
      <title>Re: Migrating HDFS data in S3</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/404003#M252254</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/124421"&gt;@Zubair123&lt;/a&gt;,&amp;nbsp;This article is available exclusively for our customers. If you're a customer, please contact our customer support team for more details. If you’re not, our &lt;A href="https://www.cloudera.com/contact-sales.html" target="_self"&gt;sales&lt;/A&gt; team would happily assist you with any information you need.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Thu, 13 Mar 2025 05:57:11 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Migrating-HDFS-data-in-S3/m-p/404003#M252254</guid>
      <dc:creator>VidyaSargur</dc:creator>
      <dc:date>2025-03-13T05:57:11Z</dc:date>
    </item>
  </channel>
</rss>

