<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question How to speed up "hdfs dfs -mv" for more than 30 000 files ? in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227833#M70253</link>
    <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;I've got 30 thousand of files to move to another hdfs directory. &lt;/P&gt;&lt;P&gt;Do you know a better way than "hdfs dfs -mv /mydirectory/* /targetdirectory" to go faster ?&lt;/P&gt;&lt;P&gt;Average size of a file :  10 Kb.&lt;/P&gt;&lt;P&gt;And I can't merge the files in a bigger one before.&lt;/P&gt;&lt;P&gt;Thanks for your feedback&lt;/P&gt;</description>
    <pubDate>Wed, 25 Oct 2017 19:07:57 GMT</pubDate>
    <dc:creator>thierry_vernhet</dc:creator>
    <dc:date>2017-10-25T19:07:57Z</dc:date>
    <item>
      <title>How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227833#M70253</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;I've got 30 thousand of files to move to another hdfs directory. &lt;/P&gt;&lt;P&gt;Do you know a better way than "hdfs dfs -mv /mydirectory/* /targetdirectory" to go faster ?&lt;/P&gt;&lt;P&gt;Average size of a file :  10 Kb.&lt;/P&gt;&lt;P&gt;And I can't merge the files in a bigger one before.&lt;/P&gt;&lt;P&gt;Thanks for your feedback&lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 19:07:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227833#M70253</guid>
      <dc:creator>thierry_vernhet</dc:creator>
      <dc:date>2017-10-25T19:07:57Z</dc:date>
    </item>
    <item>
      <title>Re: How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227834#M70254</link>
      <description>&lt;P&gt;1. dfs -mv is the fastest as compare to -cp or distcp .  &lt;BR /&gt;If possible move  mydirectory  instead of  mydirectory/* into /targetdirectory&lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 19:12:59 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227834#M70254</guid>
      <dc:creator>kgautam</dc:creator>
      <dc:date>2017-10-25T19:12:59Z</dc:date>
    </item>
    <item>
      <title>Re: How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227835#M70255</link>
      <description>&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;Not possible because the result is /targetdirectory/mydirectory and I expect all the files moved in path /targetdirectory/*&lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 19:22:24 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227835#M70255</guid>
      <dc:creator>thierry_vernhet</dc:creator>
      <dc:date>2017-10-25T19:22:24Z</dc:date>
    </item>
    <item>
      <title>Re: How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227836#M70256</link>
      <description>&lt;P&gt; &lt;A rel="user" href="https://community.cloudera.com/users/10685/thierryvernhet.html" nodeid="10685"&gt;@Thierry Vernhet&lt;/A&gt;,&lt;/P&gt;&lt;P&gt;If there are less files in /targetdirectory than the /mydirectory , you can do the below&lt;/P&gt;&lt;PRE&gt;hdfs dfs -mv /targetdirectory /x
hdfs dfs -mv /mydirectory /targetdirectory
hdfs dfs -mv /x/* /targetdirectory&lt;/PRE&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Aditya&lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 19:29:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227836#M70256</guid>
      <dc:creator>asirna</dc:creator>
      <dc:date>2017-10-25T19:29:09Z</dc:date>
    </item>
    <item>
      <title>Re: How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227837#M70257</link>
      <description>&lt;P&gt;Thanks but it doesn't work for the same reason. &lt;/P&gt;&lt;P&gt;When you "mv /mydirectory /targetdirectory" the result is always /targetdirectory/mydirectory. &lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 20:04:34 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227837#M70257</guid>
      <dc:creator>thierry_vernhet</dc:creator>
      <dc:date>2017-10-25T20:04:34Z</dc:date>
    </item>
    <item>
      <title>Re: How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227838#M70258</link>
      <description>&lt;P&gt; &lt;A href="https://community.hortonworks.com/questions/142457/how-to-speed-up-hdfs-dfs-mv-for-more-than-30-000-f.html?childToView=142460#"&gt;@Thierry Vernhet&lt;/A&gt;,&lt;/P&gt;&lt;P&gt;After running the first command targetdirectory will be renamed to x.&lt;/P&gt;&lt;P&gt;So mv /mydirectory /targetdirectory is not /targetdirectory/mydirectory , instead it will just rename mydirectory to targetdirectory since the destination directory doesn't exist.&lt;/P&gt;&lt;P&gt;So, if targetdirectory has less files this is an option.Instead of moving 30k files, you can move less files&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Aditya&lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 20:17:56 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227838#M70258</guid>
      <dc:creator>asirna</dc:creator>
      <dc:date>2017-10-25T20:17:56Z</dc:date>
    </item>
    <item>
      <title>Re: How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227839#M70259</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/14200/asirna.html" nodeid="14200"&gt;@Aditya Sirna&lt;/A&gt;,&lt;/P&gt;&lt;P&gt;Of course... I'm going to try this.&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 20:36:55 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227839#M70259</guid>
      <dc:creator>thierry_vernhet</dc:creator>
      <dc:date>2017-10-25T20:36:55Z</dc:date>
    </item>
    <item>
      <title>Re: How to speed up "hdfs dfs -mv" for more than 30 000 files ?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227840#M70260</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/10685/thierryvernhet.html" nodeid="10685"&gt;@Thierry Vernhet&lt;/A&gt;&lt;P&gt;If you have more than 10 GB, I'd recommend use distcp instead of using Copy OR Move.&lt;/P&gt;</description>
      <pubDate>Wed, 25 Oct 2017 20:54:30 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-to-speed-up-quot-hdfs-dfs-mv-quot-for-more-than-30-000/m-p/227840#M70260</guid>
      <dc:creator>divakarreddy_a</dc:creator>
      <dc:date>2017-10-25T20:54:30Z</dc:date>
    </item>
  </channel>
</rss>

