<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Resource Utilization for Distcp in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Resource-Utilization-for-Distcp/m-p/202041#M65760</link>
    <description>&lt;P&gt;When running a hadoop distcp command from source to target, is it possible to check the resource utilization in both the source and target clusters?&lt;/P&gt;</description>
    <pubDate>Mon, 31 Jul 2017 09:07:23 GMT</pubDate>
    <dc:creator>aljohnmangahas</dc:creator>
    <dc:date>2017-07-31T09:07:23Z</dc:date>
    <item>
      <title>Resource Utilization for Distcp</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Resource-Utilization-for-Distcp/m-p/202041#M65760</link>
      <description>&lt;P&gt;When running a hadoop distcp command from source to target, is it possible to check the resource utilization in both the source and target clusters?&lt;/P&gt;</description>
      <pubDate>Mon, 31 Jul 2017 09:07:23 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Resource-Utilization-for-Distcp/m-p/202041#M65760</guid>
      <dc:creator>aljohnmangahas</dc:creator>
      <dc:date>2017-07-31T09:07:23Z</dc:date>
    </item>
    <item>
      <title>Re: Resource Utilization for Distcp</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Resource-Utilization-for-Distcp/m-p/202042#M65761</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/18358/aljohnmangahas.html" nodeid="18358"&gt;@Al John Mangahas&lt;/A&gt; &lt;/P&gt;&lt;P&gt;DistCp spins off MapReduce jobs on the cluster it is run from.  You can use the YARN UI on that cluster to monitor the job progress and utilization.  &lt;/P&gt;&lt;P&gt;Having said that, if you are copying from a Prod cluster to a DR cluster, and are worried about resource usage, then you can actually run the DistCp job on the DR cluster and have it "pull" the data from Prod.  That way, the impact in terms of resources on Prod is minimal. &lt;/P&gt;</description>
      <pubDate>Tue, 01 Aug 2017 01:55:18 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Resource-Utilization-for-Distcp/m-p/202042#M65761</guid>
      <dc:creator>egarelnabi</dc:creator>
      <dc:date>2017-08-01T01:55:18Z</dc:date>
    </item>
  </channel>
</rss>

