<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Write MR job output to existing directory in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157894#M24503</link>
    <description>&lt;P&gt;It worked. Thanks!&lt;/P&gt;</description>
    <pubDate>Tue, 12 Apr 2016 00:24:32 GMT</pubDate>
    <dc:creator>shubham2629</dc:creator>
    <dc:date>2016-04-12T00:24:32Z</dc:date>
    <item>
      <title>Write MR job output to existing directory</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157889#M24498</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;Is it possible to write MR job output to an existing directory without deleting it (incremental write)?&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;&lt;P&gt;Shubham&lt;/P&gt;</description>
      <pubDate>Wed, 06 Apr 2016 13:27:05 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157889#M24498</guid>
      <dc:creator>shubham2629</dc:creator>
      <dc:date>2016-04-06T13:27:05Z</dc:date>
    </item>
    <item>
      <title>Re: Write MR job output to existing directory</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157890#M24499</link>
      <description>&lt;P&gt;You can add the following kind of logic to your MR application so that, if the output directory already exists, it is deleted first.&lt;/P&gt;&lt;PRE&gt;Configuration conf = new Configuration(); 
FileSystem fs = FileSystem.get(conf); 
if(fs.exists(new Path(args[1]))) {
      /*If exist delete the output path*/
       fs.delete(new Path(args[1]),true); 
}
&lt;/PRE&gt;</description>
      <pubDate>Wed, 06 Apr 2016 13:49:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157890#M24499</guid>
      <dc:creator>Former Member</dc:creator>
      <dc:date>2016-04-06T13:49:57Z</dc:date>
    </item>
    <item>
      <title>Re: Write MR job output to existing directory</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157891#M24500</link>
      <description>&lt;P&gt;I do not want to delete the existing directory, as I mentioned above. I want to write more data to the existing directory.&lt;/P&gt;</description>
      <pubDate>Wed, 06 Apr 2016 14:07:54 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157891#M24500</guid>
      <dc:creator>shubham2629</dc:creator>
      <dc:date>2016-04-06T14:07:54Z</dc:date>
    </item>
    <item>
      <title>Re: Write MR job output to existing directory</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157892#M24501</link>
      <description>&lt;P&gt;It can be done by extending the OutputFormat class and overriding the &lt;A href="https://hadoop.apache.org/docs/r2.7.1/api/org/apache/hadoop/mapreduce/OutputFormat.html#checkOutputSpecs%28org.apache.hadoop.mapreduce.JobContext%29"&gt;OutputFormat.checkOutputSpecs&lt;/A&gt; method so that it doesn't throw an exception when the output path already exists. After that, register the new class using the &lt;A href="https://hadoop.apache.org/docs/r2.7.1/api/org/apache/hadoop/mapred/JobConf.html"&gt;JobConf.setOutputFormatClass&lt;/A&gt; method [some more details &lt;A href="http://comments.gmane.org/gmane.comp.jakarta.lucene.hadoop.user/42813"&gt;here&lt;/A&gt;].&lt;/P&gt;</description>
      <pubDate>Wed, 06 Apr 2016 14:33:37 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157892#M24501</guid>
      <dc:creator>pminovic</dc:creator>
      <dc:date>2016-04-06T14:33:37Z</dc:date>
    </item>
    <item>
      <title>Re: Write MR job output to existing directory</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157893#M24502</link>
      <description>&lt;P&gt;Thanks! I will try that.&lt;/P&gt;</description>
      <pubDate>Wed, 06 Apr 2016 15:42:00 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157893#M24502</guid>
      <dc:creator>shubham2629</dc:creator>
      <dc:date>2016-04-06T15:42:00Z</dc:date>
    </item>
    <item>
      <title>Re: Write MR job output to existing directory</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157894#M24503</link>
      <description>&lt;P&gt;It worked. Thanks!&lt;/P&gt;</description>
      <pubDate>Tue, 12 Apr 2016 00:24:32 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Write-MR-job-output-to-existing-directory/m-p/157894#M24503</guid>
      <dc:creator>shubham2629</dc:creator>
      <dc:date>2016-04-12T00:24:32Z</dc:date>
    </item>
  </channel>
</rss>

