<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Recommended config: mapreduce.input.fileinputformat.split.[minsize|maxsize] in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96062#M9475</link>
    <description>&lt;P&gt;Thanks for sharing &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;  &lt;A rel="user" href="https://community.cloudera.com/users/113/jstraub.html" nodeid="113"&gt;@Jonas Straub&lt;/A&gt;&lt;/P&gt;</description>
    <pubDate>Wed, 28 Oct 2015 18:28:23 GMT</pubDate>
    <dc:creator>nsabharwal</dc:creator>
    <dc:date>2015-10-28T18:28:23Z</dc:date>
    <item>
      <title>Recommended config: mapreduce.input.fileinputformat.split.[minsize|maxsize]</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96059#M9472</link>
      <description>&lt;P&gt;What is the purpose of the following two configuration parameters in &lt;EM&gt;mapred-site.xml&lt;/EM&gt;? What are the recommended values?&lt;/P&gt;&lt;PRE&gt;mapreduce.input.fileinputformat.split.minsize
mapreduce.input.fileinputformat.split.maxsize&lt;/PRE&gt;&lt;P&gt;Thanks &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;&lt;/P&gt;</description>
      <pubDate>Tue, 27 Oct 2015 15:55:33 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96059#M9472</guid>
      <dc:creator>jstraub</dc:creator>
      <dc:date>2015-10-27T15:55:33Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended config: mapreduce.input.fileinputformat.split.[minsize|maxsize]</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96060#M9473</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/113/jstraub.html" nodeid="113"&gt;@Jonas Straub&lt;/A&gt;&lt;P&gt;I found &lt;A target="_blank" href="http://stackoverflow.com/questions/19188315/behavior-of-the-parameter-mapred-min-split-size-in-hdfs"&gt;this&lt;/A&gt; really useful &lt;/P&gt;&lt;P&gt;Also, from Apache &lt;A target="_blank" href="https://hadoop.apache.org/docs/current/hadoop-project-dist/hadoop-common/DeprecatedProperties.html"&gt;doc&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;STRONG&gt;Deprecated property name  &lt;/STRONG&gt;&lt;/P&gt;mapred.min.split.size&lt;P&gt;New&lt;/P&gt;mapreduce.input.fileinputformat.split.minsize</description>
      <pubDate>Tue, 27 Oct 2015 19:41:42 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96060#M9473</guid>
      <dc:creator>nsabharwal</dc:creator>
      <dc:date>2015-10-27T19:41:42Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended config: mapreduce.input.fileinputformat.split.[minsize|maxsize]</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96061#M9474</link>
      <description>&lt;P&gt;Thanks &lt;A href="http://community.hortonworks.com/questions/2179/recommended-config-mapreduceinputfileinputformatsp.html#"&gt;@Neeraj&lt;/A&gt;&lt;/P&gt;&lt;P&gt;I also found these two books:&lt;/P&gt;&lt;P&gt;&lt;A href="https://books.google.de/books?id=uL59BAAAQBAJ&amp;amp;lpg=PA156&amp;amp;dq=mapreduce.input.fileinputformat.split.minsize&amp;amp;pg=PA156#v=onepage&amp;amp;q=mapreduce.input.fileinputformat.split.minsize&amp;amp;f=false"&gt;Pro Apache Hadoop&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://books.google.de/books?id=6BmkBwAAQBAJ&amp;amp;lpg=PT291&amp;amp;dq=mapreduce.input.fileinputformat.split.minsize%20smallest%20valid&amp;amp;pg=PT291#v=onepage&amp;amp;q=mapreduce.input.fileinputformat.split.minsize%20smallest%20valid&amp;amp;f=false"&gt;Hadoop Definitive Guide&lt;/A&gt;&lt;/P&gt;&lt;P&gt;And both are basically saying that &lt;STRONG&gt;mapreduce.input.fileinputformat.split.minsize &amp;lt; dfs.blocksize &amp;lt; ...maxsize&lt;/STRONG&gt;&lt;/P&gt;&lt;P&gt;Smartsense recommended: 105MB (minsize) and 270MB (maxsize)&lt;/P&gt;&lt;P&gt;Our current block setting is 64MB, although Smartsense recommended 128MB blocksize, so it kind of fits the min/max recommendations as well as the descriptions from the books.&lt;/P&gt;</description>
      <pubDate>Wed, 28 Oct 2015 18:16:47 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96061#M9474</guid>
      <dc:creator>jstraub</dc:creator>
      <dc:date>2015-10-28T18:16:47Z</dc:date>
    </item>
    <item>
      <title>Re: Recommended config: mapreduce.input.fileinputformat.split.[minsize|maxsize]</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96062#M9475</link>
      <description>&lt;P&gt;Thanks for sharing &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt;  &lt;A rel="user" href="https://community.cloudera.com/users/113/jstraub.html" nodeid="113"&gt;@Jonas Straub&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 28 Oct 2015 18:28:23 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Recommended-config-mapreduce-input-fileinputformat-split/m-p/96062#M9475</guid>
      <dc:creator>nsabharwal</dc:creator>
      <dc:date>2015-10-28T18:28:23Z</dc:date>
    </item>
  </channel>
</rss>

