<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: How can I control the size of the blocks that hive writes to s3? in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-can-I-control-the-size-of-the-blocks-that-hive-writes-to/m-p/161103#M45110</link>
    <description>&lt;P&gt;@Peter Coates - look for the parameters &lt;CODE&gt;fs.s3a.multipart.threshold&lt;/CODE&gt; and &lt;CODE&gt;fs.s3a.multipart.size&lt;/CODE&gt;&lt;/P&gt;</description>
    <pubDate>Wed, 02 Nov 2016 21:00:17 GMT</pubDate>
    <dc:creator>njayakumar</dc:creator>
    <dc:date>2016-11-02T21:00:17Z</dc:date>
    <item>
      <title>How can I control the size of the blocks that hive writes to s3?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-can-I-control-the-size-of-the-blocks-that-hive-writes-to/m-p/161102#M45109</link>
      <description>&lt;P&gt;I'm using insert-into to write data up to S3, but it's writing very large files--0.8GB to 1.8 GB plus one of just a few K. I've tried tez.grouping.max-size and min-size, but neither seems to limit either the min or the max size of the files that are generated. I've also tried controlling the number of mappers and reducers, but to no avail. &lt;/P&gt;</description>
      <pubDate>Wed, 02 Nov 2016 20:55:23 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-can-I-control-the-size-of-the-blocks-that-hive-writes-to/m-p/161102#M45109</guid>
      <dc:creator>coatespt</dc:creator>
      <dc:date>2016-11-02T20:55:23Z</dc:date>
    </item>
    <item>
      <title>Re: How can I control the size of the blocks that hive writes to s3?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-can-I-control-the-size-of-the-blocks-that-hive-writes-to/m-p/161103#M45110</link>
      <description>&lt;P&gt;@Peter Coates - look for the parameters &lt;CODE&gt;fs.s3a.multipart.threshold&lt;/CODE&gt; and &lt;CODE&gt;fs.s3a.multipart.size&lt;/CODE&gt;&lt;/P&gt;</description>
      <pubDate>Wed, 02 Nov 2016 21:00:17 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-can-I-control-the-size-of-the-blocks-that-hive-writes-to/m-p/161103#M45110</guid>
      <dc:creator>njayakumar</dc:creator>
      <dc:date>2016-11-02T21:00:17Z</dc:date>
    </item>
  </channel>
</rss>

