<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: MapReduce performance on the HBase input table. in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/MapReduce-performance-on-the-HBase-input-table/m-p/163414#M45220</link>
    <description>&lt;P&gt;TableInputFormat used in HBase will create 1 map task per table region. The data size will depend on how big your regions are. &lt;/P&gt;</description>
    <pubDate>Fri, 04 Nov 2016 00:56:32 GMT</pubDate>
    <dc:creator>Enis</dc:creator>
    <dc:date>2016-11-04T00:56:32Z</dc:date>
    <item>
      <title>MapReduce performance on the HBase input table.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/MapReduce-performance-on-the-HBase-input-table/m-p/163413#M45219</link>
      <description>&lt;P&gt;While running a MR on the HDFS file, the # of mappers is based on the input split size. It is usually true that
the input split size will match the block size with a text input file in hdfs
(I understand not always the case but most of the time).&lt;/P&gt;&lt;P&gt;What will happen when I run a MR on the hbase
table as an input record? How does the input split size match with the hbase
table and how can I control the number of mappers while running MR on top of the
HBase table? Can someone guide me here? Using hbase 0.98.4 and hadoop 2.6 version.&lt;/P&gt;</description>
      <pubDate>Thu, 03 Nov 2016 19:48:17 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/MapReduce-performance-on-the-HBase-input-table/m-p/163413#M45219</guid>
      <dc:creator>arunkumar_d</dc:creator>
      <dc:date>2016-11-03T19:48:17Z</dc:date>
    </item>
    <item>
      <title>Re: MapReduce performance on the HBase input table.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/MapReduce-performance-on-the-HBase-input-table/m-p/163414#M45220</link>
      <description>&lt;P&gt;TableInputFormat used in HBase will create 1 map task per table region. The data size will depend on how big your regions are. &lt;/P&gt;</description>
      <pubDate>Fri, 04 Nov 2016 00:56:32 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/MapReduce-performance-on-the-HBase-input-table/m-p/163414#M45220</guid>
      <dc:creator>Enis</dc:creator>
      <dc:date>2016-11-04T00:56:32Z</dc:date>
    </item>
  </channel>
</rss>

