<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: how to configure mergecontent processor in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/how-to-configure-mergecontent-processor/m-p/183650#M83166</link>
    <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/363/bbende.html" nodeid="363"&gt;@Bryan Bende&lt;/A&gt; &lt;/P&gt;&lt;P&gt;I have checked my data, it has no new blank spaces, but was arriving in batches.&lt;/P&gt;&lt;P&gt;I am merging the files and appending using puthdfs.&lt;/P&gt;&lt;P&gt;When I use the configurations you suggested, sometimes I am getting a new blank line at the beginning of the file which is appended using puthdfs.&lt;/P&gt;&lt;P&gt;Can you please help me avoid the blank line at the beginning of the file? Also, the file is big (1GB).&lt;/P&gt;</description>
    <pubDate>Thu, 06 Sep 2018 10:35:22 GMT</pubDate>
    <dc:creator>mark_hadoop</dc:creator>
    <dc:date>2018-09-06T10:35:22Z</dc:date>
    <item>
      <title>how to configure mergecontent processor</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/how-to-configure-mergecontent-processor/m-p/183648#M83164</link>
      <description>&lt;P&gt;Hi All,&lt;/P&gt;&lt;P&gt;I have json data in multiple small files (sometimes only one line in a file).&lt;/P&gt;&lt;P&gt;I want to merge all small files into a single large file.&lt;/P&gt;&lt;P&gt;I am getting a large file in an unexpected format.&lt;/P&gt;&lt;P&gt;&lt;STRONG&gt;ex:&lt;/STRONG&gt;&lt;/P&gt;
&lt;BLOCKQUOTE&gt;&lt;STRONG&gt;file 1:&lt;BR /&gt;&lt;/STRONG&gt;&lt;PRE&gt;{"code"="1", "color"="green"}
{"code"="2", "color"="blue"}
{"code"="3", "color"="orange"}

&lt;/PRE&gt;
&lt;/BLOCKQUOTE&gt;
&lt;BLOCKQUOTE&gt;&lt;STRONG&gt;file 2:&lt;/STRONG&gt;&lt;BR /&gt;&lt;PRE&gt;{"code"="4", "color"="yellow"}
{"code"="5", "color"="red"}&lt;/PRE&gt;
I am getting the below output after using MergeContent&lt;BR /&gt;&lt;PRE&gt;{"code"="1", "color"="green"}
{"code"="2", "color"="blue"}
{"code"="3", "color"="orange"}{"code"="4", "color"="yellow"}
{"code"="5", "color"="red"}&lt;/PRE&gt;
Expected output&lt;BR /&gt;&lt;PRE&gt;{"code"="1", "color"="green"}
{"code"="2", "color"="blue"}
{"code"="3", "color"="orange"}
{"code"="4", "color"="yellow"}
{"code"="5", "color"="red"}&lt;/PRE&gt;
&lt;/BLOCKQUOTE&gt;</description>
      <pubDate>Wed, 05 Sep 2018 16:42:14 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/how-to-configure-mergecontent-processor/m-p/183648#M83164</guid>
      <dc:creator>mark_hadoop</dc:creator>
      <dc:date>2018-09-05T16:42:14Z</dc:date>
    </item>
    <item>
      <title>Re: how to configure mergecontent processor</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/how-to-configure-mergecontent-processor/m-p/183649#M83165</link>
      <description>&lt;P&gt;I answered this on stackoverflow:&lt;/P&gt;&lt;P&gt;&lt;A href="https://stackoverflow.com/questions/52188619/mergecontent-processor-is-not-giving-expected-result" target="_blank"&gt;https://stackoverflow.com/questions/52188619/mergecontent-processor-is-not-giving-expected-result&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 06 Sep 2018 02:31:36 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/how-to-configure-mergecontent-processor/m-p/183649#M83165</guid>
      <dc:creator>bbende</dc:creator>
      <dc:date>2018-09-06T02:31:36Z</dc:date>
    </item>
    <item>
      <title>Re: how to configure mergecontent processor</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/how-to-configure-mergecontent-processor/m-p/183650#M83166</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/363/bbende.html" nodeid="363"&gt;@Bryan Bende&lt;/A&gt; &lt;/P&gt;&lt;P&gt;I have checked my data, it has no new blank spaces, but was arriving in batches.&lt;/P&gt;&lt;P&gt;I am merging the files and appending using puthdfs.&lt;/P&gt;&lt;P&gt;When I use the configurations you suggested, sometimes I am getting a new blank line at the beginning of the file which is appended using puthdfs.&lt;/P&gt;&lt;P&gt;Can you please help me avoid the blank line at the beginning of the file? Also, the file is big (1GB).&lt;/P&gt;</description>
      <pubDate>Thu, 06 Sep 2018 10:35:22 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/how-to-configure-mergecontent-processor/m-p/183650#M83166</guid>
      <dc:creator>mark_hadoop</dc:creator>
      <dc:date>2018-09-06T10:35:22Z</dc:date>
    </item>
  </channel>
</rss>

