<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Flume adding line feed after 2048 characters in a row in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Flume-adding-line-feed-after-2048-characters-in-a-row/m-p/39224#M50274</link>
    <description>&lt;P&gt;The default maxLineLength for the LINE deserializer is 2048:&lt;BR /&gt;&lt;A href="http://archive.cloudera.com/cdh5/cdh/5/flume-ng/FlumeUserGuide.html#line" target="_blank"&gt;http://archive.cloudera.com/cdh5/cdh/5/flume-ng/FlumeUserGuide.html#line&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;You can set the following to accommodate your large events:&lt;BR /&gt;agent.sources.axon_source.deserializer.maxLineLength=10000&lt;/P&gt;</description>
    <pubDate>Thu, 31 Mar 2016 19:41:46 GMT</pubDate>
    <dc:creator>pdvorak</dc:creator>
    <dc:date>2016-03-31T19:41:46Z</dc:date>
    <item>
      <title>Flume adding line feed after 2048 characters in a row</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Flume-adding-line-feed-after-2048-characters-in-a-row/m-p/39222#M50273</link>
      <description>&lt;P&gt;I have a Flume 1.5 agent running on an Ubuntu workstation that collects logs from various devices and re-formats the logs into a comma-delimited file with very long rows. After the collection and reformatting of the logs they are placed into a spool directory where the Flume Agent sends the log files to a Hadoop server running a Flume agent that accepts the log files and places them in an HDFS directory.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Everything works fine except that when Flume sends the file to the HDFS directory there are Line Feeds after every 2048 characters in each row.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Is there a setting to tell Flume to not insert line feeds?&lt;/P&gt;&lt;P&gt;Below are my config files:&lt;/P&gt;&lt;PRE&gt;#On Ubuntu Workstation
#list sources, sinks and channels in the agent
agent.sources = axon_source
agent.channels = memorychannel
agent.sinks = AvroOut

#define flow
agent.sources.axon_source.channels = memorychannel
agent.sinks.AvroOut.channel = memorychannel
agent.channels.memorychannel.type = memory
agent.channels.memorychannel.capacity = 100000

#source
agent.sources.axon_source.type = spooldir
agent.sources.axon_source.spoolDir = /home/ubuntu/workspace/logdump
agent.sources.axon_source.decodeErrorPolicy = ignore

#avro out
agent.sinks.AvroOut.type = avro
agent.sinks.AvroOut.hostname = 172.31.12.221
agent.sinks.AvroOut.port = 41415
agent.sinks.AvroOut.maxIoWorkers = 2


------------------------------------------------------------


#On Hadoop Server
agent.sources = AvroIn
agent.sources.AvroIn.type = avro
agent.sources.AvroIn.bind = 172.31.131.1
agent.sources.AvroIn.port = 41415
agent.sources.AvroIn.channels = MemChan1

agent.channels = MemChan1
agent.channels.MemChan1.type = memory
agent.channels.MemChan1.capacity = 100000

agent.sinks = HDFSSink
agent.sinks.HDFSSink.type = hdfs
agent.sinks.HDFSSink.channel = MemChan1
agent.sinks.HDFSSink.hdfs.path = /Logs/%Y%m/
agent.sinks.HDFSSink.hdfs.filePrefix = axoncapture
agent.sinks.HDFSSink.hdfs.fileSuffix = .log
agent.sinks.HDFSSink.hdfs.minBlockReplicas = 1
agent.sinks.HDFSSink.hdfs.rollCount = 0
agent.sinks.HDFSSink.hdfs.rollSize = 314572800
agent.sinks.HDFSSink.hdfs.writeFormat = Text
agent.sinks.HDFSSink.hdfs.fileType = DataStream
agent.sinks.HDFSSink.hdfs.useLocalTimeStamp = True&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;Thanks...Corey&lt;/P&gt;</description>
      <pubDate>Fri, 16 Sep 2022 10:11:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Flume-adding-line-feed-after-2048-characters-in-a-row/m-p/39222#M50273</guid>
      <dc:creator>coreyfarrar</dc:creator>
      <dc:date>2022-09-16T10:11:57Z</dc:date>
    </item>
    <item>
      <title>Re: Flume adding line feed after 2048 characters in a row</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Flume-adding-line-feed-after-2048-characters-in-a-row/m-p/39224#M50274</link>
      <description>&lt;P&gt;The default maxLineLength for the LINE deserializer is 2048:&lt;BR /&gt;&lt;A href="http://archive.cloudera.com/cdh5/cdh/5/flume-ng/FlumeUserGuide.html#line" target="_blank"&gt;http://archive.cloudera.com/cdh5/cdh/5/flume-ng/FlumeUserGuide.html#line&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;You can set the following to accommodate your large events:&lt;BR /&gt;agent.sources.axon_source.deserializer.maxLineLength=10000&lt;/P&gt;</description>
      <pubDate>Thu, 31 Mar 2016 19:41:46 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Flume-adding-line-feed-after-2048-characters-in-a-row/m-p/39224#M50274</guid>
      <dc:creator>pdvorak</dc:creator>
      <dc:date>2016-03-31T19:41:46Z</dc:date>
    </item>
  </channel>
</rss>

