<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Data ingestion using flume - Visualize website clickstream data in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140569#M19428</link>
    <description>&lt;P&gt;Thank you.&lt;/P&gt;</description>
    <pubDate>Sun, 14 Feb 2016 21:12:49 GMT</pubDate>
    <dc:creator>Eukrev</dc:creator>
    <dc:date>2016-02-14T21:12:49Z</dc:date>
    <item>
      <title>Data ingestion using flume - Visualize website clickstream data</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140566#M19425</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;How can I use Flume to ingest data into HDFS instead of NFS in the below use case?
&lt;A href="http://hortonworks.com/hadoop-tutorial/how-to-visualize-website-clickstream-data/#section_1"&gt;http://hortonworks.com/hadoop-tutorial/how-to-visualize-website-clickstream-data/#section_1&lt;/A&gt;&lt;/P&gt;&lt;P&gt;For semi-structured data that is placed in the Omniture weblog directory, I would like to confirm the source type:&lt;/P&gt;&lt;P&gt;should it be the spooling directory source or multiport_syslogtcp? Which one should I use?&lt;/P&gt;&lt;P&gt;Thank you.&lt;/P&gt;</description>
      <pubDate>Sun, 14 Feb 2016 10:40:39 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140566#M19425</guid>
      <dc:creator>Eukrev</dc:creator>
      <dc:date>2016-02-14T10:40:39Z</dc:date>
    </item>
    <item>
      <title>Re: Data ingestion using flume - Visualize website clickstream data</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140567#M19426</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2579/revathymurugesan.html" nodeid="2579"&gt;@Revathy Mourouguessane&lt;/A&gt;&lt;/P&gt;&lt;P&gt;I hope this link will help you.&lt;/P&gt;&lt;P&gt;&lt;A href="https://flume.apache.org/FlumeUserGuide.html" target="_blank"&gt;https://flume.apache.org/FlumeUserGuide.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Sun, 14 Feb 2016 11:17:59 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140567#M19426</guid>
      <dc:creator>divakarreddy_a</dc:creator>
      <dc:date>2016-02-14T11:17:59Z</dc:date>
    </item>
    <item>
      <title>Re: Data ingestion using flume - Visualize website clickstream data</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140568#M19427</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/2579/revathymurugesan.html" nodeid="2579"&gt;@Revathy Mourouguessane&lt;/A&gt;&lt;P&gt;Spooling dir is good when you want to watch a directory for new files. Syslog listens on a port. So if your logs land in a directory, you would use spooling dir. For HDFS you would use the HDFS sink. Once you have mastered Flume, check out Apache NiFi.&lt;/P&gt;</description>
      <pubDate>Sun, 14 Feb 2016 20:48:47 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140568#M19427</guid>
      <dc:creator>aervits</dc:creator>
      <dc:date>2016-02-14T20:48:47Z</dc:date>
    </item>
    <item>
      <title>Re: Data ingestion using flume - Visualize website clickstream data</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140569#M19428</link>
      <description>&lt;P&gt;Thank you.&lt;/P&gt;</description>
      <pubDate>Sun, 14 Feb 2016 21:12:49 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Data-ingestion-using-flume-Visualize-website-clickstream/m-p/140569#M19428</guid>
      <dc:creator>Eukrev</dc:creator>
      <dc:date>2016-02-14T21:12:49Z</dc:date>
    </item>
  </channel>
</rss>

