<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics. in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133962#M47762</link>
    <description>&lt;P&gt;What is the largest load (MBs or GBs) you have run your use case on?&lt;/P&gt;</description>
    <pubDate>Sat, 17 Dec 2016 02:09:29 GMT</pubDate>
    <dc:creator>gkeys</dc:creator>
    <dc:date>2016-12-17T02:09:29Z</dc:date>
    <item>
      <title>Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133955#M47755</link>
      <description />
      <pubDate>Fri, 02 Dec 2016 06:15:26 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133955#M47755</guid>
      <dc:creator>raviteja_gogata</dc:creator>
      <dc:date>2016-12-02T06:15:26Z</dc:date>
    </item>
    <item>
      <title>Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133956#M47756</link>
      <description>&lt;P&gt;@&lt;A href="https://community.hortonworks.com/users/11346/vijaykumar243.html"&gt;Vijay Kumar J&lt;/A&gt; any idea ? thanks in advance&lt;/P&gt;</description>
      <pubDate>Sun, 04 Dec 2016 08:30:11 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133956#M47756</guid>
      <dc:creator>raviteja_gogata</dc:creator>
      <dc:date>2016-12-04T08:30:11Z</dc:date>
    </item>
    <item>
      <title>Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133957#M47757</link>
      <description>&lt;P&gt;@Greg Keys any idea ? thanks in advance&lt;/P&gt;</description>
      <pubDate>Fri, 16 Dec 2016 00:48:56 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133957#M47757</guid>
      <dc:creator>raviteja_gogata</dc:creator>
      <dc:date>2016-12-16T00:48:56Z</dc:date>
    </item>
    <item>
      <title>Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133958#M47758</link>
      <description>&lt;P&gt;I suggest looking at the merge and saveAsTextFile functions as per bottom post here &lt;A href="http://stackoverflow.com/questions/31666361/process-spark-streaming-rdd-and-store-to-single-hdfs-file" target="_blank"&gt;http://stackoverflow.com/questions/31666361/process-spark-streaming-rdd-and-store-to-single-hdfs-file&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 16 Dec 2016 05:23:32 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133958#M47758</guid>
      <dc:creator>gkeys</dc:creator>
      <dc:date>2016-12-16T05:23:32Z</dc:date>
    </item>
    <item>
      <title>Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133959#M47759</link>
      <description>&lt;P&gt;Hi Greg Keys, thanks for the reply i was using the similar approach, but wondering whether this approach works if spark streaming processing the data in giga bytes ?&lt;/P&gt;</description>
      <pubDate>Fri, 16 Dec 2016 05:58:38 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133959#M47759</guid>
      <dc:creator>raviteja_gogata</dc:creator>
      <dc:date>2016-12-16T05:58:38Z</dc:date>
    </item>
    <item>
      <title>Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133960#M47760</link>
      <description>&lt;P&gt;That is really an issue of scaling (how many nodes and memory per node you have) and multitenancy (which other jobs will run at the same time, particularly spark or other memory-intensive jobs).  The more nodes and the less memory contention, the more data you can process in spark.&lt;/P&gt;</description>
      <pubDate>Fri, 16 Dec 2016 21:47:53 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133960#M47760</guid>
      <dc:creator>gkeys</dc:creator>
      <dc:date>2016-12-16T21:47:53Z</dc:date>
    </item>
    <item>
      <title>Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133961#M47761</link>
      <description>&lt;P&gt;i am working on 12 node cluster with 4 having 126 gigs, 8 having 252 gigs memory.  &lt;/P&gt;</description>
      <pubDate>Sat, 17 Dec 2016 02:07:01 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133961#M47761</guid>
      <dc:creator>raviteja_gogata</dc:creator>
      <dc:date>2016-12-17T02:07:01Z</dc:date>
    </item>
    <item>
      <title>Re: Is it possible to write the spark streaming output to single file in HDFS ? where spark streaming get's the logs from kafka topics.</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133962#M47762</link>
      <description>&lt;P&gt;What is the largest load (MBs or GBs) you have run your use case on?&lt;/P&gt;</description>
      <pubDate>Sat, 17 Dec 2016 02:09:29 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Is-it-possible-to-write-the-spark-streaming-output-to-single/m-p/133962#M47762</guid>
      <dc:creator>gkeys</dc:creator>
      <dc:date>2016-12-17T02:09:29Z</dc:date>
    </item>
  </channel>
</rss>

