<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Log management for Long-running Spark Streaming Jobs on YARN Cluster in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Log-managmement-for-Long-running-Spark-Streaming-Jobs-on/m-p/117586#M55108</link>
    <description>&lt;P&gt;Hi, we need to find a way to maintain and search logs for long-running Spark Streaming jobs on YARN. We have log aggregation disabled in our cluster. We are thinking about Solr/Elasticsearch, and maybe Flume or Kafka, to read the Spark job logs.&lt;/P&gt;&lt;P&gt;Any suggestions on how to implement search on these logs and easily manage them?&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Suri&lt;/P&gt;</description>
    <pubDate>Wed, 22 Feb 2017 00:35:15 GMT</pubDate>
    <dc:creator>SuriNuthalapati</dc:creator>
    <dc:date>2017-02-22T00:35:15Z</dc:date>
    <item>
      <title>Log management for Long-running Spark Streaming Jobs on YARN Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Log-managmement-for-Long-running-Spark-Streaming-Jobs-on/m-p/117586#M55108</link>
      <description>&lt;P&gt;Hi, we need to find a way to maintain and search logs for long-running Spark Streaming jobs on YARN. We have log aggregation disabled in our cluster. We are thinking about Solr/Elasticsearch, and maybe Flume or Kafka, to read the Spark job logs.&lt;/P&gt;&lt;P&gt;Any suggestions on how to implement search on these logs and easily manage them?&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;Suri&lt;/P&gt;</description>
      <pubDate>Wed, 22 Feb 2017 00:35:15 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Log-managmement-for-Long-running-Spark-Streaming-Jobs-on/m-p/117586#M55108</guid>
      <dc:creator>SuriNuthalapati</dc:creator>
      <dc:date>2017-02-22T00:35:15Z</dc:date>
    </item>
    <item>
      <title>Re: Log management for Long-running Spark Streaming Jobs on YARN Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Log-managmement-for-Long-running-Spark-Streaming-Jobs-on/m-p/117587#M55109</link>
      <description>&lt;P&gt;You can achieve this by setting an appropriate value for the following property in yarn-site.xml:&lt;/P&gt;&lt;P&gt;yarn.nodemanager.log-aggregation.roll-monitoring-interval-seconds&lt;/P&gt;&lt;P&gt;YARN will then aggregate the logs for running jobs too.&lt;/P&gt;&lt;P&gt;&lt;A href="https://hadoop.apache.org/docs/r2.6.0/hadoop-yarn/hadoop-yarn-common/yarn-default.xml"&gt;https://hadoop.apache.org/docs/r2.6.0/hadoop-yarn/hadoop-yarn-common/yarn-default.xml&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Suri&lt;/P&gt;</description>
      <pubDate>Thu, 23 Feb 2017 01:37:53 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Log-managmement-for-Long-running-Spark-Streaming-Jobs-on/m-p/117587#M55109</guid>
      <dc:creator>SuriNuthalapati</dc:creator>
      <dc:date>2017-02-23T01:37:53Z</dc:date>
    </item>
  </channel>
</rss>

