<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Delete application logs from spark history specifying date in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Delete-application-logs-from-spark-history-specifying-date/m-p/376363#M242883</link>
    <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/102259"&gt;@Emanuel_MXN&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;It is generally not recommended to keep event logs older than a few days or months. In your case, you are keeping logs for years.&amp;nbsp;&lt;/P&gt;&lt;P&gt;To avoid keeping the old logs, please add the following parameters to the&amp;nbsp;&lt;SPAN&gt;spark-defaults.conf file&lt;/SPAN&gt; and delete old event logs based on your needs.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;spark.history.fs.cleaner.enabled true
spark.history.fs.cleaner.maxAge  7d
spark.history.fs.cleaner.interval 1h&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I don't have a handy script to delete files from HDFS for a specific date/year. If I find one, I will definitely share it here.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Fri, 15 Sep 2023 01:32:05 GMT</pubDate>
    <dc:creator>RangaReddy</dc:creator>
    <dc:date>2023-09-15T01:32:05Z</dc:date>
    <item>
      <title>Delete application logs from spark history specifying date</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Delete-application-logs-from-spark-history-specifying-date/m-p/376360#M242880</link>
      <description>&lt;P&gt;from&lt;/P&gt;
&lt;P&gt;&lt;SPAN&gt;hdfs dfs -du -h /&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;we see that the Spark history takes up a lot of space in HDFS.&lt;/P&gt;
&lt;P&gt;I want to delete only the logs&amp;nbsp;that I specify, for example all those from particular years such as 2019, and keep the rest.&lt;/P&gt;
&lt;P&gt;If I use the command&lt;BR /&gt;&lt;SPAN&gt;hdfs dfs -rm -R /spark2-history/*&lt;/SPAN&gt;&lt;/P&gt;
&lt;P&gt;this deletes everything, and I do not want to delete everything.&lt;/P&gt;
&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Thu, 21 Sep 2023 14:24:45 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Delete-application-logs-from-spark-history-specifying-date/m-p/376360#M242880</guid>
      <dc:creator>Emanuel_MXN</dc:creator>
      <dc:date>2023-09-21T14:24:45Z</dc:date>
    </item>
    <item>
      <title>Re: Delete application logs from spark history specifying date</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Delete-application-logs-from-spark-history-specifying-date/m-p/376363#M242883</link>
      <description>&lt;P&gt;Hi&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/102259"&gt;@Emanuel_MXN&lt;/a&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;It is generally not recommended to keep event logs older than a few days or months. In your case, you are keeping logs for years.&amp;nbsp;&lt;/P&gt;&lt;P&gt;To avoid keeping the old logs, please add the following parameters to the&amp;nbsp;&lt;SPAN&gt;spark-defaults.conf file&lt;/SPAN&gt; and delete old event logs based on your needs.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;spark.history.fs.cleaner.enabled true
spark.history.fs.cleaner.maxAge  7d
spark.history.fs.cleaner.interval 1h&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I don't have a handy script to delete files from HDFS for a specific date/year. If I find one, I will definitely share it here.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 15 Sep 2023 01:32:05 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Delete-application-logs-from-spark-history-specifying-date/m-p/376363#M242883</guid>
      <dc:creator>RangaReddy</dc:creator>
      <dc:date>2023-09-15T01:32:05Z</dc:date>
    </item>
    <item>
      <title>Re: Delete application logs from spark history specifying date</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Delete-application-logs-from-spark-history-specifying-date/m-p/376836#M243027</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/102259"&gt;@Emanuel_MXN&lt;/a&gt;,&amp;nbsp;Has the reply helped resolve your issue? If so, please mark the appropriate reply as the solution, as it will make it easier for others to find the answer in the future.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 26 Sep 2023 09:42:32 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Delete-application-logs-from-spark-history-specifying-date/m-p/376836#M243027</guid>
      <dc:creator>VidyaSargur</dc:creator>
      <dc:date>2023-09-26T09:42:32Z</dc:date>
    </item>
  </channel>
</rss>

