<?xml version="1.0" encoding="UTF-8"?>
<!--
  RSS 2.0 feed document carrying a single community forum reply.
  The root element declares four namespace prefixes (content, dc, rdf, taxo);
  within this document only the dc prefix is actually used (dc:creator, dc:date).
-->
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <!-- The channel holds the post data directly; this document contains no item elements. -->
  <channel>
    <!-- Subject line of the reply, followed by a link to the message it belongs to. -->
    <title>question Re: Spark Job long GC pauses in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Spark-Job-long-GC-pauses/m-p/282792#M210200</link>
    <!--
      Body of the reply, stored as entity-escaped HTML markup (tags appear as &lt;P&gt;, &lt;BR /&gt;, etc.).
      The element's text spans several physical lines because the escaped LI-CODE section
      contains literal line breaks; that whitespace is part of the text content, so this
      element must not be re-indented or pretty-printed.
    -->
    <description>&lt;P&gt;Hi &lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/71136"&gt;@PARTOMIA09&lt;/a&gt;&amp;nbsp;&lt;BR /&gt;&lt;BR /&gt;One suggestion off the bat is to possibly consider moving to a G1GC policy instead given that you have relatively large heap sizes (30 GB for executors and 16 GB for the driver). Typically the G1GC policy was developed to be better performant for larger heaps (&amp;gt; 8 GB). Try the following and see if that helps:&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;&lt;LI-CODE lang="markup"&gt;--conf "spark.executor.extraJavaOptions=-XX:+UseG1GC -XX:MaxGCPauseMillis=20 -XX:InitiatingHeapOccupancyPercent=35"

--conf "spark.driver.extraJavaOptions=-XX:+UseG1GC -XX:MaxGCPauseMillis=20 -XX:InitiatingHeapOccupancyPercent=35"&lt;/LI-CODE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;U&gt;"The Garbage-First Garbage Collector":&lt;/U&gt;&lt;BR /&gt;&lt;A href="https://www.oracle.com/technetwork/java/javase/tech/g1-intro-jsp-135488.html" target="_blank"&gt;https://www.oracle.com/technetwork/java/javase/tech/g1-intro-jsp-135488.html&lt;/A&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;/P&gt;</description>
    <!--
      Publication timestamp, given twice for the same instant (2019-11-12 22:42:53 UTC):
      pubDate uses the RSS day-name/month-name date form, dc:date uses the ISO 8601 form.
      dc:creator carries the author's display name.
    -->
    <pubDate>Tue, 12 Nov 2019 22:42:53 GMT</pubDate>
    <dc:creator>w@leed</dc:creator>
    <dc:date>2019-11-12T22:42:53Z</dc:date>
  </channel>
</rss>

