<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Need Cloudera CDP Consultant - Spark Job Performance Tuning in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412603#M253564</link>
    <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/132856"&gt;@Brenda99&lt;/a&gt;,&amp;nbsp;&lt;/P&gt;&lt;P&gt;The question is very broad; there are many things that can help improve performance.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Some basic recommendations are documented here:&amp;nbsp;&lt;BR /&gt;&lt;A href="https://docs.cloudera.com/cdp-private-cloud-base/7.3.1/tuning-spark/topics/spark-admin_spark_tuning.html" target="_blank"&gt;https://docs.cloudera.com/cdp-private-cloud-base/7.3.1/tuning-spark/topics/spark-admin_spark_tuning.html&lt;/A&gt;&amp;nbsp;&lt;BR /&gt;Take a look at the documentation; it could help you.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Also, it would be worth talking with the team in charge of your account to get a deeper performance tuning analysis.&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Mon, 06 Oct 2025 20:18:46 GMT</pubDate>
    <dc:creator>vafs</dc:creator>
    <dc:date>2025-10-06T20:18:46Z</dc:date>
    <item>
      <title>Need Cloudera CDP Consultant - Spark Job Performance Tuning</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412509#M253501</link>
      <description>&lt;P class="whitespace-normal break-words"&gt;Looking for help with Cloudera Data Platform Spark job optimization. We're running large-scale ETL jobs that are timing out during the shuffle phase, consuming excessive cluster resources and causing memory spillage.&lt;/P&gt;&lt;P class="whitespace-normal break-words"&gt;The jobs process ~500GB datasets but execution times have increased 3x after migrating to CDP. Need someone experienced with Spark tuning on Cloudera and YARN resource management to identify bottlenecks.&lt;/P&gt;&lt;P class="whitespace-normal break-words"&gt;Seeking 3-4 hours remote performance analysis to optimize job configuration and cluster settings. Must be resolved by Tuesday for our data pipeline SLA.&lt;/P&gt;</description>
      <pubDate>Fri, 26 Sep 2025 12:43:11 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412509#M253501</guid>
      <dc:creator>Brenda99</dc:creator>
      <dc:date>2025-09-26T12:43:11Z</dc:date>
    </item>
    <item>
      <title>Re: Need Cloudera CDP Consultant - Spark Job Performance Tuning</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412526#M253515</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/132856"&gt;@Brenda99&lt;/a&gt;&amp;nbsp;Welcome to the Cloudera Community!&lt;BR /&gt;&lt;BR /&gt;To help you get the best possible solution, I have tagged our CDP experts &lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/13587"&gt;@venkatsambath&lt;/a&gt;&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/79328"&gt;@abdulpasithali&lt;/a&gt;&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/95611"&gt;@upadhyayk04&lt;/a&gt;&amp;nbsp;who may be able to assist you further.&lt;BR /&gt;&lt;BR /&gt;Please keep us updated on your post, and we hope you find a satisfactory solution to your query.&lt;/P&gt;</description>
      <pubDate>Fri, 26 Sep 2025 17:01:12 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412526#M253515</guid>
      <dc:creator>DianaTorres</dc:creator>
      <dc:date>2025-09-26T17:01:12Z</dc:date>
    </item>
    <item>
      <title>Re: Need Cloudera CDP Consultant - Spark Job Performance Tuning</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412527#M253516</link>
      <description>&lt;P&gt;Hi Brenda,&lt;/P&gt;&lt;P&gt;I have extensive experience optimizing Spark jobs on CDP and dealing with shuffle-heavy workloads.&lt;/P&gt;&lt;P&gt;Your timeout issues during shuffle phase sound like a combination of executor memory settings and partition strategy problems, pretty common after CDP migrations actually.&lt;/P&gt;&lt;P&gt;I can help diagnose the bottlenecks through Spark UI analysis and YARN logs, then tune your spark.sql.shuffle.partitions and executor configurations.&lt;/P&gt;&lt;P&gt;Have successfully reduced similar ETL job runtimes by 60-70% for other clients facing post-migration performance degradation.&lt;/P&gt;&lt;P&gt;You can reach out to me on my &lt;A href="mailto:colinwilliams8254@gmail.com" target="_self"&gt;email here&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Colin&lt;/P&gt;</description>
      <pubDate>Mon, 29 Sep 2025 12:23:32 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412527#M253516</guid>
      <dc:creator>Colin4</dc:creator>
      <dc:date>2025-09-29T12:23:32Z</dc:date>
    </item>
    <item>
      <title>Re: Need Cloudera CDP Consultant - Spark Job Performance Tuning</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412603#M253564</link>
      <description>&lt;P&gt;Hello&amp;nbsp;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/132856"&gt;@Brenda99&lt;/a&gt;,&amp;nbsp;&lt;/P&gt;&lt;P&gt;The question is very broad; there are many things that can help improve performance.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Some basic recommendations are documented here:&amp;nbsp;&lt;BR /&gt;&lt;A href="https://docs.cloudera.com/cdp-private-cloud-base/7.3.1/tuning-spark/topics/spark-admin_spark_tuning.html" target="_blank"&gt;https://docs.cloudera.com/cdp-private-cloud-base/7.3.1/tuning-spark/topics/spark-admin_spark_tuning.html&lt;/A&gt;&amp;nbsp;&lt;BR /&gt;Take a look at the documentation; it could help you.&amp;nbsp;&lt;/P&gt;&lt;P&gt;Also, it would be worth talking with the team in charge of your account to get a deeper performance tuning analysis.&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 06 Oct 2025 20:18:46 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Need-Cloudera-CDP-Consultant-Spark-Job-Performance-Tuning/m-p/412603#M253564</guid>
      <dc:creator>vafs</dc:creator>
      <dc:date>2025-10-06T20:18:46Z</dc:date>
    </item>
  </channel>
</rss>

