<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Spark YARN Configuration on HDP 2.4 Recommendations in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155362#M117801</link>
    <description>&lt;P&gt;Thanks &lt;A rel="user" href="https://community.cloudera.com/users/332/vshukla.html" nodeid="332"&gt;@vshukla&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/9304/tspann.html" nodeid="9304"&gt;@Timothy Spann&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/2528/jyadav.html" nodeid="2528"&gt;@Jitendra Yadav&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/524/yimai.html" nodeid="524"&gt;@Yuta Imai&lt;/A&gt;&lt;/P&gt;</description>
    <pubDate>Thu, 19 May 2016 18:37:57 GMT</pubDate>
    <dc:creator>smartninja723</dc:creator>
    <dc:date>2016-05-19T18:37:57Z</dc:date>
    <item>
      <title>Spark YARN Configuration on HDP 2.4 Recommendations</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155356#M117795</link>
      <description>&lt;P&gt;Hi Guys,&lt;/P&gt;&lt;P&gt;We have successfully configured Spark on YARN using Ambari on HDP 2.4 with default parameters. However, I would like to know which parameters we can tune for best performance. Should we have separate queues for Spark jobs? The use cases are yet to be decided, but primarily we want to replace old MR jobs, experiment with Spark Streaming, and probably also use DataFrames. How many Spark Thrift Server instances are recommended?&lt;/P&gt;&lt;P&gt;The cluster has 20 nodes, each with 256 GB RAM and 36 cores. Load from other jobs is generally 5%. &lt;/P&gt;&lt;P&gt;Many thanks.&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2016 01:42:23 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155356#M117795</guid>
      <dc:creator>smartninja723</dc:creator>
      <dc:date>2016-05-19T01:42:23Z</dc:date>
    </item>
    <item>
      <title>Re: Spark YARN Configuration on HDP 2.4 Recommendations</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155357#M117796</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/524/yimai.html" nodeid="524"&gt;@Yuta Imai&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/104/sball.html" nodeid="104"&gt;@Simon Elliston Ball&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/140/nsabharwal.html" nodeid="140"&gt;@Neeraj Sabharwal&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2016 01:44:58 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155357#M117796</guid>
      <dc:creator>smartninja723</dc:creator>
      <dc:date>2016-05-19T01:44:58Z</dc:date>
    </item>
    <item>
      <title>Re: Spark YARN Configuration on HDP 2.4 Recommendations</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155358#M117797</link>
      <description>&lt;A rel="user" href="https://community.cloudera.com/users/3021/smartninja723.html" nodeid="3021"&gt;@Smart Solutions&lt;/A&gt;&lt;P&gt;Below is the official doc for Spark tuning on YARN: &lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.hortonworks.com/HDPDocuments/HDP2/HDP-2.3.2/bk_spark-guide/content/ch_tuning-spark.html" target="_blank"&gt;https://docs.hortonworks.com/HDPDocuments/HDP2/HDP-2.3.2/bk_spark-guide/content/ch_tuning-spark.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Generally, we see people create queues to segregate resources between different department groups within a company, or on the basis of application type, such as ETL, real time, and so on. Therefore, it depends on what your use case is and how you are going to share the cluster resources between groups/applications. For the Spark Thrift Server, it's better to have a single instance within a cluster unless you have hundreds of Thrift clients running and submitting jobs at the same time. &lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2016 03:06:34 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155358#M117797</guid>
      <dc:creator>jyadav</dc:creator>
      <dc:date>2016-05-19T03:06:34Z</dc:date>
    </item>
    <item>
      <title>Re: Spark YARN Configuration on HDP 2.4 Recommendations</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155359#M117798</link>
      <description>&lt;P&gt;Please see Running Spark in Production session from Hadoop Summit, Dublin. See the section on perf tuning.&lt;/P&gt;&lt;P&gt;&lt;A href="http://www.slideshare.net/vinnies12/running-spark-in-production"&gt;Slides&lt;/A&gt;, &lt;A href="https://youtu.be/OkyRdKahMpk"&gt;video&lt;/A&gt; about executor selection&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2016 04:54:29 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155359#M117798</guid>
      <dc:creator>vshukla</dc:creator>
      <dc:date>2016-05-19T04:54:29Z</dc:date>
    </item>
    <item>
      <title>Re: Spark YARN Configuration on HDP 2.4 Recommendations</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155360#M117799</link>
      <description>&lt;P&gt;Updated for 2.4&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.hortonworks.com/HDPDocuments/HDP2/HDP-2.4.2/bk_spark-guide/content/ch_tuning-spark.html" target="_blank"&gt;https://docs.hortonworks.com/HDPDocuments/HDP2/HDP-2.4.2/bk_spark-guide/content/ch_tuning-spark.html&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2016 09:13:41 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155360#M117799</guid>
      <dc:creator>TimothySpann</dc:creator>
      <dc:date>2016-05-19T09:13:41Z</dc:date>
    </item>
    <item>
      <title>Re: Spark YARN Configuration on HDP 2.4 Recommendations</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155361#M117800</link>
      <description>&lt;P&gt;If you have 256 GB/node, leave out at least 2 GB &amp;amp; 1 core for the OS, more if there is something else running on the node. Then start with 5 cores/executor &amp;amp; 30 GB/executor. So about 7 executors/node.&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2016 11:40:26 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155361#M117800</guid>
      <dc:creator>vshukla</dc:creator>
      <dc:date>2016-05-19T11:40:26Z</dc:date>
    </item>
    <item>
      <title>Re: Spark YARN Configuration on HDP 2.4 Recommendations</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155362#M117801</link>
      <description>&lt;P&gt;Thanks &lt;A rel="user" href="https://community.cloudera.com/users/332/vshukla.html" nodeid="332"&gt;@vshukla&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/9304/tspann.html" nodeid="9304"&gt;@Timothy Spann&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/2528/jyadav.html" nodeid="2528"&gt;@Jitendra Yadav&lt;/A&gt;, &lt;A rel="user" href="https://community.cloudera.com/users/524/yimai.html" nodeid="524"&gt;@Yuta Imai&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Thu, 19 May 2016 18:37:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Spark-YARN-Configuration-on-HDP-2-4-Recommendations/m-p/155362#M117801</guid>
      <dc:creator>smartninja723</dc:creator>
      <dc:date>2016-05-19T18:37:57Z</dc:date>
    </item>
  </channel>
</rss>

