<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Best Practices for Deploying Production Hadoop Cluster in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124366#M55443</link>
    <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/488/akanto.html" nodeid="488"&gt;@Attila Kanto&lt;/A&gt; &lt;/P&gt;&lt;P&gt;Thoughts?&lt;/P&gt;</description>
    <pubDate>Fri, 24 Feb 2017 18:46:05 GMT</pubDate>
    <dc:creator>munnyrahul</dc:creator>
    <dc:date>2017-02-24T18:46:05Z</dc:date>
    <item>
      <title>Best Practices for Deploying Production Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124365#M55442</link>
      <description>&lt;P&gt;I am planning to setup a 4 node Production Cluster on Azure VM's. I am planning to have 1 edge Node, 1 Master Node and 2 Slave Nodes. I wanted to setup below mentioned services on that cluster.&lt;/P&gt;&lt;P&gt;1) Namenode&lt;/P&gt;&lt;P&gt;2) Oozie&lt;/P&gt;&lt;P&gt;3) DataNode&lt;/P&gt;&lt;P&gt;4) Yarn&lt;/P&gt;&lt;P&gt;5) Spark&lt;/P&gt;&lt;P&gt;6) Ranger&lt;/P&gt;&lt;P&gt;7) Atlas&lt;/P&gt;&lt;P&gt;8) Knox&lt;/P&gt;&lt;P&gt;9) Hbase&lt;/P&gt;&lt;P&gt;10) SAP Hana Vora&lt;/P&gt;&lt;P&gt;11) Zookeeper&lt;/P&gt;&lt;P&gt;I am actually looking out for any guidelines on Memory, Cores and Storage to be required for different services of hadoop as mentioned above. I need to buy 4 VM's on Azure but i want to understand from Infrastructure perspective that how much memory, cores, Storage would be optimal for above mentioned hadoop services(service wise) ,keeping in mind more services can also be added in future.&lt;/P&gt;&lt;P&gt;Is there any reference documentation/link?&lt;/P&gt;&lt;P&gt;Any help would be appreciated.&lt;/P&gt;&lt;P&gt;Thanks&lt;/P&gt;</description>
      <pubDate>Fri, 24 Feb 2017 18:34:12 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124365#M55442</guid>
      <dc:creator>munnyrahul</dc:creator>
      <dc:date>2017-02-24T18:34:12Z</dc:date>
    </item>
    <item>
      <title>Re: Best Practices for Deploying Production Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124366#M55443</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/488/akanto.html" nodeid="488"&gt;@Attila Kanto&lt;/A&gt; &lt;/P&gt;&lt;P&gt;Thoughts?&lt;/P&gt;</description>
      <pubDate>Fri, 24 Feb 2017 18:46:05 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124366#M55443</guid>
      <dc:creator>munnyrahul</dc:creator>
      <dc:date>2017-02-24T18:46:05Z</dc:date>
    </item>
    <item>
      <title>Re: Best Practices for Deploying Production Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124367#M55444</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/15105/rahgulati.html" nodeid="15105"&gt;@rahul gulati&lt;/A&gt;&lt;/P&gt;&lt;P&gt;See this article on best practices for deploying HDP on Azure: &lt;A target="_blank" href="https://community.hortonworks.com/articles/22376/recommendations-for-microsoft-azure-hdp-deployment-1.html"&gt;https://community.hortonworks.com/articles/22376/recommendations-for-microsoft-azure-hdp-deployment-1.html&lt;/A&gt;&lt;/P&gt;&lt;P&gt;For most production clusters, we typically recommend enabling HA for services.  That requires that you have at a minimum 2 master servers, although 3 would be better.  You need 3 Zookeeper instances.  While you can put Zookeeper on the data nodes, it would be better to put Zookeeper on the master nodes.&lt;/P&gt;</description>
      <pubDate>Fri, 24 Feb 2017 20:17:22 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124367#M55444</guid>
      <dc:creator>myoung</dc:creator>
      <dc:date>2017-02-24T20:17:22Z</dc:date>
    </item>
    <item>
      <title>Re: Best Practices for Deploying Production Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124368#M55445</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2695/myoung.html" nodeid="2695"&gt;@Michael Young&lt;/A&gt; &lt;/P&gt;&lt;P&gt;Thanks!! article is very useful.&lt;/P&gt;</description>
      <pubDate>Fri, 24 Feb 2017 21:12:25 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Best-Practices-for-Deploying-Production-Hadoop-Cluster/m-p/124368#M55445</guid>
      <dc:creator>munnyrahul</dc:creator>
      <dc:date>2017-02-24T21:12:25Z</dc:date>
    </item>
  </channel>
</rss>

