<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: CDH Hardware requirements for a small cluster in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/301640#M220785</link>
    <description>&lt;P&gt;Maybe we will exclude Impala from this list to save resources. Hive is enough for now.&lt;/P&gt;</description>
    <pubDate>Wed, 19 Aug 2020 08:53:09 GMT</pubDate>
    <dc:creator>tol2000</dc:creator>
    <dc:date>2020-08-19T08:53:09Z</dc:date>
    <item>
      <title>CDH Hardware requirements for a small cluster</title>
      <link>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/301611#M220775</link>
      <description>&lt;DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;Hello!&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;Please help me with the minimal hardware requirements for our small cluster.&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&amp;nbsp;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;We decided to build a very small, highly available production cluster for archiving purposes, based on Cloudera CDH 6.3.3 (community version).&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;Planned storage size: about 10-20 TiB&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;Workload planning:&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; every 2 minutes, ETL of about 500-1000 rows of data from an external Oracle database to local Parquet files&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; periodic (very rare) analytic Hive queries that search through all of the Parquet files&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; periodic (very rare) ad-hoc Spark tasks with the same goals as above&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;Components:&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; Cloudera manager&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; HDFS&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; Hive&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; Hue&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; Impala&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; Spark&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; Yarn with MR2&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; ZooKeeper&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;-&lt;/SPAN&gt;&lt;SPAN&gt; Streamsets parcel (as a part of cloudera)&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;We want to use only 3 hosts (no more), and the failure of any one of these hosts must not bring down the whole system.&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;So we plan to place all of the above components on all of the hosts.&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;In other words, each component will be on each host.&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;DIV&gt;&lt;SPAN&gt;Is this a normal and workable setup, or can someone advise a different layout?&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;We also want to know: can we place the HDFS NameNode and Cloudera Manager on only 2 hosts, or is it better to put these components on all three hosts as well?&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;And, finally, what are the minimal RAM, CPU and disk storage requirements for each of these three hosts?&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;BR /&gt;
&lt;DIV&gt;&lt;SPAN&gt;Big thanks in advance!&lt;/SPAN&gt;&lt;/DIV&gt;
&lt;/DIV&gt;</description>
      <pubDate>Fri, 16 Sep 2022 14:38:35 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/301611#M220775</guid>
      <dc:creator>tol2000</dc:creator>
      <dc:date>2022-09-16T14:38:35Z</dc:date>
    </item>
    <item>
      <title>Re: CDH Hardware requirements for a small cluster</title>
      <link>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/301640#M220785</link>
      <description>&lt;P&gt;Maybe we will exclude Impala from this list to save resources. Hive is enough for now.&lt;/P&gt;</description>
      <pubDate>Wed, 19 Aug 2020 08:53:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/301640#M220785</guid>
      <dc:creator>tol2000</dc:creator>
      <dc:date>2020-08-19T08:53:09Z</dc:date>
    </item>
    <item>
      <title>Re: CDH Hardware requirements for a small cluster</title>
      <link>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/301775#M220841</link>
      <description>&lt;P&gt;&lt;a href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/79622"&gt;@tol2000&lt;/a&gt;&amp;nbsp;This guide may be a good start for you.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;A href="https://docs.cloudera.com/documentation/enterprise/6/release-notes/topics/rg_hardware_requirements.html#concept_vvv_cxt_gbb" target="_blank"&gt;https://docs.cloudera.com/documentation/enterprise/6/release-notes/topics/rg_hardware_requirements.html#concept_vvv_cxt_gbb&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 21 Aug 2020 18:22:14 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/301775#M220841</guid>
      <dc:creator>GangWar</dc:creator>
      <dc:date>2020-08-21T18:22:14Z</dc:date>
    </item>
    <item>
      <title>Re: CDH Hardware requirements for a small cluster</title>
      <link>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/303265#M221463</link>
      <description>&lt;P&gt;Thank you. I started thinking about it from exactly this resource &lt;span class="lia-unicode-emoji" title=":slightly_smiling_face:"&gt;🙂&lt;/span&gt; Not everything is clear to me yet, but now I have a rough idea about this question; it's all very individual, I understand. Thank you. This question is closed )&lt;/P&gt;</description>
      <pubDate>Wed, 23 Sep 2020 09:41:09 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/CDH-Hardware-requirements-for-a-small-cluster/m-p/303265#M221463</guid>
      <dc:creator>tol2000</dc:creator>
      <dc:date>2020-09-23T09:41:09Z</dc:date>
    </item>
  </channel>
</rss>

