<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: 3 Nodes Hadoop Cluster in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21369#M3604</link>
    <description>&lt;P&gt;hello&amp;nbsp;&lt;SPAN&gt;&lt;A target="_self" href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/8587"&gt;ZKhan&lt;/A&gt;&amp;nbsp;,&lt;BR /&gt;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;thanks for the reply; by your response to my question you meant that the HW is sufficient&amp;nbsp;conditional on a 10TB hard drive for each machine, but my whole data set is 10GB,&amp;nbsp;so why do I need 10TB for each machine?&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;thank you in advance,&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Mon, 10 Nov 2014 16:41:37 GMT</pubDate>
    <dc:creator>ahmed1988</dc:creator>
    <dc:date>2014-11-10T16:41:37Z</dc:date>
    <item>
      <title>3 Nodes Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21349#M3602</link>
      <description>&lt;P&gt;&lt;SPAN style="color: #000000; font-size: 12pt;"&gt;Hello I am trying to Setup a Hadoop environment with commodity hardware, in short I want to perform predictive analysis and learn more about Hadoop environment. by performing the analysis on Twitter data using various algorithms such as Clustering, Topic Modeling and Sentiment Analysis, the size of my data set is 10GB with approximately 10000000 tweets. and I have the following hardware specification :&lt;/SPAN&gt;&lt;/P&gt;&lt;P class="discussion details full"&gt;&lt;BR /&gt;&lt;SPAN style="color: #993300; font-size: 12pt;"&gt;&lt;STRONG&gt;One Desktop Quad Core processor 8GB ram &lt;/STRONG&gt;&lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN style="color: #993300; font-size: 12pt;"&gt;&lt;STRONG&gt;and two Desktops with Quad Core processor and 4GB ram .&lt;/STRONG&gt;&lt;/SPAN&gt;&lt;BR /&gt;&lt;BR /&gt;&lt;SPAN style="font-size: 14pt; color: #000000;"&gt;My questions: &lt;/SPAN&gt;&lt;BR /&gt;&lt;SPAN style="font-size: 14pt; color: #000000;"&gt;Is the hardware specification sufficient for the given tasks or do I need to Upgrade the hardware ?&lt;/SPAN&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 16 Sep 2022 09:12:16 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21349#M3602</guid>
      <dc:creator>ahmed1988</dc:creator>
      <dc:date>2022-09-16T09:12:16Z</dc:date>
    </item>
    <item>
      <title>Re: 3 Nodes Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21361#M3603</link>
      <description>&lt;P&gt;Hi Ahmed,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Given hardware specification is sufficient to run a cluster of 3 nodes. Make sure you have an ample amount of disk space to run these operations. Approx 10TB each.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks and Regards,&lt;/P&gt;&lt;P&gt;ZKhan&lt;/P&gt;</description>
      <pubDate>Mon, 10 Nov 2014 16:04:39 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21361#M3603</guid>
      <dc:creator>ZKhan</dc:creator>
      <dc:date>2014-11-10T16:04:39Z</dc:date>
    </item>
    <item>
      <title>Re: 3 Nodes Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21369#M3604</link>
      <description>&lt;P&gt;hello&amp;nbsp;&lt;SPAN&gt;&lt;A target="_self" href="https://community.cloudera.com/t5/user/viewprofilepage/user-id/8587"&gt;ZKhan&lt;/A&gt;&amp;nbsp;,&lt;BR /&gt;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;thanks for the reply; by your response to my question you meant that the HW is sufficient&amp;nbsp;conditional on a 10TB hard drive for each machine, but my whole data set is 10GB,&amp;nbsp;so why do I need 10TB for each machine?&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;thank you in advance,&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 10 Nov 2014 16:41:37 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21369#M3604</guid>
      <dc:creator>ahmed1988</dc:creator>
      <dc:date>2014-11-10T16:41:37Z</dc:date>
    </item>
    <item>
      <title>Re: 3 Nodes Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21381#M3605</link>
      <description>&lt;P&gt;Hello,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;It's recommended to have this much of disk space to run HDFS operations smoothly. It's nice to have but not have to have..!!&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Thanks,&lt;/P&gt;&lt;P&gt;ZKhan&lt;/P&gt;</description>
      <pubDate>Mon, 10 Nov 2014 19:39:47 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21381#M3605</guid>
      <dc:creator>ZKhan</dc:creator>
      <dc:date>2014-11-10T19:39:47Z</dc:date>
    </item>
    <item>
      <title>Re: 3 Nodes Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21389#M3606</link>
      <description>&lt;P&gt;It depends a lot on just what you mean by 'analysis'. 1 machine could be just fine. In general I think you will want to play with Spark, and Spark loves memory. So 8GB RAM seems a bit small, but 4 cores is OK, and I bet you have plenty of disk space.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;I do not agree at all that you need 10TB of disk space. That is orders of magnitude overkill for a 10GB data set.&lt;/P&gt;</description>
      <pubDate>Mon, 10 Nov 2014 22:14:31 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21389#M3606</guid>
      <dc:creator>srowen</dc:creator>
      <dc:date>2014-11-10T22:14:31Z</dc:date>
    </item>
    <item>
      <title>Re: 3 Nodes Hadoop Cluster</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21390#M3607</link>
      <description>&lt;P&gt;hello&amp;nbsp;&amp;nbsp;srowen,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;what I meant by analysis is using Mahout algorithms on top of a Hadoop cluster, as well as MapReduce preprocessing tasks, for instance tokenization, stemming and translation of 10 million tweets.&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;thank you&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Mon, 10 Nov 2014 22:18:27 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/3-Nodes-Hadoop-Cluster/m-p/21390#M3607</guid>
      <dc:creator>ahmed1988</dc:creator>
      <dc:date>2014-11-10T22:18:27Z</dc:date>
    </item>
  </channel>
</rss>

