<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: How indexing is done in HDFS? in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149044#M20245</link>
    <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2769/rushikeshdeshmukh007.html" nodeid="2769"&gt;@Rushikesh Deshmukh&lt;/A&gt;  Look at &lt;A rel="user" href="https://community.cloudera.com/users/168/bleonhardi.html" nodeid="168"&gt;@Benjamin Leonhardi&lt;/A&gt; answer.&lt;/P&gt;&lt;P&gt;No, it's not correct.&lt;/P&gt;</description>
    <pubDate>Fri, 19 Feb 2016 19:31:00 GMT</pubDate>
    <dc:creator>nsabharwal</dc:creator>
    <dc:date>2016-02-19T19:31:00Z</dc:date>
    <item>
      <title>How indexing is done in HDFS?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149040#M20241</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;Can anyone explain to me how indexing is done in HDFS?&lt;/P&gt;</description>
      <pubDate>Fri, 19 Feb 2016 14:26:18 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149040#M20241</guid>
      <dc:creator>rushikeshdeshmu</dc:creator>
      <dc:date>2016-02-19T14:26:18Z</dc:date>
    </item>
    <item>
      <title>Re: How indexing is done in HDFS?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149041#M20242</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2769/rushikeshdeshmukh007.html" nodeid="2769"&gt;@Rushikesh Deshmukh&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2769/rushikeshdeshmukh007.html" nodeid="2769"&gt;&lt;/A&gt;See this &lt;A href="http://stackoverflow.com/questions/11954904/indexing-and-searching-in-hadoop" target="_blank"&gt;http://stackoverflow.com/questions/11954904/indexing-and-searching-in-hadoop&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 19 Feb 2016 14:37:07 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149041#M20242</guid>
      <dc:creator>rahulpathak109</dc:creator>
      <dc:date>2016-02-19T14:37:07Z</dc:date>
    </item>
    <item>
      <title>Re: How indexing is done in HDFS?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149042#M20243</link>
      <description>&lt;P&gt;I got the answer below:&lt;/P&gt;&lt;P&gt;Hadoop
has its own way of indexing. Depending upon the block size, once the data
is stored, HDFS will keep on storing the last part of the data which will
say where the next part of the data will be. In fact, this is the base
of HDFS.&lt;/P&gt;&lt;P&gt;-&lt;/P&gt;&lt;P&gt;Is this answer correct?&lt;/P&gt;</description>
      <pubDate>Fri, 19 Feb 2016 14:42:38 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149042#M20243</guid>
      <dc:creator>rushikeshdeshmu</dc:creator>
      <dc:date>2016-02-19T14:42:38Z</dc:date>
    </item>
    <item>
      <title>Re: How indexing is done in HDFS?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149043#M20244</link>
      <description>&lt;P&gt;Hello Rushikesh,&lt;/P&gt;&lt;P&gt;unless I misunderstand something, this is not correct. HDFS doesn't store in the data where the next block is. Instead the Namenode knows which blocks make up a file and also the order of the blocks. Using this, the HDFS client knows which block to load at any time if you seek in the file. &lt;/P&gt;&lt;P&gt;HDFS blocks are stupid, simple 128MB cut blocks of the data. Datanodes are stupid and only know which blocks they have. The Namenode pieces it all together using an in-memory image of all files and blocks that make these files and where they are stored. The clients get this information from the namenode.&lt;/P&gt;&lt;P&gt;Now if you mean full-text indexing then you should look at Solr like Rahul said.&lt;/P&gt;</description>
      <pubDate>Fri, 19 Feb 2016 17:38:41 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149043#M20244</guid>
      <dc:creator>bleonhardi</dc:creator>
      <dc:date>2016-02-19T17:38:41Z</dc:date>
    </item>
    <item>
      <title>Re: How indexing is done in HDFS?</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149044#M20245</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/2769/rushikeshdeshmukh007.html" nodeid="2769"&gt;@Rushikesh Deshmukh&lt;/A&gt;  Look at &lt;A rel="user" href="https://community.cloudera.com/users/168/bleonhardi.html" nodeid="168"&gt;@Benjamin Leonhardi&lt;/A&gt; answer.&lt;/P&gt;&lt;P&gt;No, it's not correct.&lt;/P&gt;</description>
      <pubDate>Fri, 19 Feb 2016 19:31:00 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/How-indexing-is-done-in-HDFS/m-p/149044#M20245</guid>
      <dc:creator>nsabharwal</dc:creator>
      <dc:date>2016-02-19T19:31:00Z</dc:date>
    </item>
  </channel>
</rss>

