<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Tried Search 1.0.0 and Morphline HBase Indexer with no success in Archives of Support Questions (Read Only)</title>
    <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2209#M375</link>
    <description>&lt;P&gt;Hi&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; I tried setting up the HBASE indexer following the guidelines, but didn't see any indexed documents.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; Using CM4.7 Search1.0.0&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; And the steps below:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Added the Indexer Service to the Cluster and the Morphlines File is:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;SOLR_LOCATOR : {
  # Name of solr collection
  collection : hbase-collection1
  
  # ZooKeeper ensemble
  zkHost : "$ZK_HOST" 
}


morphlines : [
{
id : morphline
importCommands : ["com.cloudera.**", "com.ngdata.**"]

commands : [                    
  {
    extractHBaseCells {
      mappings : [
        {
          inputColumn : "data:*"
          outputField : "data" 
          type : string 
          source : value
        }
      ]
    }
  }


  { logDebug { format : "output record: {}", args : ["@{}"] } }
]
}
]&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;and ks_indexer starts successfully&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;then enabled replication on HBase column families.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;created a corresponding SolrCloud collection with following command line:&lt;/P&gt;&lt;PRE&gt;$ solrctl instancedir --generate $HOME/hbase-collection1
$ solrctl instancedir --create hbase-collection1 $HOME/hbase-collection1
$ solrctl collection --create hbase-collection1&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;created an HBase Indexer configuration:&lt;/P&gt;&lt;PRE&gt;$ cat $HOME/morphline-hbase-mapper.xml

&amp;lt;?xml version="1.0"?&amp;gt;
&amp;lt;indexer table="record" mapper="com.ngdata.hbaseindexer.morphline.MorphlineResultToSolrMapper"&amp;gt;

   &amp;lt;!-- The relative or absolute path on the local file system to the morphline configuration file. --&amp;gt;
   &amp;lt;!-- Use relative path "morphlines.conf" for morphlines managed by Cloudera Manager 
   &amp;lt;param name="morphlineFile" value="/etc/hbase-solr/conf/morphlines.conf"/&amp;gt;

   &amp;lt;!-- The optional morphlineId identifies a morphline if there are multiple morphlines in morphlines.conf --&amp;gt;
   &amp;lt;!-- &amp;lt;param name="morphlineId" value="morphline1"/&amp;gt; --&amp;gt;

&amp;lt;/indexer&amp;gt;&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;created a Morphline Configuration File&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;$ cat /etc/hbase-solr/conf/morphlines.conf

morphlines : [
  {
    id : morphline1
    importCommands : ["com.cloudera.cdk.morphline.**", "com.ngdata.**"]

    commands : [                    
      {
        extractHBaseCells {
          mappings : [
            {
              inputColumn : "data:*"
              outputField : "data" 
              type : string 
              source : value
            }

            #{
            #  inputColumn : "data:item"
            #  outputField : "attachment_body" 
            #  type : "byte[]" 
            #  source : value
            #}
          ]
        }
      }

      #for avro use with type : "byte[]" in extractHBaseCells mapping above
      #{ readAvroContainer {} } 
      #{ 
      #  extractAvroPaths {
      #    paths : { 
      #      data : /user_name      
      #    }
      #  }
      #}

      { logTrace { format : "output record: {}", args : ["@{}"] } }    
    ]
  }
]&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Registered an HBase Indexer configuration with the HBase Indexer Service&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;hbase-indexer add-indexer \
--name myIndexer \
--indexer-conf $HOME/morphline-hbase-mapper.xml \
--connection-param solr.zk=localhost:2181/solr \
--connection-param solr.collection=hbase-collection1 \
--zookeeper localhost:2181&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;#hbase-indexer list-indexers&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;myindex&lt;BR /&gt;&amp;nbsp; + Lifecycle state: ACTIVE&lt;BR /&gt;&amp;nbsp; + Incremental indexing state: SUBSCRIBE_AND_CONSUME&lt;BR /&gt;&amp;nbsp; + Batch indexing state: INACTIVE&lt;BR /&gt;&amp;nbsp; + SEP subscription ID: null&lt;BR /&gt;&amp;nbsp; + SEP subscription timestamp: 2013-10-14T19:00:36.262+08:00&lt;BR /&gt;&amp;nbsp; + Connection type: solr&lt;BR /&gt;&amp;nbsp; + Connection params:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + solr.collection = hbase-collection1&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + solr.zk = localhost:2181/solr&lt;BR /&gt;&amp;nbsp; + Indexer config:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 574 bytes, use -dump to see content&lt;BR /&gt;&amp;nbsp; + Batch index config:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; (none)&lt;BR /&gt;&amp;nbsp; + Default batch index config:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; (none)&lt;BR /&gt;&amp;nbsp; + Processes&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + 0 running processes&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + 0 failed processes&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;In solr query, I couldn't find the records which I had put it in hbase , what did I missed?&lt;/P&gt;&lt;P&gt;BTW, before trying search1.0.0, I had tried hbase-indexer from ngdata's github with indexdemo-usr example and succeeded.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Best Regards,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
    <pubDate>Fri, 16 Sep 2022 08:48:56 GMT</pubDate>
    <dc:creator>ooyama</dc:creator>
    <dc:date>2022-09-16T08:48:56Z</dc:date>
    <item>
      <title>Tried Search 1.0.0 and Morphline HBase Indexer with no success</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2209#M375</link>
      <description>&lt;P&gt;Hi&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; I tried setting up the HBASE indexer following the guidelines, but didn't see any indexed documents.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; Using CM4.7 Search1.0.0&lt;/P&gt;&lt;P&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; And the steps below:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Added the Indexer Service to the Cluster and the Morphlines File is:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;SOLR_LOCATOR : {
  # Name of solr collection
  collection : hbase-collection1
  
  # ZooKeeper ensemble
  zkHost : "$ZK_HOST" 
}


morphlines : [
{
id : morphline
importCommands : ["com.cloudera.**", "com.ngdata.**"]

commands : [                    
  {
    extractHBaseCells {
      mappings : [
        {
          inputColumn : "data:*"
          outputField : "data" 
          type : string 
          source : value
        }
      ]
    }
  }


  { logDebug { format : "output record: {}", args : ["@{}"] } }
]
}
]&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;and ks_indexer starts successfully&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;then enabled replication on HBase column families.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;created a corresponding SolrCloud collection with following command line:&lt;/P&gt;&lt;PRE&gt;$ solrctl instancedir --generate $HOME/hbase-collection1
$ solrctl instancedir --create hbase-collection1 $HOME/hbase-collection1
$ solrctl collection --create hbase-collection1&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;created an HBase Indexer configuration:&lt;/P&gt;&lt;PRE&gt;$ cat $HOME/morphline-hbase-mapper.xml

&amp;lt;?xml version="1.0"?&amp;gt;
&amp;lt;indexer table="record" mapper="com.ngdata.hbaseindexer.morphline.MorphlineResultToSolrMapper"&amp;gt;

   &amp;lt;!-- The relative or absolute path on the local file system to the morphline configuration file. --&amp;gt;
   &amp;lt;!-- Use relative path "morphlines.conf" for morphlines managed by Cloudera Manager 
   &amp;lt;param name="morphlineFile" value="/etc/hbase-solr/conf/morphlines.conf"/&amp;gt;

   &amp;lt;!-- The optional morphlineId identifies a morphline if there are multiple morphlines in morphlines.conf --&amp;gt;
   &amp;lt;!-- &amp;lt;param name="morphlineId" value="morphline1"/&amp;gt; --&amp;gt;

&amp;lt;/indexer&amp;gt;&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;created a Morphline Configuration File&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;$ cat /etc/hbase-solr/conf/morphlines.conf

morphlines : [
  {
    id : morphline1
    importCommands : ["com.cloudera.cdk.morphline.**", "com.ngdata.**"]

    commands : [                    
      {
        extractHBaseCells {
          mappings : [
            {
              inputColumn : "data:*"
              outputField : "data" 
              type : string 
              source : value
            }

            #{
            #  inputColumn : "data:item"
            #  outputField : "attachment_body" 
            #  type : "byte[]" 
            #  source : value
            #}
          ]
        }
      }

      #for avro use with type : "byte[]" in extractHBaseCells mapping above
      #{ readAvroContainer {} } 
      #{ 
      #  extractAvroPaths {
      #    paths : { 
      #      data : /user_name      
      #    }
      #  }
      #}

      { logTrace { format : "output record: {}", args : ["@{}"] } }    
    ]
  }
]&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Registered an HBase Indexer configuration with the HBase Indexer Service&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;PRE&gt;hbase-indexer add-indexer \
--name myIndexer \
--indexer-conf $HOME/morphline-hbase-mapper.xml \
--connection-param solr.zk=localhost:2181/solr \
--connection-param solr.collection=hbase-collection1 \
--zookeeper localhost:2181&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;#hbase-indexer list-indexers&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;myindex&lt;BR /&gt;&amp;nbsp; + Lifecycle state: ACTIVE&lt;BR /&gt;&amp;nbsp; + Incremental indexing state: SUBSCRIBE_AND_CONSUME&lt;BR /&gt;&amp;nbsp; + Batch indexing state: INACTIVE&lt;BR /&gt;&amp;nbsp; + SEP subscription ID: null&lt;BR /&gt;&amp;nbsp; + SEP subscription timestamp: 2013-10-14T19:00:36.262+08:00&lt;BR /&gt;&amp;nbsp; + Connection type: solr&lt;BR /&gt;&amp;nbsp; + Connection params:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + solr.collection = hbase-collection1&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + solr.zk = localhost:2181/solr&lt;BR /&gt;&amp;nbsp; + Indexer config:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; 574 bytes, use -dump to see content&lt;BR /&gt;&amp;nbsp; + Batch index config:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; (none)&lt;BR /&gt;&amp;nbsp; + Default batch index config:&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp;&amp;nbsp; (none)&lt;BR /&gt;&amp;nbsp; + Processes&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + 0 running processes&lt;BR /&gt;&amp;nbsp;&amp;nbsp;&amp;nbsp; + 0 failed processes&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;In solr query, I couldn't find the records which I had put it in hbase , what did I missed?&lt;/P&gt;&lt;P&gt;BTW, before trying search1.0.0, I had tried hbase-indexer from ngdata's github with indexdemo-usr example and succeeded.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Best Regards,&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Fri, 16 Sep 2022 08:48:56 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2209#M375</guid>
      <dc:creator>ooyama</dc:creator>
      <dc:date>2022-09-16T08:48:56Z</dc:date>
    </item>
    <item>
      <title>Re: Tried Search 1.0.0 and Morphline HBase Indexer with no success</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2211#M376</link>
      <description>&lt;P&gt;FWIW, there are some funny colon quote chars in the morphline config you posted. Probably just copy n'paste weirdness, but maybe something to double check.&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;Also enable TRACE logging and check the corresponding log files:&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;log4j.logger.com.cloudera.cdk.morphline=TRACE&lt;BR /&gt;log4j.logger.com.ngdata=TRACE&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;</description>
      <pubDate>Tue, 15 Oct 2013 07:51:04 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2211#M376</guid>
      <dc:creator>whosch</dc:creator>
      <dc:date>2013-10-15T07:51:04Z</dc:date>
    </item>
    <item>
      <title>Re: Tried Search 1.0.0 and Morphline HBase Indexer with no success</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2223#M377</link>
      <description>&lt;P&gt;Hi @ooyama&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;&amp;nbsp; &amp;nbsp;Looks like your "&lt;SPAN&gt;HBase Indexer configuration" is wrong.&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;&amp;nbsp; &amp;nbsp;If you notice the XML comments in the morphline-hbase-mapper.xml&lt;/SPAN&gt;, it has commented out all the text including the path to morphline file.&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;&amp;nbsp; &amp;nbsp;Fix:&lt;/SPAN&gt;&lt;/P&gt;&lt;P&gt;&lt;SPAN&gt;&amp;nbsp; &amp;nbsp; &amp;nbsp; &amp;nbsp;&amp;nbsp;&lt;/SPAN&gt;&lt;/P&gt;&lt;PRE&gt;&amp;lt;!-- Use relative path "morphlines.conf" for morphlines managed by Cloudera Manager&lt;/PRE&gt;&lt;PRE&gt;&amp;lt;!-- Use relative path "morphlines.conf" for morphlines managed by Cloudera Manager --&amp;gt;&lt;/PRE&gt;</description>
      <pubDate>Tue, 15 Oct 2013 18:27:18 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2223#M377</guid>
      <dc:creator>Vamsee</dc:creator>
      <dc:date>2013-10-15T18:27:18Z</dc:date>
    </item>
    <item>
      <title>Re: Tried Search 1.0.0 and Morphline HBase Indexer with no success</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2235#M378</link>
      <description>&lt;P&gt;Thank you very much！It's running now!&lt;/P&gt;&lt;P&gt;&amp;nbsp;&lt;/P&gt;&lt;P&gt;And one more question: How could I index the rows in hbase before hbase-indexer add-index? I know there's a command with lily&lt;/P&gt;&lt;PRE&gt;lily-update-index -n nameOfYourIndex --build-state BUILD_REQUESTED&lt;/PRE&gt;&lt;P&gt;&amp;nbsp;What should I suppose to do with Cloudera Search?&lt;/P&gt;</description>
      <pubDate>Wed, 16 Oct 2013 09:15:26 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2235#M378</guid>
      <dc:creator>ooyama</dc:creator>
      <dc:date>2013-10-16T09:15:26Z</dc:date>
    </item>
    <item>
      <title>Re: Tried Search 1.0.0 and Morphline HBase Indexer with no success</title>
      <link>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2245#M379</link>
      <description>We are working on such a feature, should be available soon. Meanwhile you can work around it by touching all cells without significantly modifying them, e.g. by updating the timestamp.&lt;BR /&gt;&lt;BR /&gt;Wolfgang.&lt;BR /&gt;&lt;BR /&gt;</description>
      <pubDate>Wed, 16 Oct 2013 16:09:23 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Archives-of-Support-Questions/Tried-Search-1-0-0-and-Morphline-HBase-Indexer-with-no/m-p/2245#M379</guid>
      <dc:creator>whosch</dc:creator>
      <dc:date>2013-10-16T16:09:23Z</dc:date>
    </item>
  </channel>
</rss>

