<?xml version="1.0" encoding="UTF-8"?>
<rss xmlns:content="http://purl.org/rss/1.0/modules/content/" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#" xmlns:taxo="http://purl.org/rss/1.0/modules/taxonomy/" version="2.0">
  <channel>
    <title>question Re: Cannot start Ambari-metrics-collector in Support Questions</title>
    <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116568#M79362</link>
    <description>&lt;P&gt;Hi Olivier,&lt;/P&gt;&lt;P&gt;It is version 2.1.2.1&lt;/P&gt;</description>
    <pubDate>Thu, 07 Jul 2016 00:11:10 GMT</pubDate>
    <dc:creator>akafazov</dc:creator>
    <dc:date>2016-07-07T00:11:10Z</dc:date>
    <item>
      <title>Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116566#M79360</link>
      <description>&lt;P&gt;Hi,&lt;/P&gt;&lt;P&gt;I am having difficulties getting the ambari-metrics-collector to start. I have HBase running in distributed mode.&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5549-ambari-metrics-collectorlog.txt"&gt;ambari-metrics-collectorlog.txt&lt;/A&gt; I have attached the ambari-metrics-collector.log.&lt;/P&gt;&lt;P&gt;I already tried the suggestions from this thread: &lt;A href="https://community.hortonworks.com/questions/15818/ambari-metrics-collector-now-starting.html" target="_blank"&gt;https://community.hortonworks.com/questions/15818/ambari-metrics-collector-now-starting.html&lt;/A&gt; as well as the workaround for issue 6 here: &lt;A href="https://cwiki.apache.org/confluence/display/AMBARI/Known+Issues" target="_blank"&gt;https://cwiki.apache.org/confluence/display/AMBARI/Known+Issues&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Any tips would be much appreciated.&lt;/P&gt;</description>
      <pubDate>Wed, 06 Jul 2016 22:33:10 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116566#M79360</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-06T22:33:10Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116567#M79361</link>
      <description>&lt;P&gt;Which version of Ambari are you using? &lt;/P&gt;</description>
      <pubDate>Wed, 06 Jul 2016 23:08:48 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116567#M79361</guid>
      <dc:creator>orenault</dc:creator>
      <dc:date>2016-07-06T23:08:48Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116568#M79362</link>
      <description>&lt;P&gt;Hi Olivier,&lt;/P&gt;&lt;P&gt;It is version 2.1.2.1&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 00:11:10 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116568#M79362</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-07T00:11:10Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116569#M79363</link>
      <description>&lt;P&gt;2016-07-06 14:59:14,466 INFO org.apache.zookeeper.ZooKeeper: Initiating client connection, connectString=m2.domain:2181 sessionTimeout=120000 watcher=hconnection-         0x7bc9e6ab0x0, quorum=m2.domain:2181, baseZNode=/hbase-secure&lt;/P&gt;&lt;P&gt;Looks like AMS tried to connect to hbase cluster's znode.&lt;/P&gt;&lt;P&gt;AMS should use /ams-hbase-secure as base znode.&lt;/P&gt;&lt;P&gt;Can you check your configuration ?&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 00:22:55 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116569#M79363</guid>
      <dc:creator>tyu</dc:creator>
      <dc:date>2016-07-07T00:22:55Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116570#M79364</link>
      <description>&lt;P&gt;Hi, I changed it, but now I am getting&lt;/P&gt;&lt;P&gt;2016-07-06 17:55:20,187 ERROR org.apache.hadoop.hbase.client.ConnectionManager$HConnectionImplementation: The node /ams-hbase-secure is not in ZooKeeper. It should have been written by the master. Check the value configured in 'zookeeper.znode.parent'. There could be a mismatch with the one configured in the master.&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 00:56:46 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116570#M79364</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-07T00:56:46Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116571#M79365</link>
      <description>&lt;P&gt;Hi Angel,&lt;/P&gt;&lt;P&gt;From your error, it looks like AMS is talking to the cluster zookeeper (port 2181). AMS in version 2.1.2.1 uses its own zookeeper in all modes of operation (port 61181). &lt;/P&gt;&lt;P&gt;Can you share your hbase-site.xml in /etc/ams-hbase/conf ? That will help us figure out the issue.&lt;/P&gt;&lt;P&gt;Thanks!&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 01:20:08 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116571#M79365</guid>
      <dc:creator>avijayan</dc:creator>
      <dc:date>2016-07-07T01:20:08Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116572#M79366</link>
      <description>&lt;P&gt;Please revert the znode setting to the default if the cluster is not kerberized: &lt;/P&gt;&lt;PRE&gt;/ams-hbase-unsecure&lt;/PRE&gt;&lt;P&gt;Also, make sure the quorum value in ams-hbase-site is:&lt;/P&gt;&lt;P&gt;hbase.zookeeper.quorum&lt;/P&gt;&lt;P&gt;{{zookeeper_quorum_hosts}}&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 01:21:54 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116572#M79366</guid>
      <dc:creator>sidwagle</dc:creator>
      <dc:date>2016-07-07T01:21:54Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116573#M79367</link>
      <description>&lt;P&gt;Hi swagle,&lt;/P&gt;&lt;P&gt;the cluster is kerberized. hbase.zookeeper.quorum looks ok&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 01:41:24 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116573#M79367</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-07T01:41:24Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116574#M79368</link>
      <description>&lt;P&gt;@&lt;A href="https://community.hortonworks.com/users/10765/akafazov.html"&gt;Angel Kafazov&lt;/A&gt;&lt;/P&gt;&lt;P&gt;The attached doc should help.&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 04:37:19 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116574#M79368</guid>
      <dc:creator>Shelton</dc:creator>
      <dc:date>2016-07-07T04:37:19Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116575#M79369</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/10765/akafazov.html" nodeid="10765"&gt;@Angel Kafazov&lt;/A&gt; We need to look at the Master, RS and ZK logs to identify the issue. Can you upload them from /var/log/ambari-metrics-collector/ ?&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 11:19:57 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116575#M79369</guid>
      <dc:creator>sidwagle</dc:creator>
      <dc:date>2016-07-07T11:19:57Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116576#M79370</link>
      <description>&lt;P&gt;@&lt;A href="https://community.hortonworks.com/users/10765/akafazov.html"&gt;Angel Kafazov&lt;/A&gt;&lt;/P&gt;&lt;P&gt;Did you take note of no. 9 "zookeeper.znode.parent" and restart all the components?&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 11:36:03 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116576#M79370</guid>
      <dc:creator>Shelton</dc:creator>
      <dc:date>2016-07-07T11:36:03Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116577#M79371</link>
      <description>&lt;P&gt;&lt;A rel="user" href="https://community.cloudera.com/users/1271/sheltong.html" nodeid="1271"&gt;@Geoffrey Shelton Okot&lt;/A&gt; The document suggests setting the zookeeper.znode.parent to the same value as HBase service which is somewhat incorrect for versions &amp;gt; 2.1.2.1. Prior to 2.2, the value was not set so it defaulted to /hbase, this was ok because AMS started its own ZK. Post 2.2, AMS talks to cluster ZK and thereby the znode is set to /ams-hbase-(unsecure/secure).&lt;/P&gt;&lt;P&gt;Logs would indicate whether TGT was acquired correctly and if the problem is something totally different.&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 13:02:17 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116577#M79371</guid>
      <dc:creator>sidwagle</dc:creator>
      <dc:date>2016-07-07T13:02:17Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116578#M79372</link>
      <description>&lt;P&gt;Hi Geoffrey,&lt;/P&gt;&lt;P&gt;In HBase config I have:&lt;/P&gt;&lt;P&gt;zookeeper.znode.parent=/hbase-secure&lt;/P&gt;&lt;P&gt;In Ambari metrics:&lt;/P&gt;&lt;P&gt;zookeeper.znode.parent=/ams-hbase-secure&lt;/P&gt;&lt;P&gt;I am not sure if those must be the same.&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 14:08:39 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116578#M79372</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-07T14:08:39Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116579#M79373</link>
      <description>&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5602-hbase-ams-master-m2-trunkatedlog.txt"&gt;hbase-ams-master-m2-trunkatedlog.txt&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5603-hbase-ams-zookeeper-m2log.txt"&gt;hbase-ams-zookeeper-m2log.txt&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5604-hbase-ams-regionserver-m2log.txt"&gt;hbase-ams-regionserver-m2log.txt&lt;/A&gt;&lt;/P&gt;&lt;P&gt;sorry for the delay&lt;/P&gt;</description>
      <pubDate>Thu, 07 Jul 2016 21:38:42 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116579#M79373</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-07T21:38:42Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116580#M79374</link>
      <description>&lt;P&gt;Both the Master and Region Server logs indicate a failure to log in to Kerberos.&lt;/P&gt;&lt;PRE&gt;Login failure for amshbasemaster/m2.DOMAIN@DOMAIN from keytab /etc/security/keytabs/ams-hbase.regionserver.keytab: javax.security.auth.login.LoginException: Unable to obtain password from user&lt;/PRE&gt;&lt;P&gt;Can you check whether you can manually log in with the ams keytabs under /etc/security/keytabs/ams*.keytab?&lt;/P&gt;&lt;P&gt;Example: kinit -kt /etc/security/keytabs/ams-hbase.regionserver.keytab amshbasemaster/m2.DOMAIN@DOMAIN&lt;/P&gt;</description>
      <pubDate>Fri, 08 Jul 2016 02:03:29 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116580#M79374</guid>
      <dc:creator>sidwagle</dc:creator>
      <dc:date>2016-07-08T02:03:29Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116581#M79375</link>
      <description>&lt;P&gt;I have attached the master, zk and rs logs.&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5587-hbase-ams-master-m2-trunkatedlog.txt"&gt;hbase-ams-master-m2-trunkatedlog.txt&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5587-hbase-ams-master-m2-trunkatedlog.txt"&gt;&lt;/A&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5588-hbase-ams-zookeeper-m2log.txt"&gt;hbase-ams-zookeeper-m2log.txt&lt;/A&gt;&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5588-hbase-ams-zookeeper-m2log.txt"&gt;&lt;/A&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5589-hbase-ams-regionserver-m2log.txt"&gt;hbase-ams-regionserver-m2log.txt&lt;/A&gt;&lt;/P&gt;&lt;P&gt;There seems to be an authentication issue in the RS:&lt;/P&gt;&lt;PRE&gt;2016-07-06 11:42:43,688 ERROR [main] regionserver.HRegionServerCommandLine: Region server exiting
java.lang.RuntimeException: Failed construction of Regionserver: class org.apache.hadoop.hbase.regionserver.HRegionServer
at org.apache.hadoop.hbase.regionserver.HRegionServer.constructRegionServer(HRegionServer.java:2636)
at org.apache.hadoop.hbase.regionserver.HRegionServerCommandLine.start(HRegionServerCommandLine.java:64)
at org.apache.hadoop.hbase.regionserver.HRegionServerCommandLine.run(HRegionServerCommandLine.java:87)
at org.apache.hadoop.util.ToolRunner.run(ToolRunner.java:70)
at org.apache.hadoop.hbase.util.ServerCommandLine.doMain(ServerCommandLine.java:126)
at org.apache.hadoop.hbase.regionserver.HRegionServer.main(HRegionServer.java:2651)
Caused by: java.lang.reflect.InvocationTargetException
at sun.reflect.NativeConstructorAccessorImpl.newInstance0(Native Method)
at sun.reflect.NativeConstructorAccessorImpl.newInstance(NativeConstructorAccessorImpl.java:62)
at sun.reflect.DelegatingConstructorAccessorImpl.newInstance(DelegatingConstructorAccessorImpl.java:45)
at java.lang.reflect.Constructor.newInstance(Constructor.java:422)
at org.apache.hadoop.hbase.regionserver.HRegionServer.constructRegionServer(HRegionServer.java:2634)
... 5 more
Caused by: java.io.IOException: Login failure for amshbasemaster/m2.DOMAIN@DOMAIN from keytab /etc/security/keytabs/ams-hbase.regionserver.keytab: javax.security.auth.login.LoginException: Unable to obtain password from user
at org.apache.hadoop.security.UserGroupInformation.loginUserFromKeytab(UserGroupInformation.java:962)
at org.apache.hadoop.security.SecurityUtil.login(SecurityUtil.java:246)
at org.apache.hadoop.hbase.security.User$SecureHadoopUser.login(User.java:386)
at org.apache.hadoop.hbase.security.User.login(User.java:253)
at org.apache.hadoop.hbase.security.UserProvider.login(UserProvider.java:115)
at org.apache.hadoop.hbase.regionserver.HRegionServer.login(HRegionServer.java:612)
at org.apache.hadoop.hbase.regionserver.HRegionServer.&amp;lt;init&amp;gt;(HRegionServer.java:550)
... 10 more
Caused by: javax.security.auth.login.LoginException: Unable to obtain password from user
at com.sun.security.auth.module.Krb5LoginModule.promptForPass(Krb5LoginModule.java:897)
at com.sun.security.auth.module.Krb5LoginModule.attemptAuthentication(Krb5LoginModule.java:760)
at com.sun.security.auth.module.Krb5LoginModule.login(Krb5LoginModule.java:617)
at sun.reflect.NativeMethodAccessorImpl.invoke0(Native Method)
at sun.reflect.NativeMethodAccessorImpl.invoke(NativeMethodAccessorImpl.java:62)
at sun.reflect.DelegatingMethodAccessorImpl.invoke(DelegatingMethodAccessorImpl.java:43)
at java.lang.reflect.Method.invoke(Method.java:497)
at javax.security.auth.login.LoginContext.invoke(LoginContext.java:755)
at javax.security.auth.login.LoginContext.access$000(LoginContext.java:195)
at javax.security.auth.login.LoginContext$4.run(LoginContext.java:682)
at javax.security.auth.login.LoginContext$4.run(LoginContext.java:680)
at java.security.AccessController.doPrivileged(Native Method)
at javax.security.auth.login.LoginContext.invokePriv(LoginContext.java:680)
at javax.security.auth.login.LoginContext.login(LoginContext.java:587)
at org.apache.hadoop.security.UserGroupInformation.loginUserFromKeytab(UserGroupInformation.java:953)
... 16 more&lt;/PRE&gt;&lt;P&gt;ZOOKEEPER:&lt;/P&gt;&lt;PRE&gt;ERROR [main] quorum.QuorumPeerConfig: Invalid configuration, only one server specified (ignoring)&lt;/PRE&gt;&lt;P&gt;MASTER: &lt;/P&gt;&lt;PRE&gt;2016-07-06 10:48:18,075 WARN  [main-SendThread(localhost:61181)] zookeeper.ClientCnxn: Session 0x155bfd1eb150003 for server null, unexpected error, closing socket connection and attempting reconnect
java.net.ConnectException: Connection refused
at sun.nio.ch.SocketChannelImpl.checkConnect(Native Method)
at sun.nio.ch.SocketChannelImpl.finishConnect(SocketChannelImpl.java:717)
at org.apache.zookeeper.ClientCnxnSocketNIO.doTransport(ClientCnxnSocketNIO.java:361)
at org.apache.zookeeper.ClientCnxn$SendThread.run(ClientCnxn.java:1081)
2016-07-06 10:48:20,103 INFO  [main-SendThread(localhost:61181)] zookeeper.ClientCnxn: Opening socket connection to server localhost/127.0.0.1:61181. Will not attempt to authenticate using SASL (unknown error)
2016-07-06 10:48:20,104 WARN  [main-SendThread(localhost:61181)] zookeeper.ClientCnxn: Session 0x155bfd1eb150003 for server null, unexpected error, closing socket connection and attempting reconnect
java.net.ConnectException: Connection refused
at sun.nio.ch.SocketChannelImpl.checkConnect(Native Method)
at sun.nio.ch.SocketChannelImpl.finishConnect(SocketChannelImpl.java:717)
at org.apache.zookeeper.ClientCnxnSocketNIO.doTransport(ClientCnxnSocketNIO.java:361)
at org.apache.zookeeper.ClientCnxn$SendThread.run(ClientCnxn.java:1081)
2016-07-06 10:48:21,724 INFO  [main-SendThread(localhost:61181)] zookeeper.ClientCnxn: Opening socket connection to server localhost/127.0.0.1:61181. Will not attempt to authenticate using SASL (unknown error)
2016-07-06 10:48:21,725 WARN  [main-SendThread(localhost:61181)] zookeeper.ClientCnxn: Session 0x155bfd1eb150003 for server null, unexpected error, closing socket connection and attempting reconnect
java.net.ConnectException: Connection refused
at sun.nio.ch.SocketChannelImpl.checkConnect(Native Method)
at sun.nio.ch.SocketChannelImpl.finishConnect(SocketChannelImpl.java:717)
at org.apache.zookeeper.ClientCnxnSocketNIO.doTransport(ClientCnxnSocketNIO.java:361)
at org.apache.zookeeper.ClientCnxn$SendThread.run(ClientCnxn.java:1081)
2016-07-06 10:48:21,825 WARN  [RS:0;m2:49385] zookeeper.RecoverableZooKeeper: Possibly transient ZooKeeper, quorum=localhost:61181, exception=org.apache.zookeeper.KeeperException$ConnectionLossException: KeeperErrorCode = ConnectionLoss for /hbase/rs/m2.tmaut.tlabsdata.com,49385,1467802057410
2016-07-06 10:48:21,826 ERROR [RS:0;m2:49385] zookeeper.RecoverableZooKeeper: ZooKeeper delete failed after 4 attempts
2016-07-06 10:48:21,826 WARN  [RS:0;m2:49385] regionserver.HRegionServer: Failed deleting my ephemeral node
org.apache.zookeeper.KeeperException$ConnectionLossException: KeeperErrorCode = ConnectionLoss for /hbase/rs/m2.tmaut.tlabsdata.com,49385,1467802057410
at org.apache.zookeeper.KeeperException.create(KeeperException.java:99)
at org.apache.zookeeper.KeeperException.create(KeeperException.java:51)
at org.apache.zookeeper.ZooKeeper.delete(ZooKeeper.java:873)
at org.apache.hadoop.hbase.zookeeper.RecoverableZooKeeper.delete(RecoverableZooKeeper.java:178)
at org.apache.hadoop.hbase.zookeeper.ZKUtil.deleteNode(ZKUtil.java:1345)
at org.apache.hadoop.hbase.zookeeper.ZKUtil.deleteNode(ZKUtil.java:1334)
at org.apache.hadoop.hbase.regionserver.HRegionServer.deleteMyEphemeralNode(HRegionServer.java:1403)
at org.apache.hadoop.hbase.regionserver.HRegionServer.run(HRegionServer.java:1079)
at java.lang.Thread.run(Thread.java:745)
&lt;/PRE&gt;</description>
      <pubDate>Fri, 08 Jul 2016 02:50:34 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116581#M79375</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-08T02:50:34Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116582#M79376</link>
      <description>&lt;P&gt;
	So I removed the ambari-metrics service and added it again (moving to another node didn't work). I also made some changes:&lt;/P&gt;&lt;P&gt;
	- switch to distributed mode&lt;/P&gt;&lt;P&gt;
	- modified zookeeper.znode.parent=/hbase-secure&lt;/P&gt;&lt;P&gt;
	- manually recreated  ams.collector.keytab and zk.service.keytab due to authentication errors in the log&lt;/P&gt;&lt;P&gt;
	- changed hbase.zookeeper.property.clientPort to 2181 from 61181&lt;/P&gt;&lt;P&gt;
	- changed rootdir from local to HDFS&lt;/P&gt;&lt;P&gt;
	I think I am getting close as AMS can connect to zookeeper:&lt;/P&gt;
&lt;PRE&gt;INFO org.apache.phoenix.query.ConnectionQueryServicesImpl: Successfull login to secure cluster!!
&lt;/PRE&gt;&lt;P&gt;
	However I am getting error connecting to HBase&lt;/P&gt;
&lt;PRE&gt;WARN org.apache.hadoop.yarn.server.applicationhistoryservice.metrics.timeline.query.DefaultPhoenixDataSource: Unable to connect to HBase store using Phoenix.
java.sql.SQLException: ERROR 103 (08004): Unable to establish connection.
&lt;/PRE&gt;&lt;P&gt;I'll attach the logs in a comment&lt;/P&gt;</description>
      <pubDate>Fri, 08 Jul 2016 18:59:50 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116582#M79376</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-08T18:59:50Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116583#M79377</link>
      <description>&lt;P&gt;logs&lt;/P&gt;&lt;P&gt;&lt;A href="https://community.cloudera.com/legacyfs/online/attachments/5647-ambari-metrics-collectorlog.txt"&gt;ambari-metrics-collectorlog.txt&lt;/A&gt;&lt;/P&gt;</description>
      <pubDate>Fri, 08 Jul 2016 19:06:49 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116583#M79377</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-08T19:06:49Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116584#M79378</link>
      <description>&lt;P&gt;I found a wrong rootdir hostname; after fixing that I am getting:&lt;/P&gt;&lt;PRE&gt;2016-07-08 12:44:39,320 INFO org.apache.zookeeper.ClientCnxn: Opening socket connection to server m2.domain/172.16.164.131:2181. Will not attempt to authenticate using SASL (unknown error)
2016-07-08 12:44:39,321 INFO org.apache.zookeeper.ClientCnxn: Socket connection established to m2.domain/172.16.164.131:2181, initiating session
2016-07-08 12:44:39,328 INFO org.apache.zookeeper.ClientCnxn: Session establishment complete on server m2.domain/172.16.164.131:2181, sessionid = 0x255ca408b8d0063, negotiated timeout = 40000
2016-07-08 12:44:50,376 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:45:07,243 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:45:16,166 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:45:32,517 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:45:54,803 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:46:10,720 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:46:37,467 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:47:01,600 WARN org.apache.hadoop.hbase.ipc.AbstractRpcClient: Couldn't setup connection for amshbase/m2.domain@domain to amshbasemaster/m1.domain@domain
2016-07-08 12:47:01,600 INFO org.apache.hadoop.hbase.client.RpcRetryingCaller: Call exception, tries=10, retries=35, started=142264 ms ago, cancelled=false, msg=&lt;/PRE&gt;</description>
      <pubDate>Fri, 08 Jul 2016 19:51:35 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116584#M79378</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-08T19:51:35Z</dc:date>
    </item>
    <item>
      <title>Re: Cannot start Ambari-metrics-collector</title>
      <link>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116585#M79379</link>
      <description>&lt;P&gt;Also moving ambari-metrics-collector to another host fails in the wizard with the following error:&lt;/P&gt;&lt;PRE&gt;stderr: 
Traceback (most recent call last):
  File "/var/lib/ambari-agent/cache/common-services/AMBARI_METRICS/0.1.0/package/scripts/service_check.py", line 165, in &amp;lt;module&amp;gt;
    AMSServiceCheck().execute()
  File "/usr/lib/python2.6/site-packages/resource_management/libraries/script/script.py", line 216, in execute
    method(env)
  File "/usr/lib/python2.6/site-packages/ambari_commons/os_family_impl.py", line 89, in thunk
    return fn(*args, **kwargs)
  File "/var/lib/ambari-agent/cache/common-services/AMBARI_METRICS/0.1.0/package/scripts/service_check.py", line 92, in service_check
    raise Fail("Metrics were not saved. Service check has failed. "
resource_management.core.exceptions.Fail: Metrics were not saved. Service check has failed. 
Connection failed.
 stdout:
2016-07-08 15:41:07,832 - Ambari Metrics service check was started.
2016-07-08 15:41:07,844 - Generated metrics:
{
  "metrics": [
    {
      "metricname": "AMBARI_METRICS.SmokeTest.FakeMetric",
      "appid": "amssmoketestfake",
      "hostname": "w1.domain",
      "timestamp": 1467992467000,
      "starttime": 1467992467000,
      "metrics": {
        "1467992467000": 0.113469705131,
        "1467992468000": 1467992467000
      }
    }
  ]
}
2016-07-08 15:41:07,844 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:41:17,856 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:41:17,857 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:41:27,867 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:41:27,867 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:41:37,878 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:41:37,878 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:41:47,891 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:41:47,892 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:41:57,904 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:41:57,905 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:42:07,919 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:42:07,919 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:42:17,929 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:42:17,930 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:42:27,941 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:42:27,942 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/
2016-07-08 15:42:37,956 - Connection failed. Next retry in 10 seconds.
2016-07-08 15:42:37,956 - Connecting (POST) to w3.domain:6188/ws/v1/timeline/metrics/&lt;/PRE&gt;</description>
      <pubDate>Fri, 08 Jul 2016 22:42:40 GMT</pubDate>
      <guid>https://community.cloudera.com/t5/Support-Questions/Cannot-start-Ambari-metrics-collector/m-p/116585#M79379</guid>
      <dc:creator>akafazov</dc:creator>
      <dc:date>2016-07-08T22:42:40Z</dc:date>
    </item>
  </channel>
</rss>

