Browse Source

AMBARI-2051. Remove hard-coded ports from agent scripts - Nagios. (swagle)

git-svn-id: https://svn.apache.org/repos/asf/incubator/ambari/trunk@1477434 13f79535-47bb-0310-9956-ffa450edef68
Siddharth Wagle 12 years ago
parent
commit
babd00f078

+ 2 - 0
CHANGES.txt

@@ -815,6 +815,8 @@ Trunk (unreleased changes):
 
 
  BUG FIXES
 
 
+ AMBARI-2051. Remove hard-coded ports from agent scripts - Nagios. (swagle)
+
  AMBARI-2045. Add Unit test to verify, client re-install for install failed 
  client. (swagle)
 
 

+ 13 - 13
ambari-agent/src/main/puppet/modules/hdp-nagios/templates/hadoop-services.cfg.erb

@@ -124,7 +124,7 @@ define service {
         use                     hadoop-service
         use                     hadoop-service
         service_description     GANGLIA::Ganglia [gmetad] process down
         service_description     GANGLIA::Ganglia [gmetad] process down
         servicegroups           GANGLIA
         servicegroups           GANGLIA
-        check_command           check_tcp!8651!-w 1 -c 1
+        check_command           check_tcp!<%=scope.function_hdp_template_var("ganglia_port")%>!-w 1 -c 1
         normal_check_interval   0.25
         normal_check_interval   0.25
         retry_check_interval    0.25
         retry_check_interval    0.25
         max_check_attempts      4
         max_check_attempts      4
@@ -135,7 +135,7 @@ define service {
         use                     hadoop-service
         use                     hadoop-service
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for slaves
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for slaves
         servicegroups           GANGLIA
         servicegroups           GANGLIA
-        check_command           check_tcp!8660!-w 1 -c 1
+        check_command           check_tcp!<%=scope.function_hdp_template_var("ganglia_collector_slaves_port")%>!-w 1 -c 1
         normal_check_interval   0.25
         normal_check_interval   0.25
         retry_check_interval    0.25
         retry_check_interval    0.25
         max_check_attempts      4
         max_check_attempts      4
@@ -146,7 +146,7 @@ define service {
         use                     hadoop-service
         use                     hadoop-service
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for NameNode
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for NameNode
         servicegroups           GANGLIA
         servicegroups           GANGLIA
-        check_command           check_tcp!8661!-w 1 -c 1
+        check_command           check_tcp!<%=scope.function_hdp_template_var("ganglia_collector_namenode_port")%>!-w 1 -c 1
         normal_check_interval   0.25
         normal_check_interval   0.25
         retry_check_interval    0.25
         retry_check_interval    0.25
         max_check_attempts      4
         max_check_attempts      4
@@ -157,7 +157,7 @@ define service {
         use                     hadoop-service
         use                     hadoop-service
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for JobTracker
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for JobTracker
         servicegroups           GANGLIA
         servicegroups           GANGLIA
-        check_command           check_tcp!8662!-w 1 -c 1
+        check_command           check_tcp!<%=scope.function_hdp_template_var("ganglia_collector_jobtracker_port")%>!-w 1 -c 1
         normal_check_interval   0.25
         normal_check_interval   0.25
         retry_check_interval    0.25
         retry_check_interval    0.25
         max_check_attempts      4
         max_check_attempts      4
@@ -169,7 +169,7 @@ define service {
         use                     hadoop-service
         use                     hadoop-service
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for HBase Master
         service_description     GANGLIA::Ganglia Collector [gmond] process down alert for HBase Master
         servicegroups           GANGLIA
         servicegroups           GANGLIA
-        check_command           check_tcp!8663!-w 1 -c 1
+        check_command           check_tcp!<%=scope.function_hdp_template_var("ganglia_collector_hbase_port")%>!-w 1 -c 1
         normal_check_interval   0.25
         normal_check_interval   0.25
         retry_check_interval    0.25
         retry_check_interval    0.25
         max_check_attempts      4
         max_check_attempts      4
@@ -231,7 +231,7 @@ define service {
         use                     hadoop-service
         use                     hadoop-service
         service_description     NAMENODE::NameNode process down
         service_description     NAMENODE::NameNode process down
         servicegroups           HDFS
         servicegroups           HDFS
-        check_command           check_tcp!8020!-w 1 -c 1
+        check_command           check_tcp!<%=scope.function_hdp_template_var("namenode_metadata_port")%>!-w 1 -c 1
         normal_check_interval   0.5
         normal_check_interval   0.5
         retry_check_interval    0.25
         retry_check_interval    0.25
         max_check_attempts      3
         max_check_attempts      3
@@ -377,7 +377,7 @@ define service {
         use                     hadoop-service
         use                     hadoop-service
         service_description     ZOOKEEPER::ZooKeeper Server process down
         service_description     ZOOKEEPER::ZooKeeper Server process down
         servicegroups           ZOOKEEPER
         servicegroups           ZOOKEEPER
-        check_command           check_tcp!2181!-w 1 -c 1
+        check_command           check_tcp!<%=scope.function_hdp_template_var("clientPort")%>!-w 1 -c 1
         normal_check_interval   1
         normal_check_interval   1
         retry_check_interval    0.5
         retry_check_interval    0.5
         max_check_attempts      3
         max_check_attempts      3
@@ -440,9 +440,9 @@ define service {
         service_description     HIVE-METASTORE::Hive Metastore status check
         service_description     HIVE-METASTORE::Hive Metastore status check
         servicegroups           HIVE-METASTORE
         servicegroups           HIVE-METASTORE
         <%if scope.function_hdp_template_var("security_enabled")-%>
         <%if scope.function_hdp_template_var("security_enabled")-%>
-        check_command           check_hive_metastore_status!9083!<%=scope.function_hdp_template_var("java64_home")%>!true!<%=scope.function_hdp_template_var("keytab_path")%>/<%=scope.function_hdp_template_var("nagios_user")%>.headless.keytab!<%=scope.function_hdp_template_var("nagios_user")%>!<%=scope.function_hdp_template_var("kinit_path_local")%>/"/usr/bin/kinit"
+        check_command           check_hive_metastore_status!<%=scope.function_hdp_template_var("hive_metastore_port")%>!<%=scope.function_hdp_template_var("java64_home")%>!true!<%=scope.function_hdp_template_var("keytab_path")%>/<%=scope.function_hdp_template_var("nagios_user")%>.headless.keytab!<%=scope.function_hdp_template_var("nagios_user")%>!<%=scope.function_hdp_template_var("kinit_path_local")%>/"/usr/bin/kinit"
         <%else-%>
         <%else-%>
-        check_command           check_hive_metastore_status!9083!<%=scope.function_hdp_template_var("java64_home")%>!false
+        check_command           check_hive_metastore_status!<%=scope.function_hdp_template_var("hive_metastore_port")%>!<%=scope.function_hdp_template_var("java64_home")%>!false
         <%end-%>
         <%end-%>
         normal_check_interval   0.5
         normal_check_interval   0.5
         retry_check_interval    0.5
         retry_check_interval    0.5
@@ -457,9 +457,9 @@ define service {
         service_description     OOZIE::Oozie Server status check
         service_description     OOZIE::Oozie Server status check
         servicegroups           OOZIE
         servicegroups           OOZIE
         <%if scope.function_hdp_template_var("security_enabled")-%>
         <%if scope.function_hdp_template_var("security_enabled")-%>
-        check_command           check_oozie_status!11000!<%=scope.function_hdp_template_var("java64_home")%>!true!<%=scope.function_hdp_template_var("keytab_path")%>/<%=scope.function_hdp_template_var("nagios_user")%>.headless.keytab!<%=scope.function_hdp_template_var("nagios_user")%>!<%=scope.function_hdp_template_var("kinit_path_local")%>/"/usr/bin/kinit"
+        check_command           check_oozie_status!<%=scope.function_hdp_template_var("oozie_server_port")%>!<%=scope.function_hdp_template_var("java64_home")%>!true!<%=scope.function_hdp_template_var("keytab_path")%>/<%=scope.function_hdp_template_var("nagios_user")%>.headless.keytab!<%=scope.function_hdp_template_var("nagios_user")%>!<%=scope.function_hdp_template_var("kinit_path_local")%>/"/usr/bin/kinit"
         <%else-%>
         <%else-%>
-        check_command           check_oozie_status!11000!<%=scope.function_hdp_template_var("java64_home")%>!false
+        check_command           check_oozie_status!<%=scope.function_hdp_template_var("oozie_server_port")%>!<%=scope.function_hdp_template_var("java64_home")%>!false
         <%end-%>
         <%end-%>
         normal_check_interval   1
         normal_check_interval   1
         retry_check_interval    1
         retry_check_interval    1
@@ -474,9 +474,9 @@ define service {
         service_description     WEBHCAT::WebHCat Server status check
         service_description     WEBHCAT::WebHCat Server status check
         servicegroups           WEBHCAT 
         servicegroups           WEBHCAT 
         <%if scope.function_hdp_template_var("security_enabled")-%>
         <%if scope.function_hdp_template_var("security_enabled")-%>
-        check_command           check_templeton_status!50111!v1!true!<%=scope.function_hdp_template_var("keytab_path")%>/<%=scope.function_hdp_template_var("nagios_user")%>.headless.keytab!<%=scope.function_hdp_template_var("nagios_user")%>!<%=scope.function_hdp_template_var("kinit_path_local")%>/"/usr/bin/kinit"
+        check_command           check_templeton_status!<%=scope.function_hdp_template_var("templeton_port")%>!v1!true!<%=scope.function_hdp_template_var("keytab_path")%>/<%=scope.function_hdp_template_var("nagios_user")%>.headless.keytab!<%=scope.function_hdp_template_var("nagios_user")%>!<%=scope.function_hdp_template_var("kinit_path_local")%>/"/usr/bin/kinit"
         <%else-%>
         <%else-%>
-        check_command           check_templeton_status!50111!v1!false
+        check_command           check_templeton_status!<%=scope.function_hdp_template_var("templeton_port")%>!v1!false
         <%end-%>
         <%end-%>
         normal_check_interval   1
         normal_check_interval   1
         retry_check_interval    0.5
         retry_check_interval    0.5

+ 12 - 0
ambari-agent/src/main/puppet/modules/hdp/manifests/init.pp

@@ -56,6 +56,18 @@ class hdp(
   $hbase_master_port = hdp_default("hbase-site/hbase.master.info.port","60010")
   $hbase_master_port = hdp_default("hbase-site/hbase.master.info.port","60010")
   $hbase_rs_port = hdp_default("hbase-site/hbase.regionserver.info.port","60030")
   $hbase_rs_port = hdp_default("hbase-site/hbase.regionserver.info.port","60030")
   
   
+  $ganglia_port = hdp_default("ganglia_port","8651")
+  $ganglia_collector_slaves_port = hdp_default("ganglia_collector_slaves_port","8660")
+  $ganglia_collector_namenode_port = hdp_default("ganglia_collector_namenode_port","8661")
+  $ganglia_collector_jobtracker_port = hdp_default("ganglia_collector_jobtracker_port","8662")
+  $ganglia_collector_hbase_port = hdp_default("ganglia_collector_hbase_port","8663")
+
+  $oozie_server_port = hdp_default("oozie_server_port","11000")
+
+  $templeton_port = hdp_default("webhcat-site/templeton.port","50111")
+
+  $namenode_metadata_port = hdp_default("namenode_metadata_port","8020")
+  
   #TODO: think not needed and also there seems to be a puppet bug around this and ldap
   #TODO: think not needed and also there seems to be a puppet bug around this and ldap
   class { 'hdp::snmp': service_state => 'running'}
   class { 'hdp::snmp': service_state => 'running'}