|
@@ -0,0 +1,656 @@
|
|
|
+{
|
|
|
+ "href" : "http://dev01.hortonworks.com:8080/api/v1/clusters/c1/host_components?fields=HostRoles/nagios_alerts&HostRoles/component_name=NAGIOS_SERVER",
|
|
|
+ "items" : [
|
|
|
+ {
|
|
|
+ "href" : "http://dev01.hortonworks.com:8080/api/v1/clusters/c1/hosts/dev01.hortonworks.com/host_components/NAGIOS_SERVER",
|
|
|
+ "HostRoles" : {
|
|
|
+ "cluster_name" : "c1",
|
|
|
+ "component_name" : "NAGIOS_SERVER",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "nagios_alerts" : {
|
|
|
+ "alerts" : [
|
|
|
+ {
|
|
|
+ "service_description" : "Check ambari-agent process",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: Ambari agent is running [PID:15240]",
|
|
|
+ "last_hard_state_change" : "1375291083",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308183",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308183",
|
|
|
+ "service_type" : "AMBARI"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "DataNode process down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.016 second response time on port 50075",
|
|
|
+ "last_hard_state_change" : "1375296186",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308426",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375294732",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308426",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "DataNode storage full",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: Capacity:[52844687359], Remaining Capacity:[45285249024], percent_full:[14.305010991256]",
|
|
|
+ "last_hard_state_change" : "1375291089",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308189",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308189",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia Collector [gmond] process down alert for HBase Master",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.002 second response time on port 8663",
|
|
|
+ "last_hard_state_change" : "1375291092",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308426",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308426",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia Collector [gmond] process down alert for History Server 2",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.001 second response time on port 8666",
|
|
|
+ "last_hard_state_change" : "1375291095",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308420",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308420",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia Collector [gmond] process down alert for JobTracker",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "4",
|
|
|
+ "current_state" : "2",
|
|
|
+ "plugin_output" : "Connection refused",
|
|
|
+ "last_hard_state_change" : "1375291143",
|
|
|
+ "last_hard_state" : "2",
|
|
|
+ "last_time_ok" : "0",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375308423",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308423",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia Collector [gmond] process down alert for NameNode",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.006 second response time on port 8661",
|
|
|
+ "last_hard_state_change" : "1375291101",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308426",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308426",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia Collector [gmond] process down alert for Node Manager",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.002 second response time on port 8660",
|
|
|
+ "last_hard_state_change" : "1375291104",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308416",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308416",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia Collector [gmond] process down alert for Resource Manager",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.002 second response time on port 8664",
|
|
|
+ "last_hard_state_change" : "1375291107",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308426",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308426",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia Collector [gmond] process down alert for slaves",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.005 second response time on port 8660",
|
|
|
+ "last_hard_state_change" : "1375291110",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308420",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308420",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Ganglia [gmetad] process down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.018 second response time on port 8651",
|
|
|
+ "last_hard_state_change" : "1375291113",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308423",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308423",
|
|
|
+ "service_type" : "GANGLIA"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Percent RegionServers down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "3",
|
|
|
+ "current_state" : "2",
|
|
|
+ "plugin_output" : "CRITICAL: total:<1>, affected:<1>",
|
|
|
+ "last_hard_state_change" : "1375298856",
|
|
|
+ "last_hard_state" : "2",
|
|
|
+ "last_time_ok" : "1375298796",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375308426",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308426",
|
|
|
+ "service_type" : "HBASE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "HBase Master CPU utilization",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "1 CPU, load 22.0% < 200% : OK",
|
|
|
+ "last_hard_state_change" : "1375291118",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308218",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308218",
|
|
|
+ "service_type" : "HBASE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "HBase Master Web UI down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "3",
|
|
|
+ "current_state" : "1",
|
|
|
+ "plugin_output" : "WARNING: HBase Master web UI not accessible : http://dev01.hortonworks.com:60010/master-status",
|
|
|
+ "last_hard_state_change" : "1375299171",
|
|
|
+ "last_hard_state" : "1",
|
|
|
+ "last_time_ok" : "1375298991",
|
|
|
+ "last_time_warning" : "1375308411",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308411",
|
|
|
+ "service_type" : "HBASE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "HBase Master process down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "4",
|
|
|
+ "current_state" : "2",
|
|
|
+ "plugin_output" : "Connection refused",
|
|
|
+ "last_hard_state_change" : "1375299104",
|
|
|
+ "last_hard_state" : "2",
|
|
|
+ "last_time_ok" : "1375299029",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375308404",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308404",
|
|
|
+ "service_type" : "HBASE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Corrupt/Missing blocks",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: corrupt_blocks:<>, missing_blocks:<>, total_blocks:<>",
|
|
|
+ "last_hard_state_change" : "1375291127",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308407",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308407",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "HDFS capacity utilization",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: DFSUsedGB:<0.2>, DFSTotalGB:<42.4>",
|
|
|
+ "last_hard_state_change" : "1375291130",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375307930",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375307930",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "NameNode RPC latency",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: RpcQueueTime_avg_time:<0> Secs, RpcProcessingTime_avg_time:<0> Secs",
|
|
|
+ "last_hard_state_change" : "1375291133",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308233",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308233",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Percent DataNodes down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: total:<1>, affected:<0>",
|
|
|
+ "last_hard_state_change" : "1375296206",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308416",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375294782",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308416",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Percent DataNodes storage full",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: total:<1>, affected:<0>",
|
|
|
+ "last_hard_state_change" : "1375291139",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308419",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308419",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Hive Metastore status check",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: Hive metaserver status OK",
|
|
|
+ "last_hard_state_change" : "1375291472",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308422",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375290048",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308422",
|
|
|
+ "service_type" : "HIVE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "History Server 2 CPU utilization",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "1 CPU, load 18.0% < 200% : OK",
|
|
|
+ "last_hard_state_change" : "1375291145",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308245",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308245",
|
|
|
+ "service_type" : "UNKNOWN"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "History Server 2 RPC latency",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: RpcQueueTime_avg_time:<0> Secs, RpcProcessingTime_avg_time:<0> Secs",
|
|
|
+ "last_hard_state_change" : "1375291148",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308248",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308248",
|
|
|
+ "service_type" : "UNKNOWN"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "History Server 2 Web UI down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: Successfully accessed historyserver2 Web UI",
|
|
|
+ "last_hard_state_change" : "1375291511",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308371",
|
|
|
+ "last_time_warning" : "1375295397",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308371",
|
|
|
+ "service_type" : "UNKNOWN"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Percent TaskTrackers down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: total:<0>, affected:<0>",
|
|
|
+ "last_hard_state_change" : "1375291153",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308403",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308403",
|
|
|
+ "service_type" : "MAPREDUCE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Nagios status log staleness",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "NAGIOS OK: 2 processes, status log updated 5 seconds ago",
|
|
|
+ "last_hard_state_change" : "1375291156",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308256",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308256",
|
|
|
+ "service_type" : "NAGIOS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "NameNode Web UI down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: Successfully accessed namenode Web UI",
|
|
|
+ "last_hard_state_change" : "1375296199",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308379",
|
|
|
+ "last_time_warning" : "1375294745",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308379",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "NameNode edit logs directory status",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: All Namenode directories are active",
|
|
|
+ "last_hard_state_change" : "1375296202",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308412",
|
|
|
+ "last_time_warning" : "1375294778",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308412",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "NameNode host CPU utilization",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "1 CPU, load 26.0% < 200% : OK",
|
|
|
+ "last_hard_state_change" : "1375291165",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308265",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308265",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "NameNode process down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.000 second response time on port 8020",
|
|
|
+ "last_hard_state_change" : "1375296208",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308418",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375294784",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308418",
|
|
|
+ "service_type" : "HDFS"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Node Manager process down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.001 second response time on port 8042",
|
|
|
+ "last_hard_state_change" : "1375296571",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308391",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375295117",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308391",
|
|
|
+ "service_type" : "UNKNOWN"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Oozie Server status check",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: Oozie server status [System mode: NORMAL]",
|
|
|
+ "last_hard_state_change" : "1375291534",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308394",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375295660",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308394",
|
|
|
+ "service_type" : "OOZIE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "RegionServer process down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "3",
|
|
|
+ "current_state" : "2",
|
|
|
+ "plugin_output" : "Connection refused",
|
|
|
+ "last_hard_state_change" : "1375298857",
|
|
|
+ "last_hard_state" : "2",
|
|
|
+ "last_time_ok" : "1375297343",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375308397",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308397",
|
|
|
+ "service_type" : "HBASE"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Resource Manager CPU utilization",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "1 CPU, load 24.0% < 200% : OK",
|
|
|
+ "last_hard_state_change" : "1375291180",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308281",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308281",
|
|
|
+ "service_type" : "UNKNOWN"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Resource Manager RPC latency",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: RpcQueueTime_avg_time:<0> Secs, RpcProcessingTime_avg_time:<0> Secs",
|
|
|
+ "last_hard_state_change" : "1375291183",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308283",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308283",
|
|
|
+ "service_type" : "UNKNOWN"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Resource Manager Web UI down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: Successfully accessed resorcemanager Web UI",
|
|
|
+ "last_hard_state_change" : "1375296526",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308406",
|
|
|
+ "last_time_warning" : "1375295072",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "0",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308406",
|
|
|
+ "service_type" : "UNKNOWN"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "WebHCat Server status check",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "",
|
|
|
+ "last_hard_state_change" : "1375291969",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308409",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375290515",
|
|
|
+ "is_flapping" : "",
|
|
|
+ "last_check" : "",
|
|
|
+ "service_type" : "WEBHCAT"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "Percent ZooKeeper Servers down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "OK: total:<1>, affected:<0>",
|
|
|
+ "last_hard_state_change" : "1375291461",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308411",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375290037",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308411",
|
|
|
+ "service_type" : "ZOOKEEPER"
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "service_description" : "ZooKeeper Server process down",
|
|
|
+ "host_name" : "dev01.hortonworks.com",
|
|
|
+ "current_attempt" : "1",
|
|
|
+ "current_state" : "0",
|
|
|
+ "plugin_output" : "TCP OK - 0.001 second response time on port 2181",
|
|
|
+ "last_hard_state_change" : "1375291434",
|
|
|
+ "last_hard_state" : "0",
|
|
|
+ "last_time_ok" : "1375308415",
|
|
|
+ "last_time_warning" : "0",
|
|
|
+ "last_time_unknown" : "0",
|
|
|
+ "last_time_critical" : "1375289980",
|
|
|
+ "is_flapping" : "0",
|
|
|
+ "last_check" : "1375308415",
|
|
|
+ "service_type" : "ZOOKEEPER"
|
|
|
+ }
|
|
|
+ ],
|
|
|
+ "hostcounts" : {
|
|
|
+ "up_hosts" : "1",
|
|
|
+ "down_hosts" : "0"
|
|
|
+ },
|
|
|
+ "servicestates" : {
|
|
|
+ "PUPPET" : "0",
|
|
|
+ "HIVE-METASTORE" : "0",
|
|
|
+ "HDFS" : "0",
|
|
|
+ "OOZIE" : "0",
|
|
|
+ "WEBHCAT" : "0",
|
|
|
+ "ZOOKEEPER" : "0"
|
|
|
+ }
|
|
|
+ }
|
|
|
+ },
|
|
|
+ "host" : {
|
|
|
+ "href" : "http://dev01.hortonworks.com:8080/api/v1/clusters/c1/hosts/dev01.hortonworks.com"
|
|
|
+ }
|
|
|
+ }
|
|
|
+ ]
|
|
|
+}
|