alerts.json 1.6 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253
  {
    "ZOOKEEPER": {
      "service": [
        {
          "name": "zookeeper_server_process_percent",
          "label": "Percent ZooKeeper Servers Available",
          "description": "This service-level alert is triggered if the configured percentage of ZooKeeper processes cannot be determined to be up and listening on the network.",
          "interval": 1,
          "scope": "SERVICE",
          "enabled": true,
          "source": {
            "type": "AGGREGATE",
            "alert_name": "zookeeper_server_process",
            "reporting": {
              "ok": {
                "text": "affected: [{1}], total: [{0}]"
              },
              "warning": {
                "text": "affected: [{1}], total: [{0}]",
                "value": 0.35
              },
              "critical": {
                "text": "affected: [{1}], total: [{0}]",
                "value": 0.70
              }
            }
          }
        }
      ],
      "ZOOKEEPER_SERVER": [
        {
          "name": "zookeeper_server_process",
          "label": "ZooKeeper Server Process",
          "description": "This host-level alert is triggered if the ZooKeeper server process cannot be determined to be up and listening on the network.",
          "interval": 1,
          "scope": "ANY",
          "source": {
            "type": "PORT",
            "uri": "{{zookeeper-env/clientPort}}",
            "default_port": 2181,
            "reporting": {
              "ok": {
                "text": "TCP OK - {0:.4f} response on port {1}"
              },
              "critical": {
                "text": "Connection failed: {0} to {1}:{2}"
              }
            }
          }
        }
      ]
    }
  }