# template_ops_tools.yml
---
# Definition of the "Template Operations Tools" Zabbix template: one discovery
# rule, one item prototype, one trigger prototype and one action.
#
# NOTE(review): this file had lost its indentation and blank lines, and every
# line carried a viewer line-number prefix. The nesting below is reconstructed
# from the key names; confirm it against the schema of whatever consumes
# g_template_ops_tools (in particular the placement of target_hosts and
# opconditions inside each operation).
g_template_ops_tools:
  # Referenced by name inside the trigger prototype expression below; the two
  # must stay in sync.
  name: Template Operations Tools

  # Discovery rule that the item prototype below attaches to via
  # discoveryrule_key.
  zdiscoveryrules:
    - name: disc.ops.runner
      key: disc.ops.runner
      lifetime: 1  # NOTE(review): unit not stated here - presumably days
      description: "Dynamically register operations runner items"

  # One item per discovered {#OSO_COMMAND}, holding that command's exit code.
  zitemprototypes:
    - discoveryrule_key: disc.ops.runner
      name: "Exit code of ops-runner[{#OSO_COMMAND}]"
      key: "disc.ops.runner.command.exitcode[{#OSO_COMMAND}]"
      value_type: int
      description: "The exit code of the command run from ops-runner"
      applications:
        - Ops Runner

  # Raises a problem when the last recorded exit code for a command is not 0.
  ztriggerprototypes:
    - name: 'ops-runner[{#OSO_COMMAND}]: non-zero exit code on {HOST.NAME}'
      expression: '{Template Operations Tools:disc.ops.runner.command.exitcode[{#OSO_COMMAND}].last()}<>0'
      url: 'https://github.com/openshift/ops-sop/blob/master/V3/Alerts/check_ops_runner_command.asciidoc'
      priority: average

  # Action that runs a remote command for triggers whose name contains
  # "[HEAL]".
  zactions:
    - name: 'Remote command for [HEAL] triggers'
      status: enabled
      escalation_time: 60
      conditions_filter:
        calculation_type: "and/or"
        conditions:
          # No value is given for the maintenance condition in the source.
          - conditiontype: maintenance status
            operator: not in
          # Quoted so the brackets are not read as a YAML flow sequence.
          - conditiontype: trigger name
            operator: like
            value: "[HEAL]"
          - conditiontype: trigger value
            operator: "="
            value: PROBLEM
      operations:
        # Single escalation step (from 1 to 1).
        - esc_step_from: 1
          esc_step_to: 1
          esc_period: 0
          operationtype: remote command
          opcommand:
            # Single-quoted on purpose: backslashes stay literal in YAML, so
            # the command text keeps \" around each Zabbix macro. The
            # {{ ... }} placeholders are presumably template variables filled
            # in by the consumer of this file - confirm.
            command: 'ssh -i /etc/openshift_tools/scriptrunner_id_rsa {{ ozb_scriptrunner_user }}@{{ ozb_scriptrunner_bastion_host }} remote-healer --host \"{HOST.NAME}\" --trigger \"{TRIGGER.NAME}\" --trigger-val \"{TRIGGER.VALUE}\"'
            execute_on: "zabbix server"
            type: 'custom script'
          target_hosts:
            - target_type: 'zabbix server'
          # Only run while the event has not been acknowledged.
          opconditions:
            - conditiontype: 'event acknowledged'
              operator: '='
              value: 'not acknowledged'