curator.py 1.6 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243
  1. """Check for an aggregated logging Curator deployment"""
  2. from openshift_checks.logging.logging import OpenShiftCheckException, LoggingCheck
  3. class Curator(LoggingCheck):
  4. """Check for an aggregated logging Curator deployment"""
  5. name = "curator"
  6. tags = ["health", "logging"]
  7. def run(self):
  8. """Check various things and gather errors. Returns: result as hash"""
  9. curator_pods = self.get_pods_for_component("curator")
  10. self.check_curator(curator_pods)
  11. # TODO(lmeyer): run it all again for the ops cluster
  12. return {}
  13. def check_curator(self, pods):
  14. """Check to see if curator is up and working. Returns: error string"""
  15. if not pods:
  16. raise OpenShiftCheckException(
  17. "MissingComponentPods",
  18. "There are no Curator pods for the logging stack,\n"
  19. "so nothing will prune Elasticsearch indexes.\n"
  20. "Is Curator correctly deployed?"
  21. )
  22. not_running = self.not_running_pods(pods)
  23. if len(not_running) == len(pods):
  24. raise OpenShiftCheckException(
  25. "CuratorNotRunning",
  26. "The Curator pod is not currently in a running state,\n"
  27. "so Elasticsearch indexes may increase without bound."
  28. )
  29. if len(pods) - len(not_running) > 1:
  30. raise OpenShiftCheckException(
  31. "TooManyCurators",
  32. "There is more than one Curator pod running. This should not normally happen.\n"
  33. "Although this doesn't cause any problems, you may want to investigate."
  34. )