123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657 |
- """Check for an aggregated logging Curator deployment"""
- from openshift_checks import get_var
- from openshift_checks.logging.logging import LoggingCheck
- class Curator(LoggingCheck):
- """Check for an aggregated logging Curator deployment"""
- name = "curator"
- tags = ["health", "logging"]
- logging_namespace = None
- def run(self, tmp, task_vars):
- self.logging_namespace = get_var(task_vars, "openshift_logging_namespace", default="logging")
- curator_pods, error = super(Curator, self).get_pods_for_component(
- self.module_executor,
- self.logging_namespace,
- "curator",
- task_vars
- )
- if error:
- return {"failed": True, "changed": False, "msg": error}
- check_error = self.check_curator(curator_pods)
- if check_error:
- msg = ("The following Curator deployment issue was found:"
- "\n-------\n"
- "{}".format(check_error))
- return {"failed": True, "changed": False, "msg": msg}
- # TODO(lmeyer): run it all again for the ops cluster
- return {"failed": False, "changed": False, "msg": 'No problems found with Curator deployment.'}
- def check_curator(self, pods):
- """Check to see if curator is up and working. Returns: error string"""
- if not pods:
- return (
- "There are no Curator pods for the logging stack,\n"
- "so nothing will prune Elasticsearch indexes.\n"
- "Is Curator correctly deployed?"
- )
- not_running = super(Curator, self).not_running_pods(pods)
- if len(not_running) == len(pods):
- return (
- "The Curator pod is not currently in a running state,\n"
- "so Elasticsearch indexes may increase without bound."
- )
- if len(pods) - len(not_running) > 1:
- return (
- "There is more than one Curator pod running. This should not normally happen.\n"
- "Although this doesn't cause any problems, you may want to investigate."
- )
- return None
|