logging.py 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596
  1. """
  2. Util functions for performing checks on an Elasticsearch, Fluentd, and Kibana stack
  3. """
  4. import json
  5. import os
  6. from openshift_checks import OpenShiftCheck, OpenShiftCheckException, get_var
  7. class LoggingCheck(OpenShiftCheck):
  8. """Base class for logging component checks"""
  9. name = "logging"
  10. @classmethod
  11. def is_active(cls, task_vars):
  12. return super(LoggingCheck, cls).is_active(task_vars) and cls.is_first_master(task_vars)
  13. @staticmethod
  14. def is_first_master(task_vars):
  15. """Run only on first master and only when logging is configured. Returns: bool"""
  16. logging_deployed = get_var(task_vars, "openshift_hosted_logging_deploy", default=True)
  17. # Note: It would be nice to use membership in oo_first_master group, however for now it
  18. # seems best to avoid requiring that setup and just check this is the first master.
  19. hostname = get_var(task_vars, "ansible_ssh_host") or [None]
  20. masters = get_var(task_vars, "groups", "masters", default=None) or [None]
  21. return logging_deployed and masters[0] == hostname
  22. def run(self, tmp, task_vars):
  23. pass
  24. def get_pods_for_component(self, execute_module, namespace, logging_component, task_vars):
  25. """Get all pods for a given component. Returns: list of pods for component, error string"""
  26. pod_output = self.exec_oc(
  27. execute_module,
  28. namespace,
  29. "get pods -l component={} -o json".format(logging_component),
  30. [],
  31. task_vars
  32. )
  33. try:
  34. pods = json.loads(pod_output)
  35. if not pods or not pods.get('items'):
  36. raise ValueError()
  37. except ValueError:
  38. # successful run but non-parsing data generally means there were no pods in the namespace
  39. return None, 'There are no pods in the {} namespace. Is logging deployed?'.format(namespace)
  40. return pods['items'], None
  41. @staticmethod
  42. def not_running_pods(pods):
  43. """Returns: list of pods not in a ready and running state"""
  44. return [
  45. pod for pod in pods
  46. if any(
  47. container['ready'] is False
  48. for container in pod['status']['containerStatuses']
  49. ) or not any(
  50. condition['type'] == 'Ready' and condition['status'] == 'True'
  51. for condition in pod['status']['conditions']
  52. )
  53. ]
  54. @staticmethod
  55. def exec_oc(execute_module=None, namespace="logging", cmd_str="", extra_args=None, task_vars=None):
  56. """
  57. Execute an 'oc' command in the remote host.
  58. Returns: output of command and namespace,
  59. or raises OpenShiftCheckException on error
  60. """
  61. config_base = get_var(task_vars, "openshift", "common", "config_base")
  62. args = {
  63. "namespace": namespace,
  64. "config_file": os.path.join(config_base, "master", "admin.kubeconfig"),
  65. "cmd": cmd_str,
  66. "extra_args": list(extra_args) if extra_args else [],
  67. }
  68. result = execute_module("ocutil", args, task_vars)
  69. if result.get("failed"):
  70. msg = (
  71. 'Unexpected error using `oc` to validate the logging stack components.\n'
  72. 'Error executing `oc {cmd}`:\n'
  73. '{error}'
  74. ).format(cmd=args['cmd'], error=result['result'])
  75. if result['result'] == '[Errno 2] No such file or directory':
  76. msg = (
  77. "This host is supposed to be a master but does not have the `oc` command where expected.\n"
  78. "Has an installation been run on this host yet?"
  79. )
  80. raise OpenShiftCheckException(msg)
  81. return result.get("result", "")