logging.py 4.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109
  1. """
  2. Util functions for performing checks on an Elasticsearch, Fluentd, and Kibana stack
  3. """
  4. import json
  5. import os
  6. from openshift_checks import OpenShiftCheck, OpenShiftCheckException
  7. class MissingComponentPods(OpenShiftCheckException):
  8. """Raised when a component has no pods in the namespace."""
  9. pass
  10. class CouldNotUseOc(OpenShiftCheckException):
  11. """Raised when ocutil has a failure running oc."""
  12. pass
  13. class LoggingCheck(OpenShiftCheck):
  14. """Base class for OpenShift aggregated logging component checks"""
  15. # FIXME: this should not be listed as a check, since it is not meant to be
  16. # run by itself.
  17. name = "logging"
  18. def is_active(self):
  19. logging_deployed = self.get_var("openshift_hosted_logging_deploy", default=False)
  20. return logging_deployed and super(LoggingCheck, self).is_active() and self.is_first_master()
  21. def is_first_master(self):
  22. """Determine if running on first master. Returns: bool"""
  23. # Note: It would be nice to use membership in oo_first_master group, however for now it
  24. # seems best to avoid requiring that setup and just check this is the first master.
  25. hostname = self.get_var("ansible_ssh_host") or [None]
  26. masters = self.get_var("groups", "masters", default=None) or [None]
  27. return masters[0] == hostname
  28. def run(self):
  29. return {}
  30. def get_pods_for_component(self, logging_component):
  31. """Get all pods for a given component. Returns: list of pods."""
  32. pod_output = self.exec_oc(
  33. "get pods -l component={} -o json".format(logging_component),
  34. [],
  35. )
  36. try:
  37. pods = json.loads(pod_output) # raises ValueError if deserialize fails
  38. if not pods or not pods.get('items'): # also a broken response, treat the same
  39. raise ValueError()
  40. except ValueError:
  41. # successful run but non-parsing data generally means there were no pods to be found
  42. raise MissingComponentPods(
  43. 'There are no "{}" component pods in the "{}" namespace.\n'
  44. 'Is logging deployed?'.format(logging_component, self.logging_namespace())
  45. )
  46. return pods['items']
  47. @staticmethod
  48. def not_running_pods(pods):
  49. """Returns: list of pods not in a ready and running state"""
  50. return [
  51. pod for pod in pods
  52. if not pod.get("status", {}).get("containerStatuses") or any(
  53. container['ready'] is False
  54. for container in pod['status']['containerStatuses']
  55. ) or not any(
  56. condition['type'] == 'Ready' and condition['status'] == 'True'
  57. for condition in pod['status'].get('conditions', [])
  58. )
  59. ]
  60. def logging_namespace(self):
  61. """Returns the namespace in which logging is configured to deploy."""
  62. return self.get_var("openshift_logging_namespace", default="logging")
  63. def exec_oc(self, cmd_str="", extra_args=None):
  64. """
  65. Execute an 'oc' command in the remote host.
  66. Returns: output of command and namespace,
  67. or raises CouldNotUseOc on error
  68. """
  69. config_base = self.get_var("openshift", "common", "config_base")
  70. args = {
  71. "namespace": self.logging_namespace(),
  72. "config_file": os.path.join(config_base, "master", "admin.kubeconfig"),
  73. "cmd": cmd_str,
  74. "extra_args": list(extra_args) if extra_args else [],
  75. }
  76. result = self.execute_module("ocutil", args)
  77. if result.get("failed"):
  78. if result['result'] == '[Errno 2] No such file or directory':
  79. raise CouldNotUseOc(
  80. "This host is supposed to be a master but does not have the `oc` command where expected.\n"
  81. "Has an installation been run on this host yet?"
  82. )
  83. raise CouldNotUseOc(
  84. 'Unexpected error using `oc` to validate the logging stack components.\n'
  85. 'Error executing `oc {cmd}`:\n'
  86. '{error}'.format(cmd=args['cmd'], error=result['result'])
  87. )
  88. return result.get("result", "")