logging.py 3.7 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101
  1. """
  2. Util functions for performing checks on an Elasticsearch, Fluentd, and Kibana stack
  3. """
  4. import json
  5. import os
  6. from openshift_checks import OpenShiftCheck, OpenShiftCheckException
  7. class MissingComponentPods(OpenShiftCheckException):
  8. """Raised when a component has no pods in the namespace."""
  9. pass
  10. class CouldNotUseOc(OpenShiftCheckException):
  11. """Raised when ocutil has a failure running oc."""
  12. pass
  13. class LoggingCheck(OpenShiftCheck):
  14. """Base class for OpenShift aggregated logging component checks"""
  15. # FIXME: this should not be listed as a check, since it is not meant to be
  16. # run by itself.
  17. name = "logging"
  18. def is_active(self):
  19. logging_deployed = self.get_var("openshift_hosted_logging_deploy", convert=bool, default=False)
  20. return logging_deployed and super(LoggingCheck, self).is_active() and self.is_first_master()
  21. def run(self):
  22. return {}
  23. def get_pods_for_component(self, logging_component):
  24. """Get all pods for a given component. Returns: list of pods."""
  25. pod_output = self.exec_oc(
  26. "get pods -l component={} -o json".format(logging_component),
  27. [],
  28. )
  29. try:
  30. pods = json.loads(pod_output) # raises ValueError if deserialize fails
  31. if not pods or not pods.get('items'): # also a broken response, treat the same
  32. raise ValueError()
  33. except ValueError:
  34. # successful run but non-parsing data generally means there were no pods to be found
  35. raise MissingComponentPods(
  36. 'There are no "{}" component pods in the "{}" namespace.\n'
  37. 'Is logging deployed?'.format(logging_component, self.logging_namespace())
  38. )
  39. return pods['items']
  40. @staticmethod
  41. def not_running_pods(pods):
  42. """Returns: list of pods not in a ready and running state"""
  43. return [
  44. pod for pod in pods
  45. if not pod.get("status", {}).get("containerStatuses") or any(
  46. container['ready'] is False
  47. for container in pod['status']['containerStatuses']
  48. ) or not any(
  49. condition['type'] == 'Ready' and condition['status'] == 'True'
  50. for condition in pod['status'].get('conditions', [])
  51. )
  52. ]
  53. def logging_namespace(self):
  54. """Returns the namespace in which logging is configured to deploy."""
  55. return self.get_var("openshift_logging_namespace", default="openshift-logging")
  56. def exec_oc(self, cmd_str="", extra_args=None, save_as_name=None):
  57. """
  58. Execute an 'oc' command in the remote host.
  59. Returns: output of command and namespace,
  60. or raises CouldNotUseOc on error
  61. """
  62. config_base = self.get_var("openshift", "common", "config_base")
  63. args = {
  64. "namespace": self.logging_namespace(),
  65. "config_file": os.path.join(config_base, "master", "admin.kubeconfig"),
  66. "cmd": cmd_str,
  67. "extra_args": list(extra_args) if extra_args else [],
  68. }
  69. result = self.execute_module("ocutil", args, save_as_name=save_as_name)
  70. if result.get("failed"):
  71. if result['result'] == '[Errno 2] No such file or directory':
  72. raise CouldNotUseOc(
  73. "This host is supposed to be a master but does not have the `oc` command where expected.\n"
  74. "Has an installation been run on this host yet?"
  75. )
  76. raise CouldNotUseOc(
  77. 'Unexpected error using `oc` to validate the logging stack components.\n'
  78. 'Error executing `oc {cmd}`:\n'
  79. '{error}'.format(cmd=args['cmd'], error=result['result'])
  80. )
  81. return result.get("result", "")