diagnostics.py 2.3 KB

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162
  1. """
  2. A check to run relevant diagnostics via `oc adm diagnostics`.
  3. """
  4. import os
  5. from openshift_checks import OpenShiftCheck, OpenShiftCheckException
  6. DIAGNOSTIC_LIST = (
  7. "AggregatedLogging ClusterRegistry ClusterRoleBindings ClusterRoles "
  8. "ClusterRouter DiagnosticPod NetworkCheck"
  9. ).split()
  10. class DiagnosticCheck(OpenShiftCheck):
  11. """A check to run relevant diagnostics via `oc adm diagnostics`."""
  12. name = "diagnostics"
  13. tags = ["health"]
  14. def is_active(self):
  15. return super(DiagnosticCheck, self).is_active() and self.is_first_master()
  16. def run(self):
  17. if self.exec_diagnostic("ConfigContexts"):
  18. # only run the other diagnostics if that one succeeds (otherwise, all will fail)
  19. diagnostics = self.get_var("openshift_check_diagnostics", default=DIAGNOSTIC_LIST)
  20. for diagnostic in self.normalize(diagnostics):
  21. self.exec_diagnostic(diagnostic)
  22. return {}
  23. def exec_diagnostic(self, diagnostic):
  24. """
  25. Execute an 'oc adm diagnostics' command on the remote host.
  26. Raises OcNotFound or registers OcDiagFailed.
  27. Returns True on success or False on failure (non-zero rc).
  28. """
  29. config_base = self.get_var("openshift.common.config_base")
  30. args = {
  31. "config_file": os.path.join(config_base, "master", "admin.kubeconfig"),
  32. "cmd": "adm diagnostics",
  33. "extra_args": [diagnostic],
  34. }
  35. result = self.execute_module("ocutil", args, save_as_name=diagnostic + ".failure.json")
  36. self.register_file(diagnostic + ".txt", result['result'])
  37. if result.get("failed"):
  38. if result['result'] == '[Errno 2] No such file or directory':
  39. raise OpenShiftCheckException(
  40. "OcNotFound",
  41. "This host is supposed to be a master but does not have the `oc` command where expected.\n"
  42. "Has an installation been run on this host yet?"
  43. )
  44. self.register_failure(OpenShiftCheckException(
  45. 'OcDiagFailed',
  46. 'The {diag} diagnostic reported an error:\n'
  47. '{error}'.format(diag=diagnostic, error=result['result'])
  48. ))
  49. return False
  50. return True