|
@@ -12,7 +12,7 @@ except ImportError:
|
|
|
from urllib.error import HTTPError, URLError
|
|
|
import urllib.request as urllib2
|
|
|
|
|
|
-from openshift_checks.logging.logging import LoggingCheck
|
|
|
+from openshift_checks.logging.logging import LoggingCheck, OpenShiftCheckException
|
|
|
|
|
|
|
|
|
class Kibana(LoggingCheck):
|
|
@@ -24,25 +24,12 @@ class Kibana(LoggingCheck):
|
|
|
def run(self):
|
|
|
"""Check various things and gather errors. Returns: result as hash"""
|
|
|
|
|
|
- self.logging_namespace = self.get_var("openshift_logging_namespace", default="logging")
|
|
|
- kibana_pods, error = self.get_pods_for_component(
|
|
|
- self.logging_namespace,
|
|
|
- "kibana",
|
|
|
- )
|
|
|
- if error:
|
|
|
- return {"failed": True, "msg": error}
|
|
|
- check_error = self.check_kibana(kibana_pods)
|
|
|
-
|
|
|
- if not check_error:
|
|
|
- check_error = self._check_kibana_route()
|
|
|
-
|
|
|
- if check_error:
|
|
|
- msg = ("The following Kibana deployment issue was found:"
|
|
|
- "{}".format(check_error))
|
|
|
- return {"failed": True, "msg": msg}
|
|
|
-
|
|
|
+ kibana_pods = self.get_pods_for_component("kibana")
|
|
|
+ self.check_kibana(kibana_pods)
|
|
|
+ self.check_kibana_route()
|
|
|
# TODO(lmeyer): run it all again for the ops cluster
|
|
|
- return {"failed": False, "msg": 'No problems found with Kibana deployment.'}
|
|
|
+
|
|
|
+ return {}
|
|
|
|
|
|
def _verify_url_internal(self, url):
|
|
|
"""
|
|
@@ -65,7 +52,7 @@ class Kibana(LoggingCheck):
|
|
|
def _verify_url_external(url):
|
|
|
"""
|
|
|
Try to reach a URL from ansible control host.
|
|
|
- Returns: success (bool), reason (for failure)
|
|
|
+ Raise an OpenShiftCheckException if anything goes wrong.
|
|
|
"""
|
|
|
# This actually checks from the ansible control host, which may or may not
|
|
|
# really be "external" to the cluster.
|
|
@@ -91,130 +78,149 @@ class Kibana(LoggingCheck):
|
|
|
return None
|
|
|
|
|
|
def check_kibana(self, pods):
|
|
|
- """Check to see if Kibana is up and working. Returns: error string."""
|
|
|
+ """Check to see if Kibana is up and working. Raises OpenShiftCheckException if not."""
|
|
|
|
|
|
if not pods:
|
|
|
- return "There are no Kibana pods deployed, so no access to the logging UI."
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ "MissingComponentPods",
|
|
|
+ "There are no Kibana pods deployed, so no access to the logging UI."
|
|
|
+ )
|
|
|
|
|
|
not_running = self.not_running_pods(pods)
|
|
|
if len(not_running) == len(pods):
|
|
|
- return "No Kibana pod is in a running state, so there is no access to the logging UI."
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ "NoRunningPods",
|
|
|
+ "No Kibana pod is in a running state, so there is no access to the logging UI."
|
|
|
+ )
|
|
|
elif not_running:
|
|
|
- return (
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ "PodNotRunning",
|
|
|
"The following Kibana pods are not currently in a running state:\n"
|
|
|
- "{pods}"
|
|
|
- "However at least one is, so service may not be impacted."
|
|
|
- ).format(pods="".join(" " + pod['metadata']['name'] + "\n" for pod in not_running))
|
|
|
-
|
|
|
- return None
|
|
|
+ " {pods}\n"
|
|
|
+ "However at least one is, so service may not be impacted.".format(
|
|
|
+ pods="\n ".join(pod['metadata']['name'] for pod in not_running)
|
|
|
+ )
|
|
|
+ )
|
|
|
|
|
|
def _get_kibana_url(self):
|
|
|
"""
|
|
|
Get kibana route or report error.
|
|
|
- Returns: url (or empty), reason for failure
|
|
|
+ Returns: url
|
|
|
"""
|
|
|
|
|
|
# Get logging url
|
|
|
- get_route = self.exec_oc(
|
|
|
- self.logging_namespace,
|
|
|
- "get route logging-kibana -o json",
|
|
|
- [],
|
|
|
- )
|
|
|
+ get_route = self.exec_oc("get route logging-kibana -o json", [])
|
|
|
if not get_route:
|
|
|
- return None, 'no_route_exists'
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'no_route_exists',
|
|
|
+ 'No route is defined for Kibana in the logging namespace,\n'
|
|
|
+ 'so the logging stack is not accessible. Is logging deployed?\n'
|
|
|
+ 'Did something remove the logging-kibana route?'
|
|
|
+ )
|
|
|
|
|
|
- route = json.loads(get_route)
|
|
|
+ try:
|
|
|
+ route = json.loads(get_route)
|
|
|
+ # check that the route has been accepted by a router
|
|
|
+ ingress = route["status"]["ingress"]
|
|
|
+ except (ValueError, KeyError):
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'get_route_failed',
|
|
|
+ '"oc get route" returned an unexpected response:\n' + get_route
|
|
|
+ )
|
|
|
|
|
|
- # check that the route has been accepted by a router
|
|
|
- ingress = route["status"]["ingress"]
|
|
|
# ingress can be null if there is no router, or empty if not routed
|
|
|
if not ingress or not ingress[0]:
|
|
|
- return None, 'route_not_accepted'
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'route_not_accepted',
|
|
|
+ 'The logging-kibana route is not being routed by any router.\n'
|
|
|
+ 'Is the router deployed and working?'
|
|
|
+ )
|
|
|
|
|
|
host = route.get("spec", {}).get("host")
|
|
|
if not host:
|
|
|
- return None, 'route_missing_host'
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'route_missing_host',
|
|
|
+ 'The logging-kibana route has no hostname defined,\n'
|
|
|
+ 'which should never happen. Did something alter its definition?'
|
|
|
+ )
|
|
|
|
|
|
- return 'https://{}/'.format(host), None
|
|
|
+ return 'https://{}/'.format(host)
|
|
|
|
|
|
- def _check_kibana_route(self):
|
|
|
+ def check_kibana_route(self):
|
|
|
"""
|
|
|
Check to see if kibana route is up and working.
|
|
|
- Returns: error string
|
|
|
+ Raises exception if not.
|
|
|
"""
|
|
|
- known_errors = dict(
|
|
|
- no_route_exists=(
|
|
|
- 'No route is defined for Kibana in the logging namespace,\n'
|
|
|
- 'so the logging stack is not accessible. Is logging deployed?\n'
|
|
|
- 'Did something remove the logging-kibana route?'
|
|
|
- ),
|
|
|
- route_not_accepted=(
|
|
|
- 'The logging-kibana route is not being routed by any router.\n'
|
|
|
- 'Is the router deployed and working?'
|
|
|
- ),
|
|
|
- route_missing_host=(
|
|
|
- 'The logging-kibana route has no hostname defined,\n'
|
|
|
- 'which should never happen. Did something alter its definition?'
|
|
|
- ),
|
|
|
- )
|
|
|
|
|
|
- kibana_url, error = self._get_kibana_url()
|
|
|
- if not kibana_url:
|
|
|
- return known_errors.get(error, error)
|
|
|
+ kibana_url = self._get_kibana_url()
|
|
|
|
|
|
# first, check that kibana is reachable from the master.
|
|
|
error = self._verify_url_internal(kibana_url)
|
|
|
if error:
|
|
|
if 'urlopen error [Errno 111] Connection refused' in error:
|
|
|
- error = (
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'FailedToConnectInternal',
|
|
|
'Failed to connect from this master to Kibana URL {url}\n'
|
|
|
- 'Is kibana running, and is at least one router routing to it?'
|
|
|
- ).format(url=kibana_url)
|
|
|
+ 'Is kibana running, and is at least one router routing to it?'.format(url=kibana_url)
|
|
|
+ )
|
|
|
elif 'urlopen error [Errno -2] Name or service not known' in error:
|
|
|
- error = (
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'FailedToResolveInternal',
|
|
|
'Failed to connect from this master to Kibana URL {url}\n'
|
|
|
'because the hostname does not resolve.\n'
|
|
|
- 'Is DNS configured for the Kibana hostname?'
|
|
|
- ).format(url=kibana_url)
|
|
|
+ 'Is DNS configured for the Kibana hostname?'.format(url=kibana_url)
|
|
|
+ )
|
|
|
elif 'Status code was not' in error:
|
|
|
- error = (
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'WrongReturnCodeInternal',
|
|
|
'A request from this master to the Kibana URL {url}\n'
|
|
|
'did not return the correct status code (302).\n'
|
|
|
'This could mean that Kibana is malfunctioning, the hostname is\n'
|
|
|
'resolving incorrectly, or other network issues. The output was:\n'
|
|
|
- ' {error}'
|
|
|
- ).format(url=kibana_url, error=error)
|
|
|
- return 'Error validating the logging Kibana route:\n' + error
|
|
|
+ ' {error}'.format(url=kibana_url, error=error)
|
|
|
+ )
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'MiscRouteErrorInternal',
|
|
|
+ 'Error validating the logging Kibana route internally:\n' + error
|
|
|
+ )
|
|
|
|
|
|
# in production we would like the kibana route to work from outside the
|
|
|
# cluster too; but that may not be the case, so allow disabling just this part.
|
|
|
- if not self.get_var("openshift_check_efk_kibana_external", default=True):
|
|
|
- return None
|
|
|
+ if self.get_var("openshift_check_efk_kibana_external", default="True").lower() != "true":
|
|
|
+ return
|
|
|
error = self._verify_url_external(kibana_url)
|
|
|
- if error:
|
|
|
- if 'urlopen error [Errno 111] Connection refused' in error:
|
|
|
- error = (
|
|
|
- 'Failed to connect from the Ansible control host to Kibana URL {url}\n'
|
|
|
- 'Is the router for the Kibana hostname exposed externally?'
|
|
|
- ).format(url=kibana_url)
|
|
|
- elif 'urlopen error [Errno -2] Name or service not known' in error:
|
|
|
- error = (
|
|
|
- 'Failed to resolve the Kibana hostname in {url}\n'
|
|
|
- 'from the Ansible control host.\n'
|
|
|
- 'Is DNS configured to resolve this Kibana hostname externally?'
|
|
|
- ).format(url=kibana_url)
|
|
|
- elif 'Expected success (200)' in error:
|
|
|
- error = (
|
|
|
- 'A request to Kibana at {url}\n'
|
|
|
- 'returned the wrong error code:\n'
|
|
|
- ' {error}\n'
|
|
|
- 'This could mean that Kibana is malfunctioning, the hostname is\n'
|
|
|
- 'resolving incorrectly, or other network issues.'
|
|
|
- ).format(url=kibana_url, error=error)
|
|
|
- error = (
|
|
|
- 'Error validating the logging Kibana route:\n{error}\n'
|
|
|
- 'To disable external Kibana route validation, set in your inventory:\n'
|
|
|
- ' openshift_check_efk_kibana_external=False'
|
|
|
- ).format(error=error)
|
|
|
- return error
|
|
|
- return None
|
|
|
+
|
|
|
+ if not error:
|
|
|
+ return
|
|
|
+
|
|
|
+ error_fmt = (
|
|
|
+ 'Error validating the logging Kibana route:\n{error}\n'
|
|
|
+ 'To disable external Kibana route validation, set the variable:\n'
|
|
|
+ ' openshift_check_efk_kibana_external=False'
|
|
|
+ )
|
|
|
+ if 'urlopen error [Errno 111] Connection refused' in error:
|
|
|
+ msg = (
|
|
|
+ 'Failed to connect from the Ansible control host to Kibana URL {url}\n'
|
|
|
+ 'Is the router for the Kibana hostname exposed externally?'
|
|
|
+ ).format(url=kibana_url)
|
|
|
+ raise OpenShiftCheckException('FailedToConnect', error_fmt.format(error=msg))
|
|
|
+ elif 'urlopen error [Errno -2] Name or service not known' in error:
|
|
|
+ msg = (
|
|
|
+ 'Failed to resolve the Kibana hostname in {url}\n'
|
|
|
+ 'from the Ansible control host.\n'
|
|
|
+ 'Is DNS configured to resolve this Kibana hostname externally?'
|
|
|
+ ).format(url=kibana_url)
|
|
|
+ raise OpenShiftCheckException('FailedToResolve', error_fmt.format(error=msg))
|
|
|
+ elif 'Expected success (200)' in error:
|
|
|
+ msg = (
|
|
|
+ 'A request to Kibana at {url}\n'
|
|
|
+ 'returned the wrong error code:\n'
|
|
|
+ ' {error}\n'
|
|
|
+ 'This could mean that Kibana is malfunctioning, the hostname is\n'
|
|
|
+ 'resolving incorrectly, or other network issues.'
|
|
|
+ ).format(url=kibana_url, error=error)
|
|
|
+ raise OpenShiftCheckException('WrongReturnCode', error_fmt.format(error=msg))
|
|
|
+ raise OpenShiftCheckException(
|
|
|
+ 'MiscRouteError',
|
|
|
+ 'Error validating the logging Kibana route externally:\n' + error
|
|
|
+ )
|