zz_failure_summary.py 9.1 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235
  1. """Ansible callback plugin to print a nicely formatted summary of failures.
  2. The file / module name is prefixed with `zz_` to make this plugin be loaded last
  3. by Ansible, thus making its output the last thing that users see.
  4. """
  5. from collections import defaultdict
  6. import traceback
  7. from ansible.plugins.callback import CallbackBase
  8. from ansible import constants as C
  9. from ansible.utils.color import stringc
  10. from ansible.module_utils.six import string_types
  11. FAILED_NO_MSG = u'Failed without returning a message.'
  12. class CallbackModule(CallbackBase):
  13. """This callback plugin stores task results and summarizes failures."""
  14. CALLBACK_VERSION = 2.0
  15. CALLBACK_TYPE = 'aggregate'
  16. CALLBACK_NAME = 'failure_summary'
  17. CALLBACK_NEEDS_WHITELIST = False
  18. def __init__(self):
  19. super(CallbackModule, self).__init__()
  20. self.__failures = []
  21. self.__playbook_file = ''
  22. def v2_playbook_on_start(self, playbook):
  23. super(CallbackModule, self).v2_playbook_on_start(playbook)
  24. # pylint: disable=protected-access; Ansible gives us no public API to
  25. # get the file name of the current playbook from a callback plugin.
  26. self.__playbook_file = playbook._file_name
  27. def v2_runner_on_failed(self, result, ignore_errors=False):
  28. super(CallbackModule, self).v2_runner_on_failed(result, ignore_errors)
  29. if not ignore_errors:
  30. self.__failures.append(result)
  31. def v2_playbook_on_stats(self, stats):
  32. super(CallbackModule, self).v2_playbook_on_stats(stats)
  33. # pylint: disable=broad-except; capturing exceptions broadly is
  34. # intentional, to isolate arbitrary failures in this callback plugin.
  35. try:
  36. if self.__failures:
  37. self._display.display(failure_summary(self.__failures, self.__playbook_file))
  38. except Exception:
  39. msg = stringc(
  40. u'An error happened while generating a summary of failures:\n'
  41. u'{}'.format(traceback.format_exc()), C.COLOR_WARN)
  42. self._display.v(msg)
  43. def failure_summary(failures, playbook):
  44. """Return a summary of failed tasks, including details on health checks."""
  45. if not failures:
  46. return u''
  47. # NOTE: because we don't have access to task_vars from callback plugins, we
  48. # store the playbook context in the task result when the
  49. # openshift_health_check action plugin is used, and we use this context to
  50. # customize the error message.
  51. # pylint: disable=protected-access; Ansible gives us no sufficient public
  52. # API on TaskResult objects.
  53. context = next((
  54. context for context in
  55. (failure._result.get('playbook_context') for failure in failures)
  56. if context
  57. ), None)
  58. failures = [failure_to_dict(failure) for failure in failures]
  59. failures = deduplicate_failures(failures)
  60. summary = [u'', u'', u'Failure summary:', u'']
  61. width = len(str(len(failures)))
  62. initial_indent_format = u' {{:>{width}}}. '.format(width=width)
  63. initial_indent_len = len(initial_indent_format.format(0))
  64. subsequent_indent = u' ' * initial_indent_len
  65. subsequent_extra_indent = u' ' * (initial_indent_len + 10)
  66. for i, failure in enumerate(failures, 1):
  67. entries = format_failure(failure)
  68. summary.append(u'\n{}{}'.format(initial_indent_format.format(i), entries[0]))
  69. for entry in entries[1:]:
  70. entry = entry.replace(u'\n', u'\n' + subsequent_extra_indent)
  71. indented = u'{}{}'.format(subsequent_indent, entry)
  72. summary.append(indented)
  73. failed_checks = set()
  74. for failure in failures:
  75. failed_checks.update(name for name, message in failure['checks'])
  76. if failed_checks:
  77. summary.append(check_failure_footer(failed_checks, context, playbook))
  78. return u'\n'.join(summary)
  79. def failure_to_dict(failed_task_result):
  80. """Extract information out of a failed TaskResult into a dict.
  81. The intent is to transform a TaskResult object into something easier to
  82. manipulate. TaskResult is ansible.executor.task_result.TaskResult.
  83. """
  84. # pylint: disable=protected-access; Ansible gives us no sufficient public
  85. # API on TaskResult objects.
  86. _result = failed_task_result._result
  87. return {
  88. 'host': failed_task_result._host.get_name(),
  89. 'play': play_name(failed_task_result._task),
  90. 'task': failed_task_result.task_name,
  91. 'msg': _result.get('msg', FAILED_NO_MSG),
  92. 'checks': tuple(
  93. (name, result.get('msg', FAILED_NO_MSG))
  94. for name, result in sorted(_result.get('checks', {}).items())
  95. if result.get('failed')
  96. ),
  97. }
  98. def play_name(obj):
  99. """Given a task or block, return the name of its parent play.
  100. This is loosely inspired by ansible.playbook.base.Base.dump_me.
  101. """
  102. # pylint: disable=protected-access; Ansible gives us no sufficient public
  103. # API to implement this.
  104. if not obj:
  105. return ''
  106. if hasattr(obj, '_play'):
  107. return obj._play.get_name()
  108. return play_name(getattr(obj, '_parent'))
  109. def deduplicate_failures(failures):
  110. """Group together similar failures from different hosts.
  111. Returns a new list of failures such that identical failures from different
  112. hosts are grouped together in a single entry. The relative order of failures
  113. is preserved.
  114. If failures is unhashable, the original list of failures is returned.
  115. """
  116. groups = defaultdict(list)
  117. for failure in failures:
  118. group_key = tuple(sorted((key, value) for key, value in failure.items() if key != 'host'))
  119. try:
  120. groups[group_key].append(failure)
  121. except TypeError:
  122. # abort and return original list of failures when failures has an
  123. # unhashable type.
  124. return failures
  125. result = []
  126. for failure in failures:
  127. group_key = tuple(sorted((key, value) for key, value in failure.items() if key != 'host'))
  128. if group_key not in groups:
  129. continue
  130. failure['host'] = tuple(sorted(g_failure['host'] for g_failure in groups.pop(group_key)))
  131. result.append(failure)
  132. return result
  133. def format_failure(failure):
  134. """Return a list of pretty-formatted text entries describing a failure, including
  135. relevant information about it. Expect that the list of text entries will be joined
  136. by a newline separator when output to the user."""
  137. if isinstance(failure['host'], string_types):
  138. host = failure['host']
  139. else:
  140. host = u', '.join(failure['host'])
  141. play = failure['play']
  142. task = failure['task']
  143. msg = failure['msg']
  144. checks = failure['checks']
  145. fields = (
  146. (u'Hosts', host),
  147. (u'Play', play),
  148. (u'Task', task),
  149. (u'Message', stringc(msg, C.COLOR_ERROR)),
  150. )
  151. if checks:
  152. fields += ((u'Details', format_failed_checks(checks)),)
  153. row_format = '{:10}{}'
  154. return [row_format.format(header + u':', body) for header, body in fields]
  155. def format_failed_checks(checks):
  156. """Return pretty-formatted text describing checks that failed."""
  157. messages = []
  158. for name, message in checks:
  159. messages.append(u'check "{}":\n{}'.format(name, message))
  160. return stringc(u'\n\n'.join(messages), C.COLOR_ERROR)
  161. def check_failure_footer(failed_checks, context, playbook):
  162. """Return a textual explanation about checks depending on context.
  163. The purpose of specifying context is to vary the output depending on what
  164. the user was expecting to happen (based on which playbook they ran). The
  165. only use currently is to vary the message depending on whether the user was
  166. deliberately running checks or was trying to install/upgrade and checks are
  167. just included. Other use cases may arise.
  168. """
  169. checks = ','.join(sorted(failed_checks))
  170. summary = [u'']
  171. if context in ['pre-install', 'health', 'adhoc']:
  172. # User was expecting to run checks, less explanation needed.
  173. summary.extend([
  174. u'You may configure or disable checks by setting Ansible '
  175. u'variables. To disable those above, set:',
  176. u' openshift_disable_check={checks}'.format(checks=checks),
  177. u'Consult check documentation for configurable variables.',
  178. ])
  179. else:
  180. # User may not be familiar with the checks, explain what checks are in
  181. # the first place.
  182. summary.extend([
  183. u'The execution of "{playbook}" includes checks designed to fail '
  184. u'early if the requirements of the playbook are not met. One or '
  185. u'more of these checks failed. To disregard these results,'
  186. u'explicitly disable checks by setting an Ansible variable:'.format(playbook=playbook),
  187. u' openshift_disable_check={checks}'.format(checks=checks),
  188. u'Failing check names are shown in the failure details above. '
  189. u'Some checks may be configurable by variables if your requirements '
  190. u'are different from the defaults; consult check documentation.',
  191. ])
  192. summary.append(
  193. u'Variables can be set in the inventory or passed on the command line '
  194. u'using the -e flag to ansible-playbook.'
  195. )
  196. return u'\n'.join(summary)