zz_failure_summary.py 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214
  1. """Ansible callback plugin to print a nicely formatted summary of failures.
  2. The file / module name is prefixed with `zz_` to make this plugin be loaded last
  3. by Ansible, thus making its output the last thing that users see.
  4. """
  5. from collections import defaultdict
  6. from ansible.plugins.callback import CallbackBase
  7. from ansible import constants as C
  8. from ansible.utils.color import stringc
  9. FAILED_NO_MSG = u'Failed without returning a message.'
  10. class CallbackModule(CallbackBase):
  11. """This callback plugin stores task results and summarizes failures."""
  12. CALLBACK_VERSION = 2.0
  13. CALLBACK_TYPE = 'aggregate'
  14. CALLBACK_NAME = 'failure_summary'
  15. CALLBACK_NEEDS_WHITELIST = False
  16. def __init__(self):
  17. super(CallbackModule, self).__init__()
  18. self.__failures = []
  19. self.__playbook_file = ''
  20. def v2_playbook_on_start(self, playbook):
  21. super(CallbackModule, self).v2_playbook_on_start(playbook)
  22. # pylint: disable=protected-access; Ansible gives us no public API to
  23. # get the file name of the current playbook from a callback plugin.
  24. self.__playbook_file = playbook._file_name
  25. def v2_runner_on_failed(self, result, ignore_errors=False):
  26. super(CallbackModule, self).v2_runner_on_failed(result, ignore_errors)
  27. if not ignore_errors:
  28. self.__failures.append(result)
  29. def v2_playbook_on_stats(self, stats):
  30. super(CallbackModule, self).v2_playbook_on_stats(stats)
  31. if self.__failures:
  32. self._display.display(failure_summary(self.__failures, self.__playbook_file))
  33. def failure_summary(failures, playbook):
  34. """Return a summary of failed tasks, including details on health checks."""
  35. if not failures:
  36. return u''
  37. # NOTE: because we don't have access to task_vars from callback plugins, we
  38. # store the playbook context in the task result when the
  39. # openshift_health_check action plugin is used, and we use this context to
  40. # customize the error message.
  41. # pylint: disable=protected-access; Ansible gives us no sufficient public
  42. # API on TaskResult objects.
  43. context = next((
  44. context for context in
  45. (failure._result.get('playbook_context') for failure in failures)
  46. if context
  47. ), None)
  48. failures = [failure_to_dict(failure) for failure in failures]
  49. failures = deduplicate_failures(failures)
  50. summary = [u'', u'', u'Failure summary:', u'']
  51. width = len(str(len(failures)))
  52. initial_indent_format = u' {{:>{width}}}. '.format(width=width)
  53. initial_indent_len = len(initial_indent_format.format(0))
  54. subsequent_indent = u' ' * initial_indent_len
  55. subsequent_extra_indent = u' ' * (initial_indent_len + 10)
  56. for i, failure in enumerate(failures, 1):
  57. entries = format_failure(failure)
  58. summary.append(u'\n{}{}'.format(initial_indent_format.format(i), entries[0]))
  59. for entry in entries[1:]:
  60. entry = entry.replace(u'\n', u'\n' + subsequent_extra_indent)
  61. indented = u'{}{}'.format(subsequent_indent, entry)
  62. summary.append(indented)
  63. failed_checks = set()
  64. for failure in failures:
  65. failed_checks.update(name for name, message in failure['checks'])
  66. if failed_checks:
  67. summary.append(check_failure_footer(failed_checks, context, playbook))
  68. return u'\n'.join(summary)
  69. def failure_to_dict(failed_task_result):
  70. """Extract information out of a failed TaskResult into a dict.
  71. The intent is to transform a TaskResult object into something easier to
  72. manipulate. TaskResult is ansible.executor.task_result.TaskResult.
  73. """
  74. # pylint: disable=protected-access; Ansible gives us no sufficient public
  75. # API on TaskResult objects.
  76. _result = failed_task_result._result
  77. return {
  78. 'host': failed_task_result._host.get_name(),
  79. 'play': play_name(failed_task_result._task),
  80. 'task': failed_task_result.task_name,
  81. 'msg': _result.get('msg', FAILED_NO_MSG),
  82. 'checks': tuple(
  83. (name, result.get('msg', FAILED_NO_MSG))
  84. for name, result in sorted(_result.get('checks', {}).items())
  85. if result.get('failed')
  86. ),
  87. }
  88. def play_name(obj):
  89. """Given a task or block, return the name of its parent play.
  90. This is loosely inspired by ansible.playbook.base.Base.dump_me.
  91. """
  92. # pylint: disable=protected-access; Ansible gives us no sufficient public
  93. # API to implement this.
  94. if not obj:
  95. return ''
  96. if hasattr(obj, '_play'):
  97. return obj._play.get_name()
  98. return play_name(getattr(obj, '_parent'))
  99. def deduplicate_failures(failures):
  100. """Group together similar failures from different hosts.
  101. Returns a new list of failures such that identical failures from different
  102. hosts are grouped together in a single entry. The relative order of failures
  103. is preserved.
  104. """
  105. groups = defaultdict(list)
  106. for failure in failures:
  107. group_key = tuple(sorted((key, value) for key, value in failure.items() if key != 'host'))
  108. groups[group_key].append(failure)
  109. result = []
  110. for failure in failures:
  111. group_key = tuple(sorted((key, value) for key, value in failure.items() if key != 'host'))
  112. if group_key not in groups:
  113. continue
  114. failure['host'] = tuple(sorted(g_failure['host'] for g_failure in groups.pop(group_key)))
  115. result.append(failure)
  116. return result
  117. def format_failure(failure):
  118. """Return a list of pretty-formatted text entries describing a failure, including
  119. relevant information about it. Expect that the list of text entries will be joined
  120. by a newline separator when output to the user."""
  121. host = u', '.join(failure['host'])
  122. play = failure['play']
  123. task = failure['task']
  124. msg = failure['msg']
  125. checks = failure['checks']
  126. fields = (
  127. (u'Hosts', host),
  128. (u'Play', play),
  129. (u'Task', task),
  130. (u'Message', stringc(msg, C.COLOR_ERROR)),
  131. )
  132. if checks:
  133. fields += ((u'Details', format_failed_checks(checks)),)
  134. row_format = '{:10}{}'
  135. return [row_format.format(header + u':', body) for header, body in fields]
  136. def format_failed_checks(checks):
  137. """Return pretty-formatted text describing checks that failed."""
  138. messages = []
  139. for name, message in checks:
  140. messages.append(u'check "{}":\n{}'.format(name, message))
  141. return stringc(u'\n\n'.join(messages), C.COLOR_ERROR)
  142. def check_failure_footer(failed_checks, context, playbook):
  143. """Return a textual explanation about checks depending on context.
  144. The purpose of specifying context is to vary the output depending on what
  145. the user was expecting to happen (based on which playbook they ran). The
  146. only use currently is to vary the message depending on whether the user was
  147. deliberately running checks or was trying to install/upgrade and checks are
  148. just included. Other use cases may arise.
  149. """
  150. checks = ','.join(sorted(failed_checks))
  151. summary = [u'']
  152. if context in ['pre-install', 'health', 'adhoc']:
  153. # User was expecting to run checks, less explanation needed.
  154. summary.extend([
  155. u'You may configure or disable checks by setting Ansible '
  156. u'variables. To disable those above, set:',
  157. u' openshift_disable_check={checks}'.format(checks=checks),
  158. u'Consult check documentation for configurable variables.',
  159. ])
  160. else:
  161. # User may not be familiar with the checks, explain what checks are in
  162. # the first place.
  163. summary.extend([
  164. u'The execution of "{playbook}" includes checks designed to fail '
  165. u'early if the requirements of the playbook are not met. One or '
  166. u'more of these checks failed. To disregard these results,'
  167. u'explicitly disable checks by setting an Ansible variable:'.format(playbook=playbook),
  168. u' openshift_disable_check={checks}'.format(checks=checks),
  169. u'Failing check names are shown in the failure details above. '
  170. u'Some checks may be configurable by variables if your requirements '
  171. u'are different from the defaults; consult check documentation.',
  172. ])
  173. summary.append(
  174. u'Variables can be set in the inventory or passed on the command line '
  175. u'using the -e flag to ansible-playbook.'
  176. )
  177. return u'\n'.join(summary)