disk_availability.py 6.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148
  1. """Check that there is enough disk space in predefined paths."""
  2. import tempfile
  3. import os.path
  4. from openshift_checks import OpenShiftCheck, OpenShiftCheckException
  5. class DiskAvailability(OpenShiftCheck):
  6. """Check that recommended disk space is available before a first-time install."""
  7. name = "disk_availability"
  8. tags = ["preflight"]
  9. # Values taken from the official installation documentation:
  10. # https://docs.openshift.org/latest/install_config/install/prerequisites.html#system-requirements
  11. recommended_disk_space_bytes = {
  12. '/var': {
  13. 'oo_masters_to_config': 40 * 10**9,
  14. 'oo_nodes_to_config': 15 * 10**9,
  15. 'oo_etcd_to_config': 20 * 10**9,
  16. },
  17. # Used to copy client binaries into,
  18. # see roles/openshift_cli/library/openshift_container_binary_sync.py.
  19. '/usr/local/bin': {
  20. 'oo_masters_to_config': 1 * 10**9,
  21. 'oo_nodes_to_config': 1 * 10**9,
  22. 'oo_etcd_to_config': 1 * 10**9,
  23. },
  24. # Used as temporary storage in several cases.
  25. tempfile.gettempdir(): {
  26. 'oo_masters_to_config': 1 * 10**9,
  27. 'oo_nodes_to_config': 1 * 10**9,
  28. 'oo_etcd_to_config': 1 * 10**9,
  29. },
  30. }
  31. # recommended disk space for each location under an upgrade context
  32. recommended_disk_upgrade_bytes = {
  33. '/var': {
  34. 'oo_masters_to_config': 10 * 10**9,
  35. 'oo_nodes_to_config': 5 * 10 ** 9,
  36. 'oo_etcd_to_config': 5 * 10 ** 9,
  37. },
  38. }
  39. def is_active(self):
  40. """Skip hosts that do not have recommended disk space requirements."""
  41. group_names = self.get_var("group_names", default=[])
  42. active_groups = set()
  43. for recommendation in self.recommended_disk_space_bytes.values():
  44. active_groups.update(recommendation.keys())
  45. has_disk_space_recommendation = bool(active_groups.intersection(group_names))
  46. return super(DiskAvailability, self).is_active() and has_disk_space_recommendation
  47. def run(self):
  48. group_names = self.get_var("group_names")
  49. user_config = self.get_var("openshift_check_min_host_disk_gb", default={})
  50. try:
  51. # For backwards-compatibility, if openshift_check_min_host_disk_gb
  52. # is a number, then it overrides the required config for '/var'.
  53. number = float(user_config)
  54. user_config = {
  55. '/var': {
  56. 'oo_masters_to_config': number,
  57. 'oo_nodes_to_config': number,
  58. 'oo_etcd_to_config': number,
  59. },
  60. }
  61. except TypeError:
  62. # If it is not a number, then it should be a nested dict.
  63. pass
  64. self.register_log("recommended thresholds", self.recommended_disk_space_bytes)
  65. if user_config:
  66. self.register_log("user-configured thresholds", user_config)
  67. # TODO: as suggested in
  68. # https://github.com/openshift/openshift-ansible/pull/4436#discussion_r122180021,
  69. # maybe we could support checking disk availability in paths that are
  70. # not part of the official recommendation but present in the user
  71. # configuration.
  72. for path, recommendation in self.recommended_disk_space_bytes.items():
  73. free_bytes = self.free_bytes(path)
  74. recommended_bytes = max(recommendation.get(name, 0) for name in group_names)
  75. config = user_config.get(path, {})
  76. # NOTE: the user config is in GB, but we compare bytes, thus the
  77. # conversion.
  78. config_bytes = max(config.get(name, 0) for name in group_names) * 10**9
  79. recommended_bytes = config_bytes or recommended_bytes
  80. # if an "upgrade" context is set, update the minimum disk requirement
  81. # as this signifies an in-place upgrade - the node might have the
  82. # required total disk space, but some of that space may already be
  83. # in use by the existing OpenShift deployment.
  84. context = self.get_var("r_openshift_health_checker_playbook_context", default="")
  85. if context == "upgrade":
  86. recommended_upgrade_paths = self.recommended_disk_upgrade_bytes.get(path, {})
  87. if recommended_upgrade_paths:
  88. recommended_bytes = config_bytes or max(recommended_upgrade_paths.get(name, 0)
  89. for name in group_names)
  90. if free_bytes < recommended_bytes:
  91. free_gb = float(free_bytes) / 10**9
  92. recommended_gb = float(recommended_bytes) / 10**9
  93. msg = (
  94. 'Available disk space in "{}" ({:.1f} GB) '
  95. 'is below minimum recommended ({:.1f} GB)'
  96. ).format(path, free_gb, recommended_gb)
  97. # warn if check failed under an "upgrade" context
  98. # due to limits imposed by the user config
  99. if config_bytes and context == "upgrade":
  100. msg += ('\n\nMake sure to account for decreased disk space during an upgrade\n'
  101. 'due to an existing OpenShift deployment. Please check the value of\n'
  102. ' openshift_check_min_host_disk_gb={}\n'
  103. 'in your Ansible inventory, and lower the recommended disk space availability\n'
  104. 'if necessary for this upgrade.').format(config_bytes)
  105. self.register_failure(msg)
  106. return {}
  107. def find_ansible_submounts(self, path):
  108. """Return a list of ansible_mounts that are below the given path."""
  109. base = os.path.join(path, "")
  110. return [
  111. mount
  112. for mount in self.get_var("ansible_mounts")
  113. if mount["mount"].startswith(base)
  114. ]
  115. def free_bytes(self, path):
  116. """Return the size available in path based on ansible_mounts."""
  117. submounts = sum(mnt.get('size_available', 0) for mnt in self.find_ansible_submounts(path))
  118. mount = self.find_ansible_mount(path)
  119. try:
  120. return mount['size_available'] + submounts
  121. except KeyError:
  122. raise OpenShiftCheckException(
  123. 'Unable to retrieve disk availability for "{path}".\n'
  124. 'Ansible facts included a matching mount point for this path:\n'
  125. ' {mount}\n'
  126. 'however it is missing the size_available field.\n'
  127. 'To investigate, you can inspect the output of `ansible -m setup <host>`'
  128. ''.format(path=path, mount=mount)
  129. )