upgrade.yml 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344
  1. ---
  2. ###############################################################################
  3. # Upgrade Masters
  4. ###############################################################################
  5. # Create service signer cert when missing. Service signer certificate
  6. # is added to master config in the master_config_upgrade hook.
  7. - name: Determine if service signer cert must be created
  8. hosts: oo_first_master
  9. tasks:
  10. - name: Determine if service signer certificate must be created
  11. stat:
  12. path: "{{ openshift.common.config_base }}/master/service-signer.crt"
  13. register: service_signer_cert_stat
  14. changed_when: false
  15. - import_playbook: create_service_signer_cert.yml
  16. # oc adm migrate storage should be run prior to etcd v3 upgrade
  17. # See: https://github.com/openshift/origin/pull/14625#issuecomment-308467060
  18. - name: Pre master upgrade - Upgrade all storage
  19. hosts: oo_first_master
  20. roles:
  21. - openshift_facts
  22. tasks:
  23. - name: Upgrade all storage
  24. command: >
  25. {{ openshift_client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  26. migrate storage --include=* --confirm
  27. register: l_pb_upgrade_control_plane_pre_upgrade_storage
  28. when: openshift_upgrade_pre_storage_migration_enabled | default(true) | bool
  29. failed_when:
  30. - l_pb_upgrade_control_plane_pre_upgrade_storage.rc != 0
  31. - openshift_upgrade_pre_storage_migration_fatal | default(true) | bool
  32. # Set openshift_master_facts separately. In order to reconcile
  33. # admission_config's, we currently must run openshift_master_facts and
  34. # then run openshift_facts.
  35. - name: Set OpenShift master facts
  36. hosts: oo_masters_to_config
  37. roles:
  38. - openshift_master_facts
  39. - name: configure vsphere svc account
  40. hosts: oo_first_master
  41. tasks:
  42. - include_role:
  43. name: openshift_cloud_provider
  44. tasks_from: vsphere-svc
  45. when:
  46. - openshift_cloudprovider_kind is defined
  47. - openshift_cloudprovider_kind == 'vsphere'
  48. - openshift_version | version_compare('3.9', '>=')
  49. # The main master upgrade play. Should handle all changes to the system in one pass, with
  50. # support for optional hooks to be defined.
  51. - name: Upgrade master
  52. hosts: oo_masters_to_config
  53. serial: 1
  54. roles:
  55. - openshift_facts
  56. tasks:
  57. # Run the pre-upgrade hook if defined:
  58. - debug: msg="Running master pre-upgrade hook {{ openshift_master_upgrade_pre_hook }}"
  59. when: openshift_master_upgrade_pre_hook is defined
  60. - include_tasks: "{{ openshift_master_upgrade_pre_hook }}"
  61. when: openshift_master_upgrade_pre_hook is defined
  62. - import_role:
  63. name: openshift_master
  64. tasks_from: upgrade.yml
  65. - name: update vsphere provider master config
  66. include_role:
  67. name: openshift_master
  68. tasks_from: update-vsphere
  69. when:
  70. - openshift_cloudprovider_kind is defined
  71. - openshift_cloudprovider_kind == 'vsphere'
  72. - openshift_version | version_compare('3.9', '>=')
  73. - name: Setup and enable bootstrapping options
  74. include_tasks: tasks/enable_bootstrap.yml
  75. when: openshift_master_bootstrap_enabled | default(false) | bool
  76. # Run the upgrade hook prior to restarting services/system if defined:
  77. - debug: msg="Running master upgrade hook {{ openshift_master_upgrade_hook }}"
  78. when: openshift_master_upgrade_hook is defined
  79. - include_tasks: "{{ openshift_master_upgrade_hook }}"
  80. when: openshift_master_upgrade_hook is defined
  81. - name: Disable master controller
  82. service:
  83. name: "{{ openshift_service_type }}-master-controllers"
  84. enabled: false
  85. when: openshift.common.rolling_restart_mode == 'system'
  86. - include_tasks: tasks/restart_hosts.yml
  87. when: openshift.common.rolling_restart_mode == 'system'
  88. - include_tasks: tasks/restart_services.yml
  89. when: openshift.common.rolling_restart_mode == 'services'
  90. # Run the post-upgrade hook if defined:
  91. - debug: msg="Running master post-upgrade hook {{ openshift_master_upgrade_post_hook }}"
  92. when: openshift_master_upgrade_post_hook is defined
  93. - include_tasks: "{{ openshift_master_upgrade_post_hook }}"
  94. when: openshift_master_upgrade_post_hook is defined
  95. - name: Post master upgrade - Upgrade clusterpolicies storage
  96. command: >
  97. {{ openshift_client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  98. migrate storage --include=clusterpolicies --confirm
  99. register: l_pb_upgrade_control_plane_post_upgrade_storage
  100. when:
  101. - openshift_upgrade_post_storage_migration_enabled | default(true) | bool
  102. - openshift_version is version_compare('3.7','<')
  103. failed_when:
  104. - l_pb_upgrade_control_plane_post_upgrade_storage.rc != 0
  105. - openshift_upgrade_post_storage_migration_fatal | default(false) | bool
  106. run_once: true
  107. delegate_to: "{{ groups.oo_first_master.0 }}"
  108. - set_fact:
  109. master_update_complete: True
  110. ##############################################################################
  111. # Gate on master update complete
  112. ##############################################################################
  113. - name: Gate on master update
  114. hosts: localhost
  115. connection: local
  116. tasks:
  117. - set_fact:
  118. master_update_completed: "{{ hostvars
  119. | lib_utils_oo_select_keys(groups.oo_masters_to_config)
  120. | lib_utils_oo_collect('inventory_hostname', {'master_update_complete': true}) }}"
  121. - set_fact:
  122. master_update_failed: "{{ groups.oo_masters_to_config | difference(master_update_completed) | list }}"
  123. - fail:
  124. msg: "Upgrade cannot continue. The following masters did not finish updating: {{ master_update_failed | join(',') }}"
  125. when: master_update_failed | length > 0
  126. ###############################################################################
  127. # Reconcile Cluster Roles, Cluster Role Bindings and Security Context Constraints
  128. ###############################################################################
  129. - name: Reconcile Cluster Roles and Cluster Role Bindings and Security Context Constraints
  130. hosts: oo_masters_to_config
  131. roles:
  132. - { role: openshift_cli }
  133. - { role: openshift_facts }
  134. vars:
  135. __master_shared_resource_viewer_file: "shared_resource_viewer_role.yaml"
  136. tasks:
  137. - name: Reconcile Cluster Roles
  138. command: >
  139. {{ openshift_client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  140. policy reconcile-cluster-roles --additive-only=true --confirm -o name
  141. register: reconcile_cluster_role_result
  142. when: openshift_version is version_compare('3.7','<')
  143. changed_when:
  144. - reconcile_cluster_role_result.stdout != ''
  145. - reconcile_cluster_role_result.rc == 0
  146. run_once: true
  147. - name: Reconcile Cluster Role Bindings
  148. command: >
  149. {{ openshift_client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  150. policy reconcile-cluster-role-bindings
  151. --exclude-groups=system:authenticated
  152. --exclude-groups=system:authenticated:oauth
  153. --exclude-groups=system:unauthenticated
  154. --exclude-users=system:anonymous
  155. --additive-only=true --confirm -o name
  156. when: openshift_version is version_compare('3.7','<')
  157. register: reconcile_bindings_result
  158. changed_when:
  159. - reconcile_bindings_result.stdout != ''
  160. - reconcile_bindings_result.rc == 0
  161. run_once: true
  162. - name: Reconcile Jenkins Pipeline Role Bindings
  163. command: >
  164. {{ openshift_client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig policy reconcile-cluster-role-bindings system:build-strategy-jenkinspipeline --confirm -o name
  165. run_once: true
  166. register: reconcile_jenkins_role_binding_result
  167. changed_when:
  168. - reconcile_jenkins_role_binding_result.stdout != ''
  169. - reconcile_jenkins_role_binding_result.rc == 0
  170. when:
  171. - openshift_version is version_compare('3.7','<')
  172. - when: openshift_upgrade_target is version_compare('3.7','<')
  173. block:
  174. - name: Retrieve shared-resource-viewer
  175. oc_obj:
  176. state: list
  177. kind: role
  178. name: "shared-resource-viewer"
  179. namespace: "openshift"
  180. register: objout
  181. - name: Determine if shared-resource-viewer is protected
  182. set_fact:
  183. __shared_resource_viewer_protected: true
  184. when:
  185. - "'results' in objout"
  186. - "'results' in objout['results']"
  187. - "'annotations' in objout['results']['results'][0]['metadata']"
  188. - "'openshift.io/reconcile-protect' in objout['results']['results'][0]['metadata']['annotations']"
  189. - "objout['results']['results'][0]['metadata']['annotations']['openshift.io/reconcile-protect'] == 'true'"
  190. - copy:
  191. src: "{{ item }}"
  192. dest: "/tmp/{{ item }}"
  193. with_items:
  194. - "{{ __master_shared_resource_viewer_file }}"
  195. when: __shared_resource_viewer_protected is not defined
  196. - name: Fixup shared-resource-viewer role
  197. oc_obj:
  198. state: present
  199. kind: role
  200. name: "shared-resource-viewer"
  201. namespace: "openshift"
  202. files:
  203. - "/tmp/{{ __master_shared_resource_viewer_file }}"
  204. delete_after: true
  205. when: __shared_resource_viewer_protected is not defined
  206. register: result
  207. retries: 3
  208. delay: 5
  209. until: result.rc == 0
  210. ignore_errors: true
  211. - name: Reconcile Security Context Constraints
  212. command: >
  213. {{ openshift_client_binary }} adm policy --config={{ openshift.common.config_base }}/master/admin.kubeconfig reconcile-sccs --confirm --additive-only=true -o name
  214. register: reconcile_scc_result
  215. changed_when:
  216. - reconcile_scc_result.stdout != ''
  217. - reconcile_scc_result.rc == 0
  218. run_once: true
  219. - name: Migrate storage post policy reconciliation
  220. command: >
  221. {{ openshift_client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  222. migrate storage --include=* --confirm
  223. run_once: true
  224. register: l_pb_upgrade_control_plane_post_upgrade_storage
  225. when: openshift_upgrade_post_storage_migration_enabled | default(true) | bool
  226. failed_when:
  227. - l_pb_upgrade_control_plane_post_upgrade_storage.rc != 0
  228. - openshift_upgrade_post_storage_migration_fatal | default(false) | bool
  229. - set_fact:
  230. reconcile_complete: True
  231. - name: Configure API aggregation on masters
  232. hosts: oo_masters_to_config
  233. serial: 1
  234. roles:
  235. - role: openshift_facts
  236. tasks:
  237. - include_tasks: tasks/wire_aggregator.yml
  238. ##############################################################################
  239. # Gate on reconcile
  240. ##############################################################################
  241. - name: Gate on reconcile
  242. hosts: localhost
  243. connection: local
  244. tasks:
  245. - set_fact:
  246. reconcile_completed: "{{ hostvars
  247. | lib_utils_oo_select_keys(groups.oo_masters_to_config)
  248. | lib_utils_oo_collect('inventory_hostname', {'reconcile_complete': true}) }}"
  249. - set_fact:
  250. reconcile_failed: "{{ groups.oo_masters_to_config | difference(reconcile_completed) | list }}"
  251. - fail:
  252. msg: "Upgrade cannot continue. The following masters did not finish reconciling: {{ reconcile_failed | join(',') }}"
  253. when: reconcile_failed | length > 0
  254. - name: Drain and upgrade master nodes
  255. # There is no need to update nodes in the middle of double upgrade
  256. # This would skip node update to 3.8 during 3.7->3.9 upgrade
  257. hosts: "{{ l_double_upgrade_cp | default(False) | ternary('all:!all', 'oo_masters_to_config:&oo_nodes_to_upgrade') }}"
  258. # This var must be set with -e on invocation, as it is not a per-host inventory var
  259. # and is evaluated early. Values such as "20%" can also be used.
  260. serial: "{{ openshift_upgrade_control_plane_nodes_serial | default(1) }}"
  261. max_fail_percentage: "{{ openshift_upgrade_control_plane_nodes_max_fail_percentage | default(0) }}"
  262. pre_tasks:
  263. - name: Load lib_openshift modules
  264. import_role:
  265. name: lib_openshift
  266. # TODO: To better handle re-trying failed upgrades, it would be nice to check if the node
  267. # or docker actually needs an upgrade before proceeding. Perhaps best to save this until
  268. # we merge upgrade functionality into the base roles and a normal config.yml playbook run.
  269. - name: Mark node unschedulable
  270. oc_adm_manage_node:
  271. node: "{{ openshift.node.nodename | lower }}"
  272. schedulable: False
  273. delegate_to: "{{ groups.oo_first_master.0 }}"
  274. retries: 10
  275. delay: 5
  276. register: node_unschedulable
  277. until: node_unschedulable is succeeded
  278. - name: Drain Node for Kubelet upgrade
  279. command: >
  280. {{ hostvars[groups.oo_first_master.0]['first_master_client_binary'] }} adm drain {{ openshift.node.nodename | lower }}
  281. --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  282. --force --delete-local-data --ignore-daemonsets
  283. --timeout={{ openshift_upgrade_nodes_drain_timeout | default(0) }}s
  284. delegate_to: "{{ groups.oo_first_master.0 }}"
  285. register: l_upgrade_control_plane_drain_result
  286. until: not (l_upgrade_control_plane_drain_result is failed)
  287. retries: "{{ 1 if ( openshift_upgrade_nodes_drain_timeout | default(0) | int ) == 0 else 0 }}"
  288. delay: 5
  289. failed_when:
  290. - l_upgrade_control_plane_drain_result is failed
  291. - openshift_upgrade_nodes_drain_timeout | default(0) | int == 0
  292. roles:
  293. - openshift_facts
  294. post_tasks:
  295. - import_role:
  296. name: openshift_node
  297. tasks_from: upgrade_pre.yml
  298. - import_role:
  299. name: openshift_node
  300. tasks_from: upgrade.yml
  301. - import_role:
  302. name: openshift_manage_node
  303. tasks_from: config.yml
  304. vars:
  305. openshift_master_host: "{{ groups.oo_first_master.0 }}"
  306. openshift_manage_node_is_master: true