upgrade_control_plane.yml 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341
  1. ---
  2. ###############################################################################
  3. # Upgrade Masters
  4. ###############################################################################
  5. # oc adm migrate storage should be run prior to etcd v3 upgrade
  6. # See: https://github.com/openshift/origin/pull/14625#issuecomment-308467060
  7. - name: Pre master upgrade - Upgrade all storage
  8. hosts: oo_first_master
  9. tasks:
  10. - name: Upgrade all storage
  11. command: >
  12. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  13. migrate storage --include=* --confirm
  14. register: l_pb_upgrade_control_plane_pre_upgrade_storage
  15. when: openshift_upgrade_pre_storage_migration_enabled | default(true,true) | bool
  16. failed_when:
  17. - openshift_upgrade_pre_storage_migration_enabled | default(true,true) | bool
  18. - l_pb_upgrade_control_plane_pre_upgrade_storage.rc != 0
  19. - openshift_upgrade_pre_storage_migration_fatal | default(true,true) | bool
  20. # If facts cache were for some reason deleted, this fact may not be set, and if not set
  21. # it will always default to true. This causes problems for the etcd data dir fact detection
  22. # so we must first make sure this is set correctly before attempting the backup.
  23. - name: Set master embedded_etcd fact
  24. hosts: oo_masters_to_config
  25. roles:
  26. - openshift_facts
  27. tasks:
  28. - openshift_facts:
  29. role: master
  30. local_facts:
  31. embedded_etcd: "{{ groups.oo_etcd_to_config | default([]) | length == 0 }}"
  32. debug_level: "{{ openshift_master_debug_level | default(openshift.common.debug_level | default(2)) }}"
  33. - name: Upgrade and backup etcd
  34. include: ./etcd/main.yml
  35. # Create service signer cert when missing. Service signer certificate
  36. # is added to master config in the master_config_upgrade hook.
  37. - name: Determine if service signer cert must be created
  38. hosts: oo_first_master
  39. tasks:
  40. - name: Determine if service signer certificate must be created
  41. stat:
  42. path: "{{ openshift.common.config_base }}/master/service-signer.crt"
  43. register: service_signer_cert_stat
  44. changed_when: false
  45. - include: create_service_signer_cert.yml
  46. # Set openshift_master_facts separately. In order to reconcile
  47. # admission_config's, we currently must run openshift_master_facts and
  48. # then run openshift_facts.
  49. - name: Set OpenShift master facts
  50. hosts: oo_masters_to_config
  51. roles:
  52. - openshift_master_facts
  53. # The main master upgrade play. Should handle all changes to the system in one pass, with
  54. # support for optional hooks to be defined.
  55. - name: Upgrade master
  56. hosts: oo_masters_to_config
  57. vars:
  58. openshift_master_ha: "{{ groups.oo_masters_to_config | length > 1 }}"
  59. serial: 1
  60. handlers:
  61. - include: ../../../../roles/openshift_master/handlers/main.yml
  62. static: yes
  63. roles:
  64. - openshift_facts
  65. - lib_utils
  66. post_tasks:
  67. # Run the pre-upgrade hook if defined:
  68. - debug: msg="Running master pre-upgrade hook {{ openshift_master_upgrade_pre_hook }}"
  69. when: openshift_master_upgrade_pre_hook is defined
  70. - include: "{{ openshift_master_upgrade_pre_hook }}"
  71. when: openshift_master_upgrade_pre_hook is defined
  72. - include: rpm_upgrade.yml component=master
  73. when: not openshift.common.is_containerized | bool
  74. - include_vars: ../../../../roles/openshift_master_facts/vars/main.yml
  75. - include: upgrade_scheduler.yml
  76. - include: "{{ master_config_hook }}"
  77. when: master_config_hook is defined
  78. - include_vars: ../../../../roles/openshift_master/vars/main.yml
  79. - name: Remove any legacy systemd units
  80. include: ../../../../roles/openshift_master/tasks/clean_systemd_units.yml
  81. - name: Update systemd units
  82. include: ../../../../roles/openshift_master/tasks/systemd_units.yml
  83. - name: Check for ca-bundle.crt
  84. stat:
  85. path: "{{ openshift.common.config_base }}/master/ca-bundle.crt"
  86. register: ca_bundle_stat
  87. failed_when: false
  88. - name: Check for ca.crt
  89. stat:
  90. path: "{{ openshift.common.config_base }}/master/ca.crt"
  91. register: ca_crt_stat
  92. failed_when: false
  93. - name: Migrate ca.crt to ca-bundle.crt
  94. command: mv ca.crt ca-bundle.crt
  95. args:
  96. chdir: "{{ openshift.common.config_base }}/master"
  97. when: ca_crt_stat.stat.isreg and not ca_bundle_stat.stat.exists
  98. - name: Link ca.crt to ca-bundle.crt
  99. file:
  100. src: "{{ openshift.common.config_base }}/master/ca-bundle.crt"
  101. path: "{{ openshift.common.config_base }}/master/ca.crt"
  102. state: link
  103. when: ca_crt_stat.stat.isreg and not ca_bundle_stat.stat.exists
  104. - name: Update oreg value
  105. yedit:
  106. src: "{{ openshift.common.config_base }}/master/master-config.yaml"
  107. key: 'imageConfig.format'
  108. value: "{{ oreg_url | default(oreg_url_master) }}"
  109. when: oreg_url is defined or oreg_url_master is defined
  110. # Run the upgrade hook prior to restarting services/system if defined:
  111. - debug: msg="Running master upgrade hook {{ openshift_master_upgrade_hook }}"
  112. when: openshift_master_upgrade_hook is defined
  113. - include: "{{ openshift_master_upgrade_hook }}"
  114. when: openshift_master_upgrade_hook is defined
  115. - include: ../../openshift-master/restart_hosts.yml
  116. when: openshift.common.rolling_restart_mode == 'system'
  117. - include: ../../openshift-master/restart_services.yml
  118. when: openshift.common.rolling_restart_mode == 'services'
  119. # Run the post-upgrade hook if defined:
  120. - debug: msg="Running master post-upgrade hook {{ openshift_master_upgrade_post_hook }}"
  121. when: openshift_master_upgrade_post_hook is defined
  122. - include: "{{ openshift_master_upgrade_post_hook }}"
  123. when: openshift_master_upgrade_post_hook is defined
  124. - name: Post master upgrade - Upgrade clusterpolicies storage
  125. command: >
  126. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  127. migrate storage --include=clusterpolicies --confirm
  128. register: l_pb_upgrade_control_plane_post_upgrade_storage
  129. when: openshift_upgrade_post_storage_migration_enabled | default(true,true) | bool
  130. failed_when:
  131. - openshift_upgrade_post_storage_migration_enabled | default(true,true) | bool
  132. - l_pb_upgrade_control_plane_post_upgrade_storage.rc != 0
  133. - openshift_upgrade_post_storage_migration_fatal | default(false,true) | bool
  134. run_once: true
  135. delegate_to: "{{ groups.oo_first_master.0 }}"
  136. - set_fact:
  137. master_update_complete: True
  138. ##############################################################################
  139. # Gate on master update complete
  140. ##############################################################################
  141. - name: Gate on master update
  142. hosts: localhost
  143. connection: local
  144. become: no
  145. tasks:
  146. - set_fact:
  147. master_update_completed: "{{ hostvars
  148. | oo_select_keys(groups.oo_masters_to_config)
  149. | oo_collect('inventory_hostname', {'master_update_complete': true}) }}"
  150. - set_fact:
  151. master_update_failed: "{{ groups.oo_masters_to_config | difference(master_update_completed) }}"
  152. - fail:
  153. msg: "Upgrade cannot continue. The following masters did not finish updating: {{ master_update_failed | join(',') }}"
  154. when: master_update_failed | length > 0
  155. ###############################################################################
  156. # Reconcile Cluster Roles, Cluster Role Bindings and Security Context Constraints
  157. ###############################################################################
  158. - name: Reconcile Cluster Roles and Cluster Role Bindings and Security Context Constraints
  159. hosts: oo_masters_to_config
  160. roles:
  161. - { role: openshift_cli }
  162. vars:
  163. origin_reconcile_bindings: "{{ deployment_type == 'origin' and openshift_version | version_compare('1.0.6', '>') }}"
  164. ent_reconcile_bindings: true
  165. openshift_docker_hosted_registry_network: "{{ hostvars[groups.oo_first_master.0].openshift.common.portal_net }}"
  166. # Another spot where we assume docker is running and do not want to accidentally trigger an unsafe
  167. # restart.
  168. skip_docker_role: True
  169. tasks:
  170. - name: Reconcile Cluster Roles
  171. command: >
  172. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  173. policy reconcile-cluster-roles --additive-only=true --confirm -o name
  174. register: reconcile_cluster_role_result
  175. changed_when:
  176. - reconcile_cluster_role_result.stdout != ''
  177. - reconcile_cluster_role_result.rc == 0
  178. run_once: true
  179. - name: Reconcile Cluster Role Bindings
  180. command: >
  181. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  182. policy reconcile-cluster-role-bindings
  183. --exclude-groups=system:authenticated
  184. --exclude-groups=system:authenticated:oauth
  185. --exclude-groups=system:unauthenticated
  186. --exclude-users=system:anonymous
  187. --additive-only=true --confirm -o name
  188. when: origin_reconcile_bindings | bool or ent_reconcile_bindings | bool
  189. register: reconcile_bindings_result
  190. changed_when:
  191. - reconcile_bindings_result.stdout != ''
  192. - reconcile_bindings_result.rc == 0
  193. run_once: true
  194. - name: Reconcile Jenkins Pipeline Role Bindings
  195. command: >
  196. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig policy reconcile-cluster-role-bindings system:build-strategy-jenkinspipeline --confirm -o name
  197. run_once: true
  198. register: reconcile_jenkins_role_binding_result
  199. changed_when:
  200. - reconcile_jenkins_role_binding_result.stdout != ''
  201. - reconcile_jenkins_role_binding_result.rc == 0
  202. when: openshift.common.version_gte_3_4_or_1_4 | bool
  203. - name: Reconcile Security Context Constraints
  204. command: >
  205. {{ openshift.common.client_binary }} adm policy --config={{ openshift.common.config_base }}/master/admin.kubeconfig reconcile-sccs --confirm --additive-only=true -o name
  206. register: reconcile_scc_result
  207. changed_when:
  208. - reconcile_scc_result.stdout != ''
  209. - reconcile_scc_result.rc == 0
  210. run_once: true
  211. - name: Migrate storage post policy reconciliation
  212. command: >
  213. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  214. migrate storage --include=* --confirm
  215. run_once: true
  216. register: l_pb_upgrade_control_plane_post_upgrade_storage
  217. when: openshift_upgrade_post_storage_migration_enabled | default(true,true) | bool
  218. failed_when:
  219. - openshift_upgrade_post_storage_migration_enabled | default(true,true) | bool
  220. - l_pb_upgrade_control_plane_post_upgrade_storage.rc != 0
  221. - openshift_upgrade_post_storage_migration_fatal | default(false,true) | bool
  222. - set_fact:
  223. reconcile_complete: True
  224. ##############################################################################
  225. # Gate on reconcile
  226. ##############################################################################
  227. - name: Gate on reconcile
  228. hosts: localhost
  229. connection: local
  230. become: no
  231. tasks:
  232. - set_fact:
  233. reconcile_completed: "{{ hostvars
  234. | oo_select_keys(groups.oo_masters_to_config)
  235. | oo_collect('inventory_hostname', {'reconcile_complete': true}) }}"
  236. - set_fact:
  237. reconcile_failed: "{{ groups.oo_masters_to_config | difference(reconcile_completed) }}"
  238. - fail:
  239. msg: "Upgrade cannot continue. The following masters did not finish reconciling: {{ reconcile_failed | join(',') }}"
  240. when: reconcile_failed | length > 0
  241. - name: Upgrade Docker on dedicated containerized etcd hosts
  242. hosts: oo_etcd_to_config:!oo_nodes_to_upgrade
  243. serial: 1
  244. any_errors_fatal: true
  245. roles:
  246. - openshift_facts
  247. tasks:
  248. - include: docker/upgrade.yml
  249. when: l_docker_upgrade is defined and l_docker_upgrade | bool and not openshift.common.is_atomic | bool
  250. - name: Drain and upgrade master nodes
  251. hosts: oo_masters_to_config:&oo_nodes_to_upgrade
  252. # This var must be set with -e on invocation, as it is not a per-host inventory var
  253. # and is evaluated early. Values such as "20%" can also be used.
  254. serial: "{{ openshift_upgrade_control_plane_nodes_serial | default(1) }}"
  255. max_fail_percentage: "{{ openshift_upgrade_control_plane_nodes_max_fail_percentage | default(0) }}"
  256. pre_tasks:
  257. - name: Load lib_openshift modules
  258. include_role:
  259. name: lib_openshift
  260. # TODO: To better handle re-trying failed upgrades, it would be nice to check if the node
  261. # or docker actually needs an upgrade before proceeding. Perhaps best to save this until
  262. # we merge upgrade functionality into the base roles and a normal config.yml playbook run.
  263. - name: Mark node unschedulable
  264. oc_adm_manage_node:
  265. node: "{{ openshift.node.nodename | lower }}"
  266. schedulable: False
  267. delegate_to: "{{ groups.oo_first_master.0 }}"
  268. retries: 10
  269. delay: 5
  270. register: node_unschedulable
  271. until: node_unschedulable|succeeded
  272. - name: Drain Node for Kubelet upgrade
  273. command: >
  274. {{ hostvars[groups.oo_first_master.0].openshift.common.admin_binary }} drain {{ openshift.node.nodename | lower }} --config={{ openshift.common.config_base }}/master/admin.kubeconfig --force --delete-local-data --ignore-daemonsets
  275. delegate_to: "{{ groups.oo_first_master.0 }}"
  276. register: l_upgrade_control_plane_drain_result
  277. until: not l_upgrade_control_plane_drain_result | failed
  278. retries: 60
  279. delay: 60
  280. roles:
  281. - lib_openshift
  282. - openshift_facts
  283. - docker
  284. - openshift_node_dnsmasq
  285. - openshift_node_upgrade
  286. post_tasks:
  287. - name: Set node schedulability
  288. oc_adm_manage_node:
  289. node: "{{ openshift.node.nodename | lower }}"
  290. schedulable: True
  291. delegate_to: "{{ groups.oo_first_master.0 }}"
  292. retries: 10
  293. delay: 5
  294. register: node_schedulable
  295. until: node_schedulable|succeeded
  296. when: node_unschedulable|changed