upgrade_control_plane.yml 11 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295
  1. ---
  2. ###############################################################################
  3. # Upgrade Masters
  4. ###############################################################################
  5. - name: Evaluate additional groups for upgrade
  6. hosts: localhost
  7. connection: local
  8. become: no
  9. tasks:
  10. - name: Evaluate etcd_hosts_to_backup
  11. add_host:
  12. name: "{{ item }}"
  13. groups: etcd_hosts_to_backup
  14. with_items: "{{ groups.oo_etcd_to_config if groups.oo_etcd_to_config is defined and groups.oo_etcd_to_config | length > 0 else groups.oo_first_master }}"
  15. changed_when: False
  16. # If facts cache were for some reason deleted, this fact may not be set, and if not set
  17. # it will always default to true. This causes problems for the etcd data dir fact detection
  18. # so we must first make sure this is set correctly before attempting the backup.
  19. - name: Set master embedded_etcd fact
  20. hosts: oo_masters_to_config
  21. roles:
  22. - openshift_facts
  23. tasks:
  24. - openshift_facts:
  25. role: master
  26. local_facts:
  27. embedded_etcd: "{{ groups.oo_etcd_to_config | default([]) | length == 0 }}"
  28. debug_level: "{{ openshift_master_debug_level | default(openshift.common.debug_level | default(2)) }}"
  29. - name: Upgrade and backup etcd
  30. include: ./etcd/main.yml
  31. # Create service signer cert when missing. Service signer certificate
  32. # is added to master config in the master_config_upgrade hook.
  33. - name: Determine if service signer cert must be created
  34. hosts: oo_first_master
  35. tasks:
  36. - name: Determine if service signer certificate must be created
  37. stat:
  38. path: "{{ openshift.common.config_base }}/master/service-signer.crt"
  39. register: service_signer_cert_stat
  40. changed_when: false
  41. - include: create_service_signer_cert.yml
  42. # Set openshift_master_facts separately. In order to reconcile
  43. # admission_config's, we currently must run openshift_master_facts and
  44. # then run openshift_facts.
  45. - name: Set OpenShift master facts
  46. hosts: oo_masters_to_config
  47. roles:
  48. - openshift_master_facts
  49. # The main master upgrade play. Should handle all changes to the system in one pass, with
  50. # support for optional hooks to be defined.
  51. - name: Upgrade master
  52. hosts: oo_masters_to_config
  53. vars:
  54. openshift_master_ha: "{{ groups.oo_masters_to_config | length > 1 }}"
  55. serial: 1
  56. handlers:
  57. - include: ../../../../roles/openshift_master/handlers/main.yml
  58. static: yes
  59. roles:
  60. - openshift_facts
  61. post_tasks:
  62. # Run the pre-upgrade hook if defined:
  63. - debug: msg="Running master pre-upgrade hook {{ openshift_master_upgrade_pre_hook }}"
  64. when: openshift_master_upgrade_pre_hook is defined
  65. - include: "{{ openshift_master_upgrade_pre_hook }}"
  66. when: openshift_master_upgrade_pre_hook is defined
  67. - include: rpm_upgrade.yml component=master
  68. when: not openshift.common.is_containerized | bool
  69. - include_vars: ../../../../roles/openshift_master_facts/vars/main.yml
  70. - include: upgrade_scheduler.yml
  71. - include: "{{ master_config_hook }}"
  72. when: master_config_hook is defined
  73. - include_vars: ../../../../roles/openshift_master/vars/main.yml
  74. - name: Update systemd units
  75. include: ../../../../roles/openshift_master/tasks/systemd_units.yml
  76. - name: Check for ca-bundle.crt
  77. stat:
  78. path: "{{ openshift.common.config_base }}/master/ca-bundle.crt"
  79. register: ca_bundle_stat
  80. failed_when: false
  81. - name: Check for ca.crt
  82. stat:
  83. path: "{{ openshift.common.config_base }}/master/ca.crt"
  84. register: ca_crt_stat
  85. failed_when: false
  86. - name: Migrate ca.crt to ca-bundle.crt
  87. command: mv ca.crt ca-bundle.crt
  88. args:
  89. chdir: "{{ openshift.common.config_base }}/master"
  90. when: ca_crt_stat.stat.isreg and not ca_bundle_stat.stat.exists
  91. - name: Link ca.crt to ca-bundle.crt
  92. file:
  93. src: "{{ openshift.common.config_base }}/master/ca-bundle.crt"
  94. path: "{{ openshift.common.config_base }}/master/ca.crt"
  95. state: link
  96. when: ca_crt_stat.stat.isreg and not ca_bundle_stat.stat.exists
  97. # Run the upgrade hook prior to restarting services/system if defined:
  98. - debug: msg="Running master upgrade hook {{ openshift_master_upgrade_hook }}"
  99. when: openshift_master_upgrade_hook is defined
  100. - include: "{{ openshift_master_upgrade_hook }}"
  101. when: openshift_master_upgrade_hook is defined
  102. - include: ../../openshift-master/restart_hosts.yml
  103. when: openshift.common.rolling_restart_mode == 'system'
  104. - include: ../../openshift-master/restart_services.yml
  105. when: openshift.common.rolling_restart_mode == 'services'
  106. # Run the post-upgrade hook if defined:
  107. - debug: msg="Running master post-upgrade hook {{ openshift_master_upgrade_post_hook }}"
  108. when: openshift_master_upgrade_post_hook is defined
  109. - include: "{{ openshift_master_upgrade_post_hook }}"
  110. when: openshift_master_upgrade_post_hook is defined
  111. - set_fact:
  112. master_update_complete: True
  113. ##############################################################################
  114. # Gate on master update complete
  115. ##############################################################################
  116. - name: Gate on master update
  117. hosts: localhost
  118. connection: local
  119. become: no
  120. tasks:
  121. - set_fact:
  122. master_update_completed: "{{ hostvars
  123. | oo_select_keys(groups.oo_masters_to_config)
  124. | oo_collect('inventory_hostname', {'master_update_complete': true}) }}"
  125. - set_fact:
  126. master_update_failed: "{{ groups.oo_masters_to_config | difference(master_update_completed) }}"
  127. - fail:
  128. msg: "Upgrade cannot continue. The following masters did not finish updating: {{ master_update_failed | join(',') }}"
  129. when: master_update_failed | length > 0
  130. ###############################################################################
  131. # Reconcile Cluster Roles, Cluster Role Bindings and Security Context Constraints
  132. ###############################################################################
  133. - name: Reconcile Cluster Roles and Cluster Role Bindings and Security Context Constraints
  134. hosts: oo_masters_to_config
  135. roles:
  136. - { role: openshift_cli }
  137. vars:
  138. origin_reconcile_bindings: "{{ deployment_type == 'origin' and openshift_version | version_compare('1.0.6', '>') }}"
  139. ent_reconcile_bindings: true
  140. openshift_docker_hosted_registry_network: "{{ hostvars[groups.oo_first_master.0].openshift.common.portal_net }}"
  141. # Another spot where we assume docker is running and do not want to accidentally trigger an unsafe
  142. # restart.
  143. skip_docker_role: True
  144. tasks:
  145. - name: Reconcile Cluster Roles
  146. command: >
  147. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  148. policy reconcile-cluster-roles --additive-only=true --confirm -o name
  149. register: reconcile_cluster_role_result
  150. changed_when:
  151. - reconcile_cluster_role_result.stdout != ''
  152. - reconcile_cluster_role_result.rc == 0
  153. run_once: true
  154. - name: Reconcile Cluster Role Bindings
  155. command: >
  156. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  157. policy reconcile-cluster-role-bindings
  158. --exclude-groups=system:authenticated
  159. --exclude-groups=system:authenticated:oauth
  160. --exclude-groups=system:unauthenticated
  161. --exclude-users=system:anonymous
  162. --additive-only=true --confirm -o name
  163. when: origin_reconcile_bindings | bool or ent_reconcile_bindings | bool
  164. register: reconcile_bindings_result
  165. changed_when:
  166. - reconcile_bindings_result.stdout != ''
  167. - reconcile_bindings_result.rc == 0
  168. run_once: true
  169. - name: Reconcile Jenkins Pipeline Role Bindings
  170. command: >
  171. {{ openshift.common.client_binary }} adm --config={{ openshift.common.config_base }}/master/admin.kubeconfig policy reconcile-cluster-role-bindings system:build-strategy-jenkinspipeline --confirm -o name
  172. run_once: true
  173. register: reconcile_jenkins_role_binding_result
  174. changed_when:
  175. - reconcile_jenkins_role_binding_result.stdout != ''
  176. - reconcile_jenkins_role_binding_result.rc == 0
  177. when: openshift.common.version_gte_3_4_or_1_4 | bool
  178. - name: Reconcile Security Context Constraints
  179. command: >
  180. {{ openshift.common.client_binary }} adm policy reconcile-sccs --confirm --additive-only=true -o name
  181. register: reconcile_scc_result
  182. changed_when:
  183. - reconcile_scc_result.stdout != ''
  184. - reconcile_scc_result.rc == 0
  185. run_once: true
  186. - set_fact:
  187. reconcile_complete: True
  188. ##############################################################################
  189. # Gate on reconcile
  190. ##############################################################################
  191. - name: Gate on reconcile
  192. hosts: localhost
  193. connection: local
  194. become: no
  195. tasks:
  196. - set_fact:
  197. reconcile_completed: "{{ hostvars
  198. | oo_select_keys(groups.oo_masters_to_config)
  199. | oo_collect('inventory_hostname', {'reconcile_complete': true}) }}"
  200. - set_fact:
  201. reconcile_failed: "{{ groups.oo_masters_to_config | difference(reconcile_completed) }}"
  202. - fail:
  203. msg: "Upgrade cannot continue. The following masters did not finish reconciling: {{ reconcile_failed | join(',') }}"
  204. when: reconcile_failed | length > 0
  205. - name: Upgrade Docker on dedicated containerized etcd hosts
  206. hosts: oo_etcd_to_config:!oo_nodes_to_upgrade
  207. serial: 1
  208. any_errors_fatal: true
  209. roles:
  210. - openshift_facts
  211. tasks:
  212. - include: docker/upgrade.yml
  213. when: l_docker_upgrade is defined and l_docker_upgrade | bool and not openshift.common.is_atomic | bool
  214. - name: Drain and upgrade master nodes
  215. hosts: oo_masters_to_config:&oo_nodes_to_upgrade
  216. # This var must be set with -e on invocation, as it is not a per-host inventory var
  217. # and is evaluated early. Values such as "20%" can also be used.
  218. serial: "{{ openshift_upgrade_nodes_serial | default(1) }}"
  219. any_errors_fatal: true
  220. pre_tasks:
  221. - name: Load lib_openshift modules
  222. include_role:
  223. name: lib_openshift
  224. # TODO: To better handle re-trying failed upgrades, it would be nice to check if the node
  225. # or docker actually needs an upgrade before proceeding. Perhaps best to save this until
  226. # we merge upgrade functionality into the base roles and a normal config.yml playbook run.
  227. - name: Mark node unschedulable
  228. oadm_manage_node:
  229. node: "{{ openshift.node.nodename | lower }}"
  230. schedulable: False
  231. delegate_to: "{{ groups.oo_first_master.0 }}"
  232. retries: 10
  233. delay: 5
  234. register: node_unschedulable
  235. until: node_unschedulable|succeeded
  236. - name: Drain Node for Kubelet upgrade
  237. command: >
  238. {{ hostvars[groups.oo_first_master.0].openshift.common.admin_binary }} drain {{ openshift.node.nodename | lower }} --force --delete-local-data --ignore-daemonsets
  239. delegate_to: "{{ groups.oo_first_master.0 }}"
  240. roles:
  241. - lib_openshift
  242. - openshift_facts
  243. - docker
  244. - openshift_node_upgrade
  245. post_tasks:
  246. - name: Set node schedulability
  247. oadm_manage_node:
  248. node: "{{ openshift.node.nodename | lower }}"
  249. schedulable: True
  250. delegate_to: "{{ groups.oo_first_master.0 }}"
  251. retries: 10
  252. delay: 5
  253. register: node_schedulable
  254. until: node_schedulable|succeeded
  255. when: node_unschedulable|changed