# upgrade.yml
---
  # Play: apply the openshift_facts role to every host in the masters group.
  - hosts: masters
    name: Load master facts
    roles:
      - role: openshift_facts
  # Play: sanity check on the first master that stops the run early when a
  # multi-master inventory is not configured for pacemaker.
  - hosts: masters[0]
    name: Verify upgrade can proceed
    gather_facts: false
    vars:
      # True when the masters group contains more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      # Pacemaker is currently the only supported upgrade path for multiple
      # masters; an unset cluster method is rejected as well.
      - fail:
          msg: "openshift_master_cluster_method must be set to 'pacemaker'"
        when: >-
          (openshift_master_ha | bool)
          and (openshift_master_cluster_method | default('') != 'pacemaker')
  # Play: run the bundled pre-upgrade check script on the first master.
  - hosts: masters[0]
    name: Run pre-upgrade checks on first master
    tasks:
      # When the script exits with an error, ansible prints its default
      # stdout/stderr, which carries the details the user needs.
      - script: files/pre-upgrade-check
  # Play: build the in-memory "etcd_hosts" group that the backup play targets.
  # Which hosts are added depends on the first master's embedded_etcd fact.
  - name: Evaluate etcd_hosts
    hosts: localhost
    tasks:
      # Embedded etcd: only the first master is added.
      - name: Evaluate etcd hosts
        add_host:
          name: "{{ groups.masters.0 }}"
          groups: etcd_hosts
        when: hostvars[groups.masters.0].openshift.master.embedded_etcd | bool

      # External etcd: every host of the inventory's "etcd" group is added.
      # The loop source is a full Jinja expression rather than a bare variable
      # name, and falls back to an empty list so an inventory without an
      # "etcd" group does not break loop evaluation.
      - name: Evaluate etcd hosts
        add_host:
          name: "{{ item }}"
          groups: etcd_hosts
        with_items: "{{ groups.etcd | default([]) }}"
        when: not hostvars[groups.masters.0].openshift.master.embedded_etcd | bool
  # Play: back up the etcd data directory on every host of the etcd_hosts
  # group. For embedded etcd the play first verifies that the data dir has
  # enough free space to hold the backup.
  - name: Backup etcd
    hosts: etcd_hosts
    vars:
      embedded_etcd: "{{ openshift.master.embedded_etcd }}"
      # Backed by a pipe lookup, so the date command runs again on every
      # reference. The tasks below therefore resolve it exactly once via
      # set_fact instead of referencing it repeatedly.
      timestamp: "{{ lookup('pipe', 'date +%Y%m%d%H%M%S') }}"
    roles:
      - openshift_facts
    tasks:
      - stat:
          path: /var/lib/openshift
        register: var_lib_openshift

      - stat:
          path: /var/lib/origin
        register: var_lib_origin

      # Only link when the old directory exists and the new path is free.
      - name: Create origin symlink if necessary
        file:
          src: /var/lib/openshift/
          dest: /var/lib/origin
          state: link
        when: var_lib_openshift.stat.exists and not var_lib_origin.stat.exists

      - name: Check available disk space for etcd backup
        # We assume to be using the data dir for all backups.
        shell: >
          df --output=avail -k {{ openshift.common.data_dir }} | tail -n 1
        register: avail_disk

      - name: Check current embedded etcd disk usage
        shell: >
          du -k {{ openshift.master.etcd_data_dir }} | tail -n 1 | cut -f1
        register: etcd_disk_usage
        when: embedded_etcd | bool

      - name: Abort if insufficient disk space for etcd backup
        fail:
          msg: >
            {{ etcd_disk_usage.stdout }} Kb disk space required for etcd backup,
            {{ avail_disk.stdout }} Kb available.
        when: (embedded_etcd | bool) and (etcd_disk_usage.stdout|int > avail_disk.stdout|int)

      - name: Install etcd (for etcdctl)
        yum:
          pkg: etcd
          state: latest

      # Resolve the timestamped directory once so that the directory that is
      # created and the directory that is reported are guaranteed to match.
      - name: Pin etcd backup directory
        set_fact:
          etcd_backup_dir: "{{ openshift.common.data_dir }}/etcd-backup-{{ timestamp }}"

      - name: Generate etcd backup
        command: >
          etcdctl backup --data-dir={{ openshift.master.etcd_data_dir }}
          --backup-dir={{ etcd_backup_dir }}

      - name: Display location of etcd backup
        debug:
          msg: "Etcd backup created in {{ etcd_backup_dir }}"
  # Play: after the openshift_facts role has run on each OSEv3 host, store the
  # requested deployment_type as a local fact under the "common" role.
  - hosts: OSEv3
    name: Update deployment type
    roles:
      - role: openshift_facts
    post_tasks:
      - openshift_facts:
          role: common
          local_facts:
            deployment_type: "{{ deployment_type }}"
  # Play: on the first master, determine the installed and available package
  # versions and abort when the requested upgrade cannot be performed.
  # Facts set here (g_aos_versions, g_new_version) live on the first master.
  - name: Perform upgrade version checking
    hosts: masters[0]
    tasks:
      - name: Clean yum cache
        command: yum clean all

      - name: Determine available versions
        script: files/versions.sh {{ openshift.common.service_type }} openshift
        register: g_versions_result

      # The script's stdout is parsed as YAML; the tasks below read its
      # curr_version and avail_version keys.
      - set_fact:
          g_aos_versions: "{{ g_versions_result.stdout | from_yaml }}"

      # Target version without the release suffix: the available version when
      # there is one, otherwise the currently installed version.
      - set_fact:
          g_new_version: "{{ g_aos_versions.curr_version.split('-', 1).0 if g_aos_versions.avail_version is none else g_aos_versions.avail_version.split('-', 1).0 }}"

      - fail:
          msg: This playbook requires Origin 1.0.6 or later
        when: deployment_type == 'origin' and g_aos_versions.curr_version | version_compare('1.0.6','<')

      # 'atomic-enterprise' is the spelling the later plays of this file test
      # for, so it is accepted here too; otherwise those deployments would
      # silently skip both guards below.
      # NOTE(review): 'atomic-openshift' is kept for backward compatibility; it
      # looks like a service type rather than a deployment type - confirm.
      - fail:
          msg: This playbook requires Atomic OpenShift 3.0.2 or later
        when: deployment_type in ['openshift-enterprise', 'atomic-enterprise', 'atomic-openshift'] and g_aos_versions.curr_version | version_compare('3.0.2','<')

      - fail:
          msg: Atomic OpenShift 3.1 packages not found
        when: deployment_type in ['openshift-enterprise', 'atomic-enterprise', 'atomic-openshift'] and g_aos_versions.curr_version | version_compare('3.0.2.900','<') and (g_aos_versions.avail_version is none or g_aos_versions.avail_version | version_compare('3.0.2.900','<'))

      # Deployment type 'enterprise' is no longer valid if we're upgrading to
      # 3.1 or beyond (still valid for 3.0.x to 3.0.y however). Using the
      # global deployment_type here as we're checking what was requested by the
      # upgrade, not the current type on the system. The comparison uses the
      # target version (g_new_version): the installed version is still the
      # pre-upgrade one at this point and would let a 3.0 -> 3.1 run through.
      - fail:
          msg: "Deployment type enterprise not supported for upgrade"
        when: deployment_type == "enterprise" and g_new_version | version_compare('3.1', '>=')
  # Play: upgrade kernel and master packages on every master, migrate the
  # master configuration, and record the per-host certificate facts that the
  # certificate plays read later.
  - name: Upgrade masters
    hosts: masters
    vars:
      # Optional package version suffix appended to the package name.
      openshift_version: "{{ openshift_pkg_version | default('') }}"
    tasks:
      - name: Upgrade to latest available kernel
        yum:
          pkg: kernel
          state: latest

      - name: Upgrade master packages
        command: yum update -y {{ openshift.common.service_type }}-master{{ openshift_version }}

      - name: Ensure python-yaml present for config upgrade
        yum:
          pkg: PyYAML
          state: present

      # The version facts are set only on the first master by the version
      # checking play, so they are read through hostvars; referencing them
      # directly is undefined on every other master. The target version
      # (g_new_version) is used because the recorded curr_version is the
      # version that was installed before the package upgrade above.
      - name: Upgrade master configuration
        openshift_upgrade_config:
          from_version: '3.0'
          to_version: '3.1'
          role: master
          config_base: "{{ hostvars[inventory_hostname].openshift.common.config_base }}"
        when: deployment_type in ['openshift-enterprise', 'atomic-enterprise'] and hostvars[groups.masters.0].g_new_version | version_compare('3.1', '>=')

      # Facts read by the certificate generation and sync plays.
      - set_fact:
          master_certs_missing: True
          master_cert_subdir: master-{{ openshift.common.hostname }}
          master_cert_config_dir: "{{ openshift.common.config_base }}/master"
  # Play: create a scratch directory on the control host; its path is
  # registered as g_master_mktemp and read by later plays via hostvars.
  - hosts: localhost
    name: Create temp directory for syncing certs
    gather_facts: false
    tasks:
      - name: Create local temp directory for syncing certs
        local_action: command mktemp -d /tmp/openshift-ansible-XXXXXXX
        changed_when: false
        register: g_master_mktemp
  # Play: on the first master, generate certificates for the other masters,
  # pack each master's certificate directory into a tarball and fetch the
  # tarballs into the local sync directory.
  - name: Generate missing master certificates
    hosts: masters[0]
    vars:
      master_hostnames: "{{ hostvars
                            | oo_select_keys(groups.masters)
                            | oo_collect('openshift.common.all_hostnames')
                            | oo_flatten | unique }}"
      master_generated_certs_dir: "{{ openshift.common.config_base }}/generated-configs"
      # The first master is removed from the list of host names BEFORE the
      # hostvars are selected. Applying difference() to the selected hostvars
      # (mappings) against a host name can never match, which left the first
      # master in the list even though its tarball is never unpacked.
      masters_needing_certs: "{{ hostvars
                                 | oo_select_keys(groups.masters | difference([groups.masters.0])) }}"
      sync_tmpdir: "{{ hostvars.localhost.g_master_mktemp.stdout }}"
      openshift_deployment_type: "{{ deployment_type }}"
    roles:
      - openshift_master_certificates
    post_tasks:
      # NOTE(review): no play in this file creates the oo_etcd_to_config
      # group; confirm it is provided by the caller, otherwise this task is
      # always skipped.
      - name: Remove generated etcd client certs when using external etcd
        file:
          path: "{{ master_generated_certs_dir }}/{{ item.0.master_cert_subdir }}/{{ item.1 }}"
          state: absent
        when: groups.oo_etcd_to_config is defined and groups.oo_etcd_to_config
        with_nested:
          - "{{ masters_needing_certs }}"
          - - master.etcd-client.crt
            - master.etcd-client.key

      # Loop sources are full Jinja expressions rather than bare variable
      # names.
      - name: Create a tarball of the master certs
        command: >
          tar -czvf {{ master_generated_certs_dir }}/{{ item.master_cert_subdir }}.tgz
          -C {{ master_generated_certs_dir }}/{{ item.master_cert_subdir }} .
        with_items: "{{ masters_needing_certs }}"

      - name: Retrieve the master cert tarball from the master
        fetch:
          src: "{{ master_generated_certs_dir }}/{{ item.master_cert_subdir }}.tgz"
          dest: "{{ sync_tmpdir }}/"
          flat: yes
          fail_on_missing: yes
          validate_checksum: yes
        with_items: "{{ masters_needing_certs }}"
  # Play: unpack the fetched certificate tarball on every master except the
  # first one, then restart the master service when there is a single master.
  - hosts: masters
    name: Sync certs and restart masters post configuration change
    vars:
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
      sync_tmpdir: "{{ hostvars.localhost.g_master_mktemp.stdout }}"
    tasks:
      - name: Unarchive the tarball on the master
        when: inventory_hostname != groups.masters.0
        unarchive:
          src: "{{ sync_tmpdir }}/{{ master_cert_subdir }}.tgz"
          dest: "{{ master_cert_config_dir }}"

      # Skipped for multi-master setups.
      - name: Restart master services
        when: not openshift_master_ha | bool
        service:
          name: "{{ openshift.common.service_type}}-master"
          state: restarted
  # Play: for multi-master setups, destroy the existing pcs cluster from the
  # first master when a corosync configuration file is present.
  - hosts: masters[0]
    name: Destroy cluster
    vars:
      openshift_deployment_type: "{{ deployment_type }}"
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    pre_tasks:
      - name: Check for configured cluster
        when: openshift_master_ha | bool
        stat:
          path: /etc/corosync/corosync.conf
        register: corosync_conf

      - name: Destroy cluster
        when: openshift_master_ha | bool and corosync_conf.stat.exists == true
        command: pcs cluster destroy --all
  # Play: make sure the pcsd service is started on every master when more
  # than one master is configured.
  - hosts: masters
    name: Start pcsd on masters
    vars:
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      - name: Start pcsd
        when: openshift_master_ha | bool
        service:
          name: pcsd
          state: started
  # Play: apply the openshift_master_cluster role on the first master, only
  # when more than one master is configured.
  - hosts: masters[0]
    name: Re-create cluster
    vars:
      # Space-separated list of all master host names.
      omc_cluster_hosts: "{{ groups.masters | join(' ') }}"
      openshift_deployment_type: "{{ deployment_type }}"
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    roles:
      - role: openshift_master_cluster
        when: openshift_master_ha | bool
  # Play: remove the scratch directory registered earlier as g_master_mktemp.
  # The removal is never reported as a change.
  - hosts: localhost
    name: Delete temporary directory on localhost
    gather_facts: false
    tasks:
      - file:
          name: "{{ g_master_mktemp.stdout }}"
          state: absent
        changed_when: false
  # Play: update the node package on every node and restart the node service.
  - hosts: nodes
    name: Upgrade nodes
    vars:
      # Optional package version suffix appended to the package name.
      openshift_version: "{{ openshift_pkg_version | default('') }}"
    roles:
      - role: openshift_facts
    tasks:
      - name: Upgrade node packages
        command: yum update -y {{ openshift.common.service_type }}-node{{ openshift_version }}

      - name: Restart node services
        service:
          name: "{{ openshift.common.service_type }}-node"
          state: restarted
  # Play: reconcile cluster roles on the first master, and reconcile the
  # cluster role bindings when the target version is new enough for the
  # deployment type.
  - hosts: masters[0]
    name: Update cluster policy and policy bindings
    vars:
      # Bindings are reconciled for origin above 1.0.6 ...
      origin_reconcile_bindings: "{{ deployment_type == 'origin' and g_new_version | version_compare('1.0.6', '>') }}"
      # ... and for the enterprise deployment types above 3.0.2.
      ent_reconcile_bindings: "{{ deployment_type in ['openshift-enterprise', 'atomic-enterprise'] and g_new_version | version_compare('3.0.2','>') }}"
    tasks:
      - name: oadm policy reconcile-cluster-roles --confirm
        command: >
          {{ openshift.common.admin_binary}}
          --config={{ openshift.common.config_base }}/master/admin.kubeconfig
          policy reconcile-cluster-roles --confirm

      - name: oadm policy reconcile-cluster-role-bindings --confirm
        when: (origin_reconcile_bindings | bool) or (ent_reconcile_bindings | bool)
        command: >
          {{ openshift.common.admin_binary}}
          --config={{ openshift.common.config_base }}/master/admin.kubeconfig
          policy reconcile-cluster-role-bindings
          --exclude-groups=system:authenticated
          --exclude-groups=system:unauthenticated
          --exclude-users=system:anonymous
          --additive-only=true --confirm
  # Play: restart the master service on every master when only a single
  # master is configured; multi-master setups skip this task.
  - hosts: masters
    name: Restart masters post reconcile
    vars:
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      - name: Restart master services
        when: not openshift_master_ha | bool
        service:
          name: "{{ openshift.common.service_type}}-master"
          state: restarted
  # Play: for multi-master setups, restart the "master" pcs resource from the
  # first master and wait until port 8443 answers on the cluster VIP.
  - hosts: masters[0]
    name: Restart cluster post reconcile
    vars:
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      - name: Restart master cluster
        when: openshift_master_ha | bool
        command: pcs resource restart master

      - name: Wait for the clustered master service to be available
        when: openshift_master_ha | bool
        wait_for:
          host: "{{ openshift_master_cluster_vip }}"
          port: 8443
          state: started
          delay: 90
          timeout: 180
  # Play: when the default router and/or docker-registry deployment configs
  # exist in the "default" namespace, patch them to the new spec and image
  # version. Every dc patch names the namespace explicitly so it targets the
  # same object the existence check looked up, independent of the namespace
  # selected in admin.kubeconfig.
  - name: Upgrade default router and registry
    hosts: masters[0]
    vars:
      # Image names are derived from the registry_url template by filling in
      # the component name and the target version prefixed with "v".
      registry_image: "{{ openshift.master.registry_url | replace( '${component}', 'docker-registry' ) | replace ( '${version}', 'v' + g_new_version ) }}"
      router_image: "{{ openshift.master.registry_url | replace( '${component}', 'haproxy-router' ) | replace ( '${version}', 'v' + g_new_version ) }}"
      oc_cmd: "{{ openshift.common.client_binary }} --config={{ openshift.common.config_base }}/master/admin.kubeconfig"
    tasks:
      # A non-zero rc is tolerated here; it only means the later router tasks
      # are skipped.
      - name: Check for default router
        command: >
          {{ oc_cmd }} get -n default dc/router
        register: _default_router
        failed_when: false
        changed_when: false

      - name: Check for allowHostNetwork and allowHostPorts
        when: _default_router.rc == 0
        shell: >
          {{ oc_cmd }} get -o yaml scc/privileged | /usr/bin/grep -e allowHostPorts -e allowHostNetwork
        register: _scc

      # Only patch when at least one of the two settings is reported as false.
      - name: Grant allowHostNetwork and allowHostPorts
        when:
          - _default_router.rc == 0
          - "'false' in _scc.stdout"
        command: >
          {{ oc_cmd }} patch scc/privileged -p '{"allowHostPorts":true,"allowHostNetwork":true}' --loglevel=9

      - name: Update deployment config to 1.0.4/3.0.1 spec
        when: _default_router.rc == 0
        command: >
          {{ oc_cmd }} patch dc/router -n default -p
          '{"spec":{"strategy":{"rollingParams":{"updatePercent":-10},"spec":{"serviceAccount":"router","serviceAccountName":"router"}}}}'

      - name: Switch to hostNetwork=true
        when: _default_router.rc == 0
        command: >
          {{ oc_cmd }} patch dc/router -n default -p '{"spec":{"template":{"spec":{"hostNetwork":true}}}}'

      - name: Update router image to current version
        when: _default_router.rc == 0
        command: >
          {{ oc_cmd }} patch dc/router -n default -p
          '{"spec":{"template":{"spec":{"containers":[{"name":"router","image":"{{ router_image }}"}]}}}}'

      # A non-zero rc is tolerated here; it only means the registry patch is
      # skipped.
      - name: Check for default registry
        command: >
          {{ oc_cmd }} get -n default dc/docker-registry
        register: _default_registry
        failed_when: false
        changed_when: false

      - name: Update registry image to current version
        when: _default_registry.rc == 0
        command: >
          {{ oc_cmd }} patch dc/docker-registry -n default -p
          '{"spec":{"template":{"spec":{"containers":[{"name":"registry","image":"{{ registry_image }}"}]}}}}'
  # Play: apply the openshift_examples role on the first master with the
  # import command set to "update".
  - hosts: masters[0]
    name: Update image streams and templates
    vars:
      openshift_deployment_type: "{{ deployment_type }}"
      openshift_examples_import_command: "update"
    roles:
      - role: openshift_examples