# upgrade.yml
---
  # Applies the openshift_facts role to every master so that the `openshift`
  # fact tree is populated before later plays read it.
  - name: Load master facts
    hosts: masters
    roles:
      - role: openshift_facts
  # Pre-flight gate, evaluated on the first master only: rejects the
  # "enterprise" deployment type and, when more than one master is listed,
  # any cluster method other than pacemaker.
  - name: Verify upgrade can proceed
    hosts: masters[0]
    gather_facts: false
    vars:
      # True when the inventory's masters group has more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      # This looks at the deployment type the user asked for (the global
      # variable), not at what the host facts currently report.
      - fail:
          msg: "Deployment type enterprise not supported for upgrade"
        when: deployment_type == "enterprise"

      # Multi-master upgrades are only supported with pacemaker; an unset
      # cluster method is treated the same as a non-pacemaker one.
      - fail:
          msg: "openshift_master_cluster_method must be set to 'pacemaker'"
        when:
          - openshift_master_ha | bool
          - openshift_master_cluster_method | default('') != 'pacemaker'
  # Copies files/pre-upgrade-check to the first master and runs it there.
  - name: Run pre-upgrade checks on first master
    hosts: masters[0]
    tasks:
      # No custom error handling: when the script fails, ansible prints its
      # stdout/stderr, and that output carries the details the user needs.
      - script: files/pre-upgrade-check
  # Builds the in-memory `etcd_hosts` group used by the backup play.
  # With embedded etcd the group holds only the first master; otherwise it
  # holds every host of the inventory's `etcd` group. The decision is read
  # from the first master's `openshift.master.embedded_etcd` fact.
  - name: Evaluate etcd_hosts
    hosts: localhost
    tasks:
      - name: Evaluate etcd hosts
        add_host:
          name: "{{ groups.masters.0 }}"
          groups: etcd_hosts
        when: hostvars[groups.masters.0].openshift.master.embedded_etcd | bool

      - name: Evaluate etcd hosts
        add_host:
          name: "{{ item }}"
          groups: etcd_hosts
        # Template the list explicitly: a bare variable name in with_items is
        # deprecated and is not expanded by newer Ansible releases.
        with_items: "{{ groups.etcd }}"
        when: not hostvars[groups.masters.0].openshift.master.embedded_etcd | bool
  # Takes an etcd backup on every host in `etcd_hosts` before anything is
  # upgraded. Steps: make sure /var/lib/origin exists (as a symlink to
  # /var/lib/openshift when only the latter is present), compare free space
  # in the data dir against current etcd usage (embedded etcd only), install
  # the etcd package for `etcdctl`, then run `etcdctl backup`.
  - name: Backup etcd
    hosts: etcd_hosts
    vars:
      embedded_etcd: "{{ openshift.master.embedded_etcd }}"
      # Lookup-backed variable: referenced exactly once below, in the
      # set_fact that pins the backup path, so a re-run of the lookup cannot
      # produce a second, different timestamp.
      timestamp: "{{ lookup('pipe', 'date +%Y%m%d%H%M%S') }}"
    roles:
      - openshift_facts
    tasks:
      - stat:
          path: /var/lib/openshift
        register: var_lib_openshift

      - stat:
          path: /var/lib/origin
        register: var_lib_origin

      - name: Create origin symlink if necessary
        file:
          src: /var/lib/openshift/
          dest: /var/lib/origin
          state: link
        when: var_lib_openshift.stat.exists == True and var_lib_origin.stat.exists == False

      - name: Check available disk space for etcd backup
        # We assume to be using the data dir for all backups.
        shell: >
          df --output=avail -k {{ openshift.common.data_dir }} | tail -n 1
        register: avail_disk

      - name: Check current embedded etcd disk usage
        shell: >
          du -k {{ openshift.master.etcd_data_dir }} | tail -n 1 | cut -f1
        register: etcd_disk_usage
        when: embedded_etcd | bool

      - name: Abort if insufficient disk space for etcd backup
        fail:
          msg: >
            {{ etcd_disk_usage.stdout }} Kb disk space required for etcd backup,
            {{ avail_disk.stdout }} Kb available.
        when: (embedded_etcd | bool) and (etcd_disk_usage.stdout|int > avail_disk.stdout|int)

      - name: Install etcd (for etcdctl)
        yum:
          pkg: etcd
          state: latest

      # Resolve the backup directory once and store it as a fact so the
      # backup command and the message below always name the same path.
      - name: Determine etcd backup directory
        set_fact:
          g_etcd_backup_dir: "{{ openshift.common.data_dir }}/etcd-backup-{{ timestamp }}"

      - name: Generate etcd backup
        command: >
          etcdctl backup --data-dir={{ openshift.master.etcd_data_dir }}
          --backup-dir={{ g_etcd_backup_dir }}

      - name: Display location of etcd backup
        debug:
          msg: "Etcd backup created in {{ g_etcd_backup_dir }}"
  # Writes the requested `deployment_type` into the `common` local facts of
  # every host in OSEv3, after the openshift_facts role has run.
  - name: Update deployment type
    hosts: OSEv3
    roles:
      - role: openshift_facts
    post_tasks:
      - openshift_facts:
          role: common
          local_facts:
            deployment_type: "{{ deployment_type }}"
  # Works out the installed and available package versions on the first
  # master and aborts when the starting version is too old or the target
  # packages cannot be found. Sets two facts that later plays read:
  #   g_aos_versions - parsed output of files/versions.sh
  #                    (curr_version / avail_version)
  #   g_new_version  - avail_version, or curr_version when nothing newer is
  #                    available, cut at the first '-'
  - name: Perform upgrade version checking
    hosts: masters[0]
    tasks:
      - name: Clean yum cache
        command: yum clean all

      - name: Determine available versions
        script: files/versions.sh {{ openshift.common.service_type }} openshift
        register: g_versions_result

      # The script's stdout is parsed as YAML.
      - set_fact:
          g_aos_versions: "{{ g_versions_result.stdout | from_yaml }}"

      - set_fact:
          g_new_version: "{{ g_aos_versions.curr_version.split('-', 1).0 if g_aos_versions.avail_version is none else g_aos_versions.avail_version.split('-', 1).0 }}"

      - fail:
          msg: This playbook requires Origin 1.0.6 or later
        when:
          - deployment_type == 'origin'
          - g_aos_versions.curr_version | version_compare('1.0.6','<')

      # The enterprise guards below also accept 'atomic-enterprise', which is
      # the value the policy-reconcile play in this playbook tests for;
      # 'atomic-openshift' is kept so existing inventories behave as before.
      - fail:
          msg: This playbook requires Atomic OpenShift 3.0.2 or later
        when:
          - deployment_type in ['openshift-enterprise', 'atomic-enterprise', 'atomic-openshift']
          - g_aos_versions.curr_version | version_compare('3.0.2','<')

      # Fails only when the installed version is still pre-3.1 and no 3.1
      # package is available either.
      - fail:
          msg: Atomic OpenShift 3.1 packages not found
        when:
          - deployment_type in ['openshift-enterprise', 'atomic-enterprise', 'atomic-openshift']
          - g_aos_versions.curr_version | version_compare('3.0.2.900','<')
          - (g_aos_versions.avail_version is none or g_aos_versions.avail_version | version_compare('3.0.2.900','<'))
  # Upgrades the kernel and the master package on every master, rewrites
  # the master configuration from 3.0 to 3.1, and sets the facts that the
  # certificate plays later in this playbook read.
  - name: Upgrade masters
    hosts: masters
    vars:
      # Optional version suffix appended to the package name; empty when
      # openshift_pkg_version is not set.
      openshift_version: "{{ openshift_pkg_version | default('') }}"
    tasks:
      - name: Upgrade to latest available kernel
        yum:
          pkg: kernel
          state: latest

      - name: Upgrade master packages
        command: yum update -y {{ openshift.common.service_type }}-master{{ openshift_version }}

      - name: Ensure python-yaml present for config upgrade
        yum:
          pkg: python-yaml
          state: installed

      # Prints the config base that the next task will operate on.
      - debug:
          var: hostvars[inventory_hostname].openshift.common.config_base

      - name: Upgrade master configuration
        openshift_upgrade_config:
          from_version: '3.0'
          to_version: '3.1'
          role: master
          config_base: "{{ hostvars[inventory_hostname].openshift.common.config_base }}"

      # Per-host facts used when generating and unpacking master certs.
      - set_fact:
          master_certs_missing: true
          master_cert_subdir: "master-{{ openshift.common.hostname }}"
          master_cert_config_dir: "{{ openshift.common.config_base }}/master"
  # Creates a scratch directory on the control host. Its path is registered
  # as g_master_mktemp and read by later plays through hostvars.localhost.
  - name: Create temp directory for syncing certs
    hosts: localhost
    gather_facts: false
    tasks:
      - name: Create local temp directory for syncing certs
        local_action: command mktemp -d /tmp/openshift-ansible-XXXXXXX
        register: g_master_mktemp
        # Never reported as a change.
        changed_when: false
  # Runs the openshift_master_certificates role on the first master, then
  # packs each generated per-master cert directory into a tarball and
  # fetches it into the control host's temp directory (sync_tmpdir).
  - name: Generate missing master certificates
    hosts: masters[0]
    vars:
      master_hostnames: "{{ hostvars
                            | oo_select_keys(groups.masters)
                            | oo_collect('openshift.common.all_hostnames')
                            | oo_flatten | unique }}"
      master_generated_certs_dir: "{{ openshift.common.config_base }}/generated-configs"
      # NOTE(review): the items are used below as hostvars entries (each is
      # read for .master_cert_subdir); confirm that difference() against a
      # list of host names excludes the first master as intended.
      masters_needing_certs: "{{ hostvars
                                 | oo_select_keys(groups.masters)
                                 | difference([groups.masters.0]) }}"
      # Temp directory created earlier on localhost.
      sync_tmpdir: "{{ hostvars.localhost.g_master_mktemp.stdout }}"
      openshift_deployment_type: "{{ deployment_type }}"
    roles:
      - openshift_master_certificates
    post_tasks:
      # Loop variables are templated explicitly throughout: bare variable
      # names in with_* loops are deprecated and are not expanded by newer
      # Ansible releases.
      - name: Remove generated etcd client certs when using external etcd
        file:
          path: "{{ master_generated_certs_dir }}/{{ item.0.master_cert_subdir }}/{{ item.1 }}"
          state: absent
        when: groups.oo_etcd_to_config is defined and groups.oo_etcd_to_config
        with_nested:
          - "{{ masters_needing_certs }}"
          - - master.etcd-client.crt
            - master.etcd-client.key

      - name: Create a tarball of the master certs
        command: >
          tar -czvf {{ master_generated_certs_dir }}/{{ item.master_cert_subdir }}.tgz
          -C {{ master_generated_certs_dir }}/{{ item.master_cert_subdir }} .
        with_items: "{{ masters_needing_certs }}"

      - name: Retrieve the master cert tarball from the master
        fetch:
          src: "{{ master_generated_certs_dir }}/{{ item.master_cert_subdir }}.tgz"
          dest: "{{ sync_tmpdir }}/"
          flat: yes
          fail_on_missing: yes
          validate_checksum: yes
        with_items: "{{ masters_needing_certs }}"
  # Unpacks each master's cert tarball from the control host's temp
  # directory onto that master (every master except the first), then
  # restarts the master service when this is not a multi-master install.
  - name: Sync certs and restart masters post configuration change
    hosts: masters
    vars:
      # Temp directory created earlier on localhost.
      sync_tmpdir: "{{ hostvars.localhost.g_master_mktemp.stdout }}"
      # True when the inventory's masters group has more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      - name: Unarchive the tarball on the master
        unarchive:
          src: "{{ sync_tmpdir }}/{{ master_cert_subdir }}.tgz"
          dest: "{{ master_cert_config_dir }}"
        when: inventory_hostname != groups.masters.0

      - name: Restart master services
        service:
          name: "{{ openshift.common.service_type }}-master"
          state: restarted
        when: not openshift_master_ha | bool
  # Multi-master only: when /etc/corosync/corosync.conf exists on the first
  # master, tears the cluster down with `pcs cluster destroy --all`.
  - name: Destroy cluster
    hosts: masters[0]
    vars:
      # True when the inventory's masters group has more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
      openshift_deployment_type: "{{ deployment_type }}"
    pre_tasks:
      - name: Check for configured cluster
        stat:
          path: /etc/corosync/corosync.conf
        register: corosync_conf
        when: openshift_master_ha | bool

      # The HA test comes first so corosync_conf.stat is only read when
      # the stat task above actually ran.
      - name: Destroy cluster
        command: pcs cluster destroy --all
        when: openshift_master_ha | bool and corosync_conf.stat.exists == true
  # Multi-master only: makes sure the pcsd service is started on every
  # master.
  - name: Start pcsd on masters
    hosts: masters
    vars:
      # True when the inventory's masters group has more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      - name: Start pcsd
        service:
          name: pcsd
          state: started
        when: openshift_master_ha | bool
  # Multi-master only: applies the openshift_master_cluster role on the
  # first master, passing it every master as a space-separated host list.
  - name: Re-create cluster
    hosts: masters[0]
    vars:
      # True when the inventory's masters group has more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
      openshift_deployment_type: "{{ deployment_type }}"
      omc_cluster_hosts: "{{ groups.masters | join(' ') }}"
    roles:
      - role: openshift_master_cluster
        when: openshift_master_ha | bool
  # Removes the control-host scratch directory whose path was registered
  # as g_master_mktemp.
  - name: Delete temporary directory on localhost
    hosts: localhost
    gather_facts: false
    tasks:
      - file:
          name: "{{ g_master_mktemp.stdout }}"
          state: absent
        # Never reported as a change.
        changed_when: false
  # Updates the node package on every node and restarts the node service.
  - name: Upgrade nodes
    hosts: nodes
    vars:
      # Optional version suffix appended to the package name; empty when
      # openshift_pkg_version is not set.
      openshift_version: "{{ openshift_pkg_version | default('') }}"
    roles:
      - role: openshift_facts
    tasks:
      - name: Upgrade node packages
        command: yum update -y {{ openshift.common.service_type }}-node{{ openshift_version }}

      - name: Restart node services
        service:
          name: "{{ openshift.common.service_type }}-node"
          state: restarted
  # Reconciles cluster roles on the first master with the admin binary.
  # Role bindings are reconciled too, but only when the target version
  # (g_new_version) is newer than 1.0.6 for origin or newer than 3.0.2 for
  # the enterprise deployment types.
  - name: Update cluster policy and policy bindings
    hosts: masters[0]
    vars:
      origin_reconcile_bindings: "{{ deployment_type == 'origin' and g_new_version | version_compare('1.0.6', '>') }}"
      ent_reconcile_bindings: "{{ deployment_type in ['openshift-enterprise', 'atomic-enterprise'] and g_new_version | version_compare('3.0.2','>') }}"
    tasks:
      - name: oadm policy reconcile-cluster-roles --confirm
        command: >
          {{ openshift.common.admin_binary}} --config={{ openshift.common.config_base }}/master/admin.kubeconfig
          policy reconcile-cluster-roles --confirm

      # Additive only, and the system:authenticated, system:unauthenticated
      # and system:anonymous subjects are excluded.
      - name: oadm policy reconcile-cluster-role-bindings --confirm
        command: >
          {{ openshift.common.admin_binary}} --config={{ openshift.common.config_base }}/master/admin.kubeconfig
          policy reconcile-cluster-role-bindings
          --exclude-groups=system:authenticated
          --exclude-groups=system:unauthenticated
          --exclude-users=system:anonymous
          --additive-only=true --confirm
        when: (origin_reconcile_bindings | bool) or (ent_reconcile_bindings | bool)
  # Single-master only: restarts the master service on each master.
  - name: Restart masters post reconcile
    hosts: masters
    vars:
      # True when the inventory's masters group has more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      - name: Restart master services
        service:
          name: "{{ openshift.common.service_type }}-master"
          state: restarted
        when: not openshift_master_ha | bool
  # Multi-master only: restarts the `master` pcs resource from the first
  # master.
  - name: Restart cluster post reconcile
    hosts: masters[0]
    vars:
      # True when the inventory's masters group has more than one host.
      openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
    tasks:
      - name: Restart master cluster
        command: pcs resource restart master
        when: openshift_master_ha | bool
  # Brings the default router and docker-registry deployment configs up to
  # the new version from the first master. Each resource is only patched
  # when `oc get -n default dc/<name>` succeeds. For the router this also
  # enables allowHostPorts/allowHostNetwork on scc/privileged when either
  # is reported as false, and switches the pod to hostNetwork=true.
  - name: Upgrade default router and registry
    hosts: masters[0]
    # Written as a mapping; the list-of-maps form for `vars` is deprecated.
    vars:
      registry_image: "{{ openshift.master.registry_url | replace( '${component}', 'docker-registry' ) | replace ( '${version}', 'v' + g_new_version ) }}"
      router_image: "{{ openshift.master.registry_url | replace( '${component}', 'haproxy-router' ) | replace ( '${version}', 'v' + g_new_version ) }}"
      oc_cmd: "{{ openshift.common.client_binary }} --config={{ openshift.common.config_base }}/master/admin.kubeconfig"
    tasks:
      # A missing router is not an error; rc is inspected by later tasks.
      - name: Check for default router
        command: >
          {{ oc_cmd }} get -n default dc/router
        register: _default_router
        failed_when: false
        changed_when: false

      - name: Check for allowHostNetwork and allowHostPorts
        shell: >
          {{ oc_cmd }} get -o yaml scc/privileged | /usr/bin/grep -e allowHostPorts -e allowHostNetwork
        register: _scc
        when: _default_router.rc == 0

      - name: Grant allowHostNetwork and allowHostPorts
        command: >
          {{ oc_cmd }} patch scc/privileged -p '{"allowHostPorts":true,"allowHostNetwork":true}' --loglevel=9
        when:
          - _default_router.rc == 0
          - "'false' in _scc.stdout"

      # The dc patches below pass `-n default` so they act on the same
      # project the existence checks looked in, whatever project the
      # kubeconfig currently has selected.
      #
      # serviceAccount/serviceAccountName are set on the pod template
      # (spec.template.spec), the same location the hostNetwork and image
      # patches below use.
      - name: Update deployment config to 1.0.4/3.0.1 spec
        command: >
          {{ oc_cmd }} patch -n default dc/router -p
          '{"spec":{"strategy":{"rollingParams":{"updatePercent":-10}},"template":{"spec":{"serviceAccount":"router","serviceAccountName":"router"}}}}'
        when: _default_router.rc == 0

      - name: Switch to hostNetwork=true
        command: >
          {{ oc_cmd }} patch -n default dc/router -p '{"spec":{"template":{"spec":{"hostNetwork":true}}}}'
        when: _default_router.rc == 0

      - name: Update router image to current version
        command: >
          {{ oc_cmd }} patch -n default dc/router -p
          '{"spec":{"template":{"spec":{"containers":[{"name":"router","image":"{{ router_image }}"}]}}}}'
        when: _default_router.rc == 0

      # A missing registry is not an error; rc is inspected by the next task.
      - name: Check for default registry
        command: >
          {{ oc_cmd }} get -n default dc/docker-registry
        register: _default_registry
        failed_when: false
        changed_when: false

      - name: Update registry image to current version
        command: >
          {{ oc_cmd }} patch -n default dc/docker-registry -p
          '{"spec":{"template":{"spec":{"containers":[{"name":"registry","image":"{{ registry_image }}"}]}}}}'
        when: _default_registry.rc == 0
  # Applies the openshift_examples role on the first master with its import
  # command set to "update".
  - name: Update image streams and templates
    hosts: masters[0]
    vars:
      openshift_examples_import_command: "update"
      openshift_deployment_type: "{{ deployment_type }}"
    roles:
      - role: openshift_examples