# upgrade.yml
---
  2. - name: Load master facts
  3. hosts: masters
  4. roles:
  5. - openshift_facts
  6. - name: Verify upgrade can proceed
  7. hosts: masters[0]
  8. vars:
  9. openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
  10. gather_facts: no
  11. tasks:
  12. # Checking the global deployment type rather than host facts, this is about
  13. # what the user is requesting.
  14. - fail: msg="Deployment type enterprise not supported for upgrade"
  15. when: deployment_type == "enterprise"
  16. # Pacemaker is currently the only supported upgrade path for multiple masters
  17. - fail: msg="openshift_master_cluster_method must be set to 'pacemaker'"
  18. when: openshift_master_ha | bool and ((openshift_master_cluster_method is not defined) or (openshift_master_cluster_method is defined and openshift_master_cluster_method != "pacemaker"))
  19. - name: Run pre-upgrade checks on first master
  20. hosts: masters[0]
  21. tasks:
  22. # If this script errors out ansible will show the default stdout/stderr
  23. # which contains details for the user:
  24. - script: files/pre-upgrade-check
  25. - name: Evaluate etcd_hosts
  26. hosts: localhost
  27. tasks:
  28. - name: Evaluate etcd hosts
  29. add_host:
  30. name: "{{ groups.masters.0 }}"
  31. groups: etcd_hosts
  32. when: hostvars[groups.masters.0].openshift.master.embedded_etcd | bool
  33. - name: Evaluate etcd hosts
  34. add_host:
  35. name: "{{ item }}"
  36. groups: etcd_hosts
  37. with_items: groups.etcd
  38. when: not hostvars[groups.masters.0].openshift.master.embedded_etcd | bool
  39. - name: Backup etcd
  40. hosts: etcd_hosts
  41. vars:
  42. embedded_etcd: "{{ openshift.master.embedded_etcd }}"
  43. timestamp: "{{ lookup('pipe', 'date +%Y%m%d%H%M%S') }}"
  44. roles:
  45. - openshift_facts
  46. tasks:
  47. - stat: path=/var/lib/openshift
  48. register: var_lib_openshift
  49. - stat: path=/var/lib/origin
  50. register: var_lib_origin
  51. - name: Create origin symlink if necessary
  52. file: src=/var/lib/openshift/ dest=/var/lib/origin state=link
  53. when: var_lib_openshift.stat.exists == True and var_lib_origin.stat.exists == False
  54. - name: Check available disk space for etcd backup
  55. # We assume to be using the data dir for all backups.
  56. shell: >
  57. df --output=avail -k {{ openshift.common.data_dir }} | tail -n 1
  58. register: avail_disk
  59. - name: Check current embedded etcd disk usage
  60. shell: >
  61. du -k {{ openshift.master.etcd_data_dir }} | tail -n 1 | cut -f1
  62. register: etcd_disk_usage
  63. when: embedded_etcd | bool
  64. - name: Abort if insufficient disk space for etcd backup
  65. fail:
  66. msg: >
  67. {{ etcd_disk_usage.stdout }} Kb disk space required for etcd backup,
  68. {{ avail_disk.stdout }} Kb available.
  69. when: (embedded_etcd | bool) and (etcd_disk_usage.stdout|int > avail_disk.stdout|int)
  70. - name: Install etcd (for etcdctl)
  71. yum:
  72. pkg: etcd
  73. state: latest
  74. - name: Generate etcd backup
  75. command: >
  76. etcdctl backup --data-dir={{ openshift.master.etcd_data_dir }}
  77. --backup-dir={{ openshift.common.data_dir }}/etcd-backup-{{ timestamp }}
  78. - name: Display location of etcd backup
  79. debug:
  80. msg: "Etcd backup created in {{ openshift.common.data_dir }}/etcd-backup-{{ timestamp }}"
  81. - name: Update deployment type
  82. hosts: OSEv3
  83. roles:
  84. - openshift_facts
  85. post_tasks:
  86. - openshift_facts:
  87. role: common
  88. local_facts:
  89. deployment_type: "{{ deployment_type }}"
  90. - name: Perform upgrade version checking
  91. hosts: masters[0]
  92. tasks:
  93. - name: Clean yum cache
  94. command: yum clean all
  95. - name: Determine available versions
  96. script: files/versions.sh {{ openshift.common.service_type }} openshift
  97. register: g_versions_result
  98. - set_fact:
  99. g_aos_versions: "{{ g_versions_result.stdout | from_yaml }}"
  100. - set_fact:
  101. g_new_version: "{{ g_aos_versions.curr_version.split('-', 1).0 if g_aos_versions.avail_version is none else g_aos_versions.avail_version.split('-', 1).0 }}"
  102. - fail: This playbook requires Origin 1.0.6 or later
  103. when: deployment_type == 'origin' and g_aos_versions.curr_version | version_compare('1.0.6','<')
  104. - fail: This playbook requires Atomic OpenShift 3.0.2 or later
  105. when: deployment_type in ['openshift-enterprise', 'atomic-openshift'] and g_aos_versions.curr_version | version_compare('3.0.2','<')
  106. - name: Upgrade masters
  107. hosts: masters
  108. vars:
  109. openshift_version: "{{ openshift_pkg_version | default('') }}"
  110. tasks:
  111. - name: Upgrade to latest available kernel
  112. yum:
  113. pkg: kernel
  114. state: latest
  115. - name: Upgrade master packages
  116. command: yum update -y {{ openshift.common.service_type }}-master{{ openshift_version }}
  117. - name: Ensure python-yaml present for config upgrade
  118. yum:
  119. pkg: python-yaml
  120. state: installed
  121. - debug: var=hostvars[inventory_hostname].openshift.common.config_base
  122. - name: Upgrade master configuration
  123. openshift_upgrade_config:
  124. from_version: '3.0'
  125. to_version: '3.1'
  126. role: master
  127. config_base: "{{ hostvars[inventory_hostname].openshift.common.config_base }}"
  128. - set_fact:
  129. master_certs_missing: True
  130. master_cert_subdir: master-{{ openshift.common.hostname }}
  131. master_cert_config_dir: "{{ openshift.common.config_base }}/master"
  132. - name: Create temp directory for syncing certs
  133. hosts: localhost
  134. gather_facts: no
  135. tasks:
  136. - name: Create local temp directory for syncing certs
  137. local_action: command mktemp -d /tmp/openshift-ansible-XXXXXXX
  138. register: g_master_mktemp
  139. changed_when: False
  140. - name: Generate missing master certificates
  141. hosts: masters[0]
  142. vars:
  143. master_hostnames: "{{ hostvars
  144. | oo_select_keys(groups.masters)
  145. | oo_collect('openshift.common.all_hostnames')
  146. | oo_flatten | unique }}"
  147. master_generated_certs_dir: "{{ openshift.common.config_base }}/generated-configs"
  148. masters_needing_certs: "{{ hostvars
  149. | oo_select_keys(groups.masters)
  150. | difference([groups.masters.0]) }}"
  151. sync_tmpdir: "{{ hostvars.localhost.g_master_mktemp.stdout }}"
  152. openshift_deployment_type: "{{ deployment_type }}"
  153. roles:
  154. - openshift_master_certificates
  155. post_tasks:
  156. - name: Remove generated etcd client certs when using external etcd
  157. file:
  158. path: "{{ master_generated_certs_dir }}/{{ item.0.master_cert_subdir }}/{{ item.1 }}"
  159. state: absent
  160. when: groups.oo_etcd_to_config is defined and groups.oo_etcd_to_config
  161. with_nested:
  162. - masters_needing_certs
  163. - - master.etcd-client.crt
  164. - master.etcd-client.key
  165. - name: Create a tarball of the master certs
  166. command: >
  167. tar -czvf {{ master_generated_certs_dir }}/{{ item.master_cert_subdir }}.tgz
  168. -C {{ master_generated_certs_dir }}/{{ item.master_cert_subdir }} .
  169. with_items: masters_needing_certs
  170. - name: Retrieve the master cert tarball from the master
  171. fetch:
  172. src: "{{ master_generated_certs_dir }}/{{ item.master_cert_subdir }}.tgz"
  173. dest: "{{ sync_tmpdir }}/"
  174. flat: yes
  175. fail_on_missing: yes
  176. validate_checksum: yes
  177. with_items: masters_needing_certs
  178. - name: Sync certs and restart masters post configuration change
  179. hosts: masters
  180. vars:
  181. sync_tmpdir: "{{ hostvars.localhost.g_master_mktemp.stdout }}"
  182. openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
  183. tasks:
  184. - name: Unarchive the tarball on the master
  185. unarchive:
  186. src: "{{ sync_tmpdir }}/{{ master_cert_subdir }}.tgz"
  187. dest: "{{ master_cert_config_dir }}"
  188. when: inventory_hostname != groups.masters.0
  189. - name: Restart master services
  190. service: name="{{ openshift.common.service_type}}-master" state=restarted
  191. when: not openshift_master_ha | bool
  192. - name: Destroy cluster
  193. hosts: masters[0]
  194. vars:
  195. openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
  196. openshift_deployment_type: "{{ deployment_type }}"
  197. pre_tasks:
  198. - name: Check for configured cluster
  199. stat:
  200. path: /etc/corosync/corosync.conf
  201. register: corosync_conf
  202. when: openshift_master_ha | bool
  203. - name: Destroy cluster
  204. command: pcs cluster destroy --all
  205. when: openshift_master_ha | bool and corosync_conf.stat.exists == true
  206. - name: Start pcsd on masters
  207. hosts: masters
  208. vars:
  209. openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
  210. tasks:
  211. - name: Start pcsd
  212. service: name=pcsd state=started
  213. when: openshift_master_ha | bool
  214. - name: Re-create cluster
  215. hosts: masters[0]
  216. vars:
  217. openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
  218. openshift_deployment_type: "{{ deployment_type }}"
  219. omc_cluster_hosts: "{{ groups.masters | join(' ') }}"
  220. roles:
  221. - role: openshift_master_cluster
  222. when: openshift_master_ha | bool
  223. - name: Delete temporary directory on localhost
  224. hosts: localhost
  225. gather_facts: no
  226. tasks:
  227. - file: name={{ g_master_mktemp.stdout }} state=absent
  228. changed_when: False
  229. - name: Upgrade nodes
  230. hosts: nodes
  231. vars:
  232. openshift_version: "{{ openshift_pkg_version | default('') }}"
  233. roles:
  234. - openshift_facts
  235. tasks:
  236. - name: Upgrade node packages
  237. command: yum update -y {{ openshift.common.service_type }}-node{{ openshift_version }}
  238. - name: Restart node services
  239. service: name="{{ openshift.common.service_type }}-node" state=restarted
  240. - name: Update cluster policy and policy bindings
  241. hosts: masters[0]
  242. vars:
  243. origin_reconcile_bindings: "{{ deployment_type == 'origin' and g_new_version | version_compare('1.0.6', '>') }}"
  244. ent_reconcile_bindings: "{{ deployment_type in ['openshift-enterprise', 'atomic-enterprise'] and g_new_version | version_compare('3.0.2','>') }}"
  245. tasks:
  246. - name: oadm policy reconcile-cluster-roles --confirm
  247. command: >
  248. {{ openshift.common.admin_binary}} --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  249. policy reconcile-cluster-roles --confirm
  250. - name: oadm policy reconcile-cluster-role-bindings --confirm
  251. command: >
  252. {{ openshift.common.admin_binary}} --config={{ openshift.common.config_base }}/master/admin.kubeconfig
  253. policy reconcile-cluster-role-bindings
  254. --exclude-groups=system:authenticated
  255. --exclude-groups=system:unauthenticated
  256. --exclude-users=system:anonymous
  257. --additive-only=true --confirm
  258. when: origin_reconcile_bindings | bool or ent_reconcile_bindings | bool
  259. - name: Restart masters post reconcile
  260. hosts: masters
  261. vars:
  262. openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
  263. tasks:
  264. - name: Restart master services
  265. service: name="{{ openshift.common.service_type}}-master" state=restarted
  266. when: not openshift_master_ha | bool
  267. - name: Restart cluster post reconcile
  268. hosts: masters[0]
  269. vars:
  270. openshift_master_ha: "{{ groups['masters'] | length > 1 }}"
  271. tasks:
  272. - name: Restart master cluster
  273. command: pcs resource restart master
  274. when: openshift_master_ha | bool
  275. - name: Upgrade default router and registry
  276. hosts: masters[0]
  277. vars:
  278. - registry_image: "{{ openshift.master.registry_url | replace( '${component}', 'docker-registry' ) | replace ( '${version}', 'v' + g_new_version ) }}"
  279. - router_image: "{{ openshift.master.registry_url | replace( '${component}', 'haproxy-router' ) | replace ( '${version}', 'v' + g_new_version ) }}"
  280. - oc_cmd: "{{ openshift.common.client_binary }} --config={{ openshift.common.config_base }}/master/admin.kubeconfig"
  281. tasks:
  282. - name: Check for default router
  283. command: >
  284. {{ oc_cmd }} get -n default dc/router
  285. register: _default_router
  286. failed_when: false
  287. changed_when: false
  288. - name: Check for allowHostNetwork and allowHostPorts
  289. when: _default_router.rc == 0
  290. shell: >
  291. {{ oc_cmd }} get -o yaml scc/privileged | /usr/bin/grep -e allowHostPorts -e allowHostNetwork
  292. register: _scc
  293. - name: Grant allowHostNetwork and allowHostPorts
  294. when:
  295. - _default_router.rc == 0
  296. - "'false' in _scc.stdout"
  297. command: >
  298. {{ oc_cmd }} patch scc/privileged -p '{"allowHostPorts":true,"allowHostNetwork":true}' --loglevel=9
  299. - name: Update deployment config to 1.0.4/3.0.1 spec
  300. when: _default_router.rc == 0
  301. command: >
  302. {{ oc_cmd }} patch dc/router -p
  303. '{"spec":{"strategy":{"rollingParams":{"updatePercent":-10},"spec":{"serviceAccount":"router","serviceAccountName":"router"}}}}'
  304. - name: Switch to hostNetwork=true
  305. when: _default_router.rc == 0
  306. command: >
  307. {{ oc_cmd }} patch dc/router -p '{"spec":{"template":{"spec":{"hostNetwork":true}}}}'
  308. - name: Update router image to current version
  309. when: _default_router.rc == 0
  310. command: >
  311. {{ oc_cmd }} patch dc/router -p
  312. '{"spec":{"template":{"spec":{"containers":[{"name":"router","image":"{{ router_image }}"}]}}}}'
  313. - name: Check for default registry
  314. command: >
  315. {{ oc_cmd }} get -n default dc/docker-registry
  316. register: _default_registry
  317. failed_when: false
  318. changed_when: false
  319. - name: Update registry image to current version
  320. when: _default_registry.rc == 0
  321. command: >
  322. {{ oc_cmd }} patch dc/docker-registry -p
  323. '{"spec":{"template":{"spec":{"containers":[{"name":"registry","image":"{{ registry_image }}"}]}}}}'
  324. - name: Update image streams and templates
  325. hosts: masters[0]
  326. vars:
  327. openshift_examples_import_command: "update"
  328. openshift_deployment_type: "{{ deployment_type }}"
  329. roles:
  330. - openshift_examples