backup.yml 4.2 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100
  1. ---
  2. - name: Backup etcd
  3. hosts: etcd_hosts_to_backup
  4. vars:
  5. embedded_etcd: "{{ groups.oo_etcd_to_config | default([]) | length == 0 }}"
  6. timestamp: "{{ lookup('pipe', 'date +%Y%m%d%H%M%S') }}"
  7. etcdctl_command: "{{ 'etcdctl' if not openshift.common.is_containerized or embedded_etcd else 'docker exec etcd_container etcdctl' if not openshift.common.is_etcd_system_container else 'runc exec etcd etcdctl' }}"
  8. roles:
  9. - openshift_facts
  10. tasks:
  11. # Ensure we persist the etcd role for this host in openshift_facts
  12. - openshift_facts:
  13. role: etcd
  14. local_facts: {}
  15. when: "'etcd' not in openshift"
  16. - stat: path=/var/lib/openshift
  17. register: var_lib_openshift
  18. - stat: path=/var/lib/origin
  19. register: var_lib_origin
  20. - name: Create origin symlink if necessary
  21. file: src=/var/lib/openshift/ dest=/var/lib/origin state=link
  22. when: var_lib_openshift.stat.exists == True and var_lib_origin.stat.exists == False
  23. # TODO: replace shell module with command and update later checks
  24. # We assume to be using the data dir for all backups.
  25. - name: Check available disk space for etcd backup
  26. shell: df --output=avail -k {{ openshift.common.data_dir }} | tail -n 1
  27. register: avail_disk
  28. # AUDIT:changed_when: `false` because we are only inspecting
  29. # state, not manipulating anything
  30. changed_when: false
  31. # TODO: replace shell module with command and update later checks
  32. - name: Check current embedded etcd disk usage
  33. shell: du -k {{ openshift.etcd.etcd_data_dir }} | tail -n 1 | cut -f1
  34. register: etcd_disk_usage
  35. when: embedded_etcd | bool
  36. # AUDIT:changed_when: `false` because we are only inspecting
  37. # state, not manipulating anything
  38. changed_when: false
  39. - name: Abort if insufficient disk space for etcd backup
  40. fail:
  41. msg: >
  42. {{ etcd_disk_usage.stdout }} Kb disk space required for etcd backup,
  43. {{ avail_disk.stdout }} Kb available.
  44. when: (embedded_etcd | bool) and (etcd_disk_usage.stdout|int > avail_disk.stdout|int)
  45. # For non containerized and non embedded we should have the correct version of
  46. # etcd installed already. So don't do anything.
  47. #
  48. # For embedded or containerized we need to use the latest because OCP 3.3 uses
  49. # a version of etcd that can only be backed up with etcd-3.x and if it's
  50. # containerized then etcd version may be newer than that on the host so
  51. # upgrade it.
  52. #
  53. # On atomic we have neither yum nor dnf so ansible throws a hard to debug error
  54. # if you use package there, like this: "Could not find a module for unknown."
  55. # see https://bugzilla.redhat.com/show_bug.cgi?id=1408668
  56. #
  57. # TODO - We should refactor all containerized backups to use the containerized
  58. # version of etcd to perform the backup rather than relying on the host's
  59. # binaries. Until we do that we'll continue to have problems backing up etcd
  60. # when atomic host has an older version than the version that's running in the
  61. # container whether that's embedded or not
  62. - name: Install latest etcd for containerized or embedded
  63. package:
  64. name: etcd
  65. state: latest
  66. when: ( embedded_etcd | bool or openshift.common.is_containerized ) and not openshift.common.is_atomic
  67. - name: Generate etcd backup
  68. command: >
  69. {{ etcdctl_command }} backup --data-dir={{ openshift.etcd.etcd_data_dir }}
  70. --backup-dir={{ openshift.common.data_dir }}/etcd-backup-{{ backup_tag | default('') }}{{ timestamp }}
  71. - set_fact:
  72. etcd_backup_complete: True
  73. - name: Display location of etcd backup
  74. debug:
  75. msg: "Etcd backup created in {{ openshift.common.data_dir }}/etcd-backup-{{ backup_tag | default('') }}{{ timestamp }}"
  76. - name: Gate on etcd backup
  77. hosts: localhost
  78. connection: local
  79. become: no
  80. tasks:
  81. - set_fact:
  82. etcd_backup_completed: "{{ hostvars
  83. | oo_select_keys(groups.etcd_hosts_to_backup)
  84. | oo_collect('inventory_hostname', {'etcd_backup_complete': true}) }}"
  85. - set_fact:
  86. etcd_backup_failed: "{{ groups.etcd_hosts_to_backup | difference(etcd_backup_completed) }}"
  87. - fail:
  88. msg: "Upgrade cannot continue. The following hosts did not complete etcd backup: {{ etcd_backup_failed | join(',') }}"
  89. when: etcd_backup_failed | length > 0