restart_cluster.yml
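Task file that gathers the running Elasticsearch pods for a logging cluster, checks the cluster's health, and then either records an operator-facing message (when the cluster is yellow, red, or missing nodes) or performs a full or rolling restart of its DeploymentConfigs, depending on full_restart_cluster.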

---
## get all pods for the cluster
- command: >
    {{ openshift_client_binary }}
    --config={{ openshift.common.config_base }}/master/admin.kubeconfig
    get pod
    -l component={{ _cluster_component }},provider=openshift
    -n {{ openshift_logging_elasticsearch_namespace }}
    -o jsonpath={.items[?(@.status.phase==\"Running\")].metadata.name}
  register: _cluster_pods
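# Only pods whose status.phase is "Running" are selected by the jsonpath
# filter; the registered _cluster_pods result drives the node-count checks below.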
# make a temp dir for admin certs
- command: mktemp -d /tmp/openshift-logging-ansible-XXXXXX
  register: _logging_handler_tempdir
  changed_when: False
  check_mode: no
- name: Exporting secrets used to communicate with the ES cluster
  command: >
    {{ openshift_client_binary }}
    --config={{ openshift.common.config_base }}/master/admin.kubeconfig
    extract secret/logging-elasticsearch
    -n {{ openshift_logging_elasticsearch_namespace }}
    --keys=admin-cert --keys=admin-key
    --to={{ _logging_handler_tempdir.stdout }}
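# The extracted admin-cert/admin-key pair is what the curl health check
# below uses to authenticate against the Elasticsearch API.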
### Check cluster state before making changes -- if it's red, yellow or missing nodes then we don't want to continue
- name: "Checking current health for {{ _es_node }} cluster"
  command: >
    curl -s -k
    --cert {{ _logging_handler_tempdir.stdout }}/admin-cert
    --key {{ _logging_handler_tempdir.stdout }}/admin-key
    https://logging-{{ _cluster_component }}.{{ openshift_logging_elasticsearch_namespace }}.svc:9200/_cluster/health?pretty
  register: _pod_status
  when: _cluster_pods.stdout_lines | count > 0
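# The _cluster/health JSON registered in _pod_status is parsed below: its
# 'status' and 'number_of_nodes' fields decide whether a restart is attempted.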
- when:
  - _pod_status.stdout is defined
  - (_pod_status.stdout | from_json)['status'] in ['yellow', 'red'] or (_pod_status.stdout | from_json)['number_of_nodes'] != _cluster_pods.stdout_lines | count
  block:
  - name: Set Logging message to manually restart
    run_once: true
    set_stats:
      data:
        installer_phase_logging:
          message: "Cluster logging-{{ _cluster_component }} was not in an optimal state and will not be automatically restarted. Please see documentation regarding doing a {{ 'full' if full_restart_cluster | bool else 'rolling'}} cluster restart."

  - debug: msg="Cluster logging-{{ _cluster_component }} was not in an optimal state and will not be automatically restarted. Please see documentation regarding doing a {{ 'full' if full_restart_cluster | bool else 'rolling'}} cluster restart."
- when: _pod_status.stdout is undefined or ( (_pod_status.stdout | from_json)['status'] in ['green'] and (_pod_status.stdout | from_json)['number_of_nodes'] == _cluster_pods.stdout_lines | count )
  block:
  - command: >
      {{ openshift_client_binary }}
      --config={{ openshift.common.config_base }}/master/admin.kubeconfig
      get dc
      -l component={{ _cluster_component }},provider=openshift
      -n {{ openshift_logging_elasticsearch_namespace }}
      -o jsonpath={.items[*].metadata.name}
    register: _cluster_dcs
  ## restart all dcs for full restart
  - name: "Performing full cluster restart for {{ _cluster_component }} cluster"
    include_tasks: full_cluster_restart.yml
    vars:
      logging_restart_cluster_dcs: "{{ _cluster_dcs.stdout_lines }}"
    when:
    - full_restart_cluster | bool
  ## restart the node if its dc is in the list of nodes to restart
  - name: "Performing rolling cluster restart for {{ _cluster_component }} cluster"
    include_tasks: rolling_cluster_restart.yml
    vars:
      logging_restart_cluster_dcs: "{{ _restart_logging_nodes | intersect(_cluster_dcs.stdout) }}"
    when:
    - not full_restart_cluster | bool
# remove temp dir
- name: Cleaning up local temp dir
  file:
    path: "{{ _logging_handler_tempdir.stdout }}"
    state: absent
  changed_when: False
  become: false