# main.yml
---
# TODO: add the ability to configure certificates from either a local file
# path or inline certificate contents, placing them in the default cert
# locations.
  # Authentication variable validation.
  # TODO: validate the different identity provider kinds as well
  #
  # Abort early when the configured OAuth grant method is not one of the
  # values listed in openshift_master_valid_grant_methods.
  - when:
      - openshift_master_oauth_grant_method not in openshift_master_valid_grant_methods
    fail:
      msg: >
        Invalid OAuth grant method: {{ openshift_master_oauth_grant_method }}
  # Ask the local docker image store for the control plane image. Empty
  # output (control_plane_image.stdout_lines == []) means the image is not
  # present yet; later tasks in this file key off that result.
  - name: Check that origin image is present
    command: 'docker images -q "{{ osm_image }}"'
    register: control_plane_image
    # This is a read-only query, so it must never be reported as a change.
    changed_when: false
  # This task runs async to save time while the master is being configured.
  # Its job handle is registered as image_prepull so that completion can be
  # checked later with async_status.
  - name: Pre-pull Origin image
    # Only pull when the image lookup returned nothing.
    when: control_plane_image.stdout_lines == []
    docker_image:
      name: "{{ osm_image }}"
    environment:
      NO_PROXY: "{{ openshift.common.no_proxy | default('') }}"
    register: image_prepull
    # 10 minutes to pull the image; poll: 0 starts the job without waiting.
    async: 600
    poll: 0
  # Statically include the firewall rules for this role.
  - import_tasks: firewall.yml
    name: Open up firewall ports

  # Statically include the tasks that prepare the static pod scripts.
  - import_tasks: static_shim.yml
    name: Prepare static pod scripts
  # Ensure the master data directory exists, owned by root with rwxr-xr-x.
  - name: Create r_openshift_master_data_dir
    file:
      path: "{{ r_openshift_master_data_dir }}"
      state: directory
      owner: root
      group: root
      # Quoted so the mode is always handled as an octal string, matching the
      # quoted modes used by the other directory tasks in this file.
      mode: '0755'
  # Statically include the registry authentication tasks.
  - import_tasks: registry_auth.yml

  # The master configuration files written below live in this directory.
  - name: Create config parent directory if it does not exist
    file:
      state: directory
      path: '/etc/origin/master'
  # Exactly one of the two tasks below runs, selected by openshift_is_atomic:
  # atomic hosts use a path under /etc/origin, all other hosts use
  # /usr/libexec.
  - name: Create flexvolume directory when on atomic hosts
    when: openshift_is_atomic | bool
    file:
      path: '/etc/origin/kubelet-plugins/volume/exec'
      state: directory
      mode: '0750'

  - name: Flex volume directory on non-atomic host
    when: not openshift_is_atomic | bool
    file:
      path: '/usr/libexec/kubernetes/kubelet-plugins/volume/exec/'
      state: directory
      mode: '0750'
  # Generate the bootstrap policy file with the client binary. The `creates`
  # argument makes the command a no-op once the file exists.
  - name: Create the policy file if it does not already exist
    args:
      creates: "{{ openshift_master_policy }}"
    command: >
      {{ openshift_client_binary }} adm create-bootstrap-policy-file
      --filename={{ openshift_master_policy }}
  # Render scheduler_config as pretty-printed JSON into the scheduler config
  # file, keeping a backup of any previous version.
  - name: Create the scheduler config
    copy:
      dest: "{{ openshift_master_scheduler_conf }}"
      content: "{{ scheduler_config | to_nice_json }}"
      backup: true

  # Statically include the htpasswd identity provider tasks.
  - import_tasks: htpass_provider.yml
  # Write the LDAP CA bundle once per LDAPPasswordIdentityProvider entry.
  # Destination: an item.ca that contains a '/' is used as given; otherwise
  # the file goes under /etc/origin/master/, named item.ca or, when item.ca is
  # not set, ldap_ca.crt.
  - name: Create the ldap ca file if needed
    copy:
      dest: "{{ item.ca if 'ca' in item and '/' in item.ca else '/etc/origin/master/' ~ item.ca | default('ldap_ca.crt') }}"
      content: "{{ openshift.master.ldap_ca }}"
      # Quoted octal string; readable by the owner only.
      mode: '0600'
      backup: true
    when:
      - openshift.master.ldap_ca is defined
      - item.kind == 'LDAPPasswordIdentityProvider'
    with_items: "{{ openshift_master_identity_providers }}"
  # Write the OpenID CA bundle once per OpenIDIdentityProvider entry that
  # names a non-empty `ca`.
  # Destination: an item.ca that contains a '/' is used as given; otherwise
  # the file is placed under /etc/origin/master/.
  - name: Create the openid ca file if needed
    copy:
      dest: "{{ item.ca if 'ca' in item and '/' in item.ca else '/etc/origin/master/' ~ item.ca | default('openid_ca.crt') }}"
      content: "{{ openshift.master.openid_ca }}"
      # Quoted octal string; readable by the owner only.
      mode: '0600'
      backup: true
    when:
      - openshift.master.openid_ca is defined
      - item.kind == 'OpenIDIdentityProvider'
      - item.ca | default('') != ''
    with_items: "{{ openshift_master_identity_providers }}"
  # Write the request header client CA once per RequestHeaderIdentityProvider
  # entry that names a non-empty `clientCA`. The task is skipped while
  # openshift_master_request_header_ca equals l_osm_request_header_none.
  # Destination: an item.clientCA that contains a '/' is used as given;
  # otherwise the file is placed under /etc/origin/master/.
  - name: Create the request header ca file if needed
    copy:
      dest: "{{ item.clientCA if 'clientCA' in item and '/' in item.clientCA else '/etc/origin/master/' ~ item.clientCA | default('request_header_ca.crt') }}"
      content: "{{ openshift_master_request_header_ca }}"
      # Quoted octal string; readable by the owner only.
      mode: '0600'
      backup: true
    when:
      - openshift_master_request_header_ca != l_osm_request_header_none
      - item.kind == 'RequestHeaderIdentityProvider'
      - item.clientCA | default('') != ''
    with_items: "{{ openshift_master_identity_providers }}"
  # Record openshift_no_proxy_etcd_host_ips as the local fact
  # no_proxy_etcd_host_ips under the `common` role.
  - name: Set fact of all etcd host IPs
    openshift_facts:
      local_facts:
        no_proxy_etcd_host_ips: "{{ openshift_no_proxy_etcd_host_ips }}"
      role: common
  # Render the session secrets template, owned by root.
  - name: Create session secrets file
    template:
      src: sessionSecretsFile.yaml.v1.j2
      dest: "{{ openshift_master_session_secrets_file }}"
      owner: root
      group: root
      # Quoted octal string; readable by the owner only.
      mode: '0600'
  # Convert the configured identity providers to their 'v1' form and store
  # the result as translated_identity_providers.
  # translate_idps is a custom filter in role lib_utils
  - set_fact:
      translated_identity_providers: "{{ openshift_master_identity_providers | translate_idps('v1') }}"
  # Render the master configuration from master.yaml.v1.j2, keeping a backup
  # of any previous file.
  # TODO: add the validate parameter when there is a validation command to run
  - name: Create master config
    template:
      src: master.yaml.v1.j2
      dest: "{{ openshift_master_config_file }}"
      backup: true
      owner: root
      group: root
      # Quoted octal string; readable by the owner only.
      mode: '0600'
  # Statically include the loopback context tasks.
  - import_tasks: set_loopback_context.yml

  # Render the master environment file, keeping a backup of any previous
  # version.
  - name: Create the master service env file
    template:
      dest: /etc/origin/master/master.env
      src: 'master.env.j2'
      backup: true

  # Statically include static.yml.
  - import_tasks: static.yml
  # Copy the admin kubeconfig, already present on the managed host
  # (remote_src), to both node kubeconfig locations.
  - name: Establish the default bootstrap kubeconfig for masters
    copy:
      remote_src: true
      src: "/etc/origin/master/admin.kubeconfig"
      dest: "{{ item }}"
      # Quoted octal string; readable by the owner only.
      mode: '0600'
    with_items:
      # bootstrap as an admin
      - /etc/origin/node/bootstrap.kubeconfig
      # copy to this location to bypass initial bootstrap request
      - /etc/origin/node/node.kubeconfig
  # Wait for the asynchronous image pull started earlier (image_prepull).
  # Polls up to 20 times, 30 seconds apart; failed_when: false means an
  # unsuccessful pre-pull never fails the play.
  - name: Check status of control plane image pre-pull
    # Only relevant when the image was missing and a pull was started.
    when: control_plane_image.stdout_lines == []
    async_status:
      jid: "{{ image_prepull.ansible_job_id }}"
    register: job_result
    until: job_result.finished
    delay: 30
    retries: 20
    failed_when: false
  # Wait for the etcd image pull job. etcd_image_exists and etcd_prepull are
  # not registered in the visible part of this file, so the conditions guard
  # against them being absent or lacking stdout_lines.
  # Polls up to 20 times, 30 seconds apart; failed_when: false means an
  # unsuccessful pre-pull never fails the play.
  - name: Check status of etcd image pre-pull
    when:
      - etcd_image_exists is defined
      - "'stdout_lines' in etcd_image_exists"
      - etcd_image_exists.stdout_lines == []
    async_status:
      jid: "{{ etcd_prepull.ansible_job_id }}"
    register: job_result
    until: job_result.finished
    delay: 30
    retries: 20
    failed_when: false
  # Restart and enable the node service. Errors are ignored here so that the
  # block below can dump the service journal before failing the play.
  - name: Start and enable self-hosting node
    systemd:
      name: "{{ openshift_service_type }}-node"
      state: restarted
      enabled: true
    register: node_start
    ignore_errors: true

  # Diagnostics path: runs only when the restart above failed.
  - when: node_start is failed
    block:
      - name: Get node logs
        command: journalctl --no-pager -n 300 -u {{ openshift_service_type }}-node
        register: logs_node
        # Log collection is best effort; the explicit fail below is what
        # stops the play.
        ignore_errors: true

      - debug:
          msg: "{{ logs_node.stdout_lines }}"

      - fail:
          msg: Node start failed.
  # Poll (60 tries, 5 seconds apart) until each static control plane pod
  # shows up in kube-system. Errors are ignored so the following block can
  # gather diagnostics before failing the play.
  - name: Wait for control plane pods to appear
    oc_obj:
      state: list
      kind: pod
      name: "master-{{ item }}-{{ openshift.node.nodename | lower }}"
      namespace: kube-system
    register: control_plane_pods
    until:
      - "'results' in control_plane_pods"
      - "'results' in control_plane_pods.results"
      - control_plane_pods.results.results | length > 0
    retries: 60
    delay: 5
    with_items:
      # `omit` is not removed from loop items, so hosts without etcd would
      # wait for a pod named after the omit placeholder. Emit an empty item
      # instead and skip it via `when`, as the readiness wait does.
      - "{{ 'etcd' if inventory_hostname in groups['oo_etcd_to_config'] else '' }}"
      - api
      - controllers
    when:
      - item != ''
    ignore_errors: true
  # Diagnostics path: runs only when waiting for the control plane pods
  # failed. Every collection step is best effort (ignore_errors) and its
  # output is printed; the final task fails the play.
  - when: control_plane_pods is failed
    block:
      - name: Check status in the kube-system namespace
        register: control_plane_status
        ignore_errors: true
        command: >
          {{ openshift_client_binary }} status --config={{ openshift.common.config_base }}/master/admin.kubeconfig -n kube-system

      - debug:
          msg: "{{ control_plane_status.stdout_lines }}"

      - name: Get pods in the kube-system namespace
        register: control_plane_pods_list
        ignore_errors: true
        command: >
          {{ openshift_client_binary }} get pods --config={{ openshift.common.config_base }}/master/admin.kubeconfig -n kube-system -o wide

      - debug:
          msg: "{{ control_plane_pods_list.stdout_lines }}"

      - name: Get events in the kube-system namespace
        register: control_plane_events
        ignore_errors: true
        command: >
          {{ openshift_client_binary }} get events --config={{ openshift.common.config_base }}/master/admin.kubeconfig -n kube-system

      - debug:
          msg: "{{ control_plane_events.stdout_lines }}"

      - name: Get node logs
        register: logs_node
        ignore_errors: true
        command: journalctl --no-pager -n 300 -u {{ openshift_service_type }}-node

      - debug:
          msg: "{{ logs_node.stdout_lines }}"

      - name: Report control plane errors
        fail:
          msg: Control plane pods didn't come up
  # Poll (60 tries, 5 seconds apart) until each control plane pod reports a
  # Ready condition whose status evaluates to true. The etcd item is blanked
  # out, and skipped, on hosts outside oo_etcd_to_config.
  - name: Wait for all control plane pods to become ready
    oc_obj:
      state: list
      kind: pod
      name: "master-{{ item }}-{{ openshift.node.nodename | lower }}"
      namespace: kube-system
    register: control_plane_health
    until:
      - "'results' in control_plane_health"
      - "'results' in control_plane_health.results"
      - control_plane_health.results.results | length > 0
      - "'status' in control_plane_health.results.results[0]"
      - "'conditions' in control_plane_health.results.results[0].status"
      - control_plane_health.results.results[0].status.conditions | selectattr('type', 'match', '^Ready$') | map(attribute='status') | join | bool == True
    retries: 60
    delay: 5
    with_items:
      - "{{ 'etcd' if inventory_hostname in groups['oo_etcd_to_config'] else '' }}"
      - api
      - controllers
    when:
      - item != ''
    # Without this the host drops out of the play as soon as the wait fails
    # and the diagnostics block below can never run.
    ignore_errors: true

  # Diagnostics path: runs only when the readiness wait failed. Every
  # collection step is best effort (ignore_errors) and its output is printed;
  # the final task fails the play.
  - when: control_plane_health is failed
    block:
      # The pod listing has to be collected here: the only other task that
      # registers control_plane_pods_list sits in a block that always ends in
      # `fail`, so the variable is never defined when this block runs.
      - name: Get pods in the kube-system namespace
        command: >
          {{ openshift_client_binary }} get pods --config={{ openshift.common.config_base }}/master/admin.kubeconfig -n kube-system -o wide
        register: control_plane_pods_list
        ignore_errors: true

      - debug:
          msg: "{{ control_plane_pods_list.stdout_lines }}"

      - name: Get events in the kube-system namespace
        command: >
          {{ openshift_client_binary }} get events --config={{ openshift.common.config_base }}/master/admin.kubeconfig -n kube-system
        register: control_plane_events
        ignore_errors: true

      - debug:
          msg: "{{ control_plane_events.stdout_lines }}"

      - name: Get node logs
        command: journalctl --no-pager -n 300 -u {{ openshift_service_type }}-node
        register: logs_node
        ignore_errors: true

      - debug:
          msg: "{{ logs_node.stdout_lines }}"

      - name: Get API logs
        command: >
          /usr/local/bin/master-logs api api
        register: control_plane_logs_api
        ignore_errors: true

      - debug:
          msg: "{{ control_plane_logs_api.stdout_lines }}"

      - name: Get controllers logs
        command: >
          /usr/local/bin/master-logs controllers controllers
        register: control_plane_logs_controllers
        ignore_errors: true

      - debug:
          msg: "{{ control_plane_logs_controllers.stdout_lines }}"

      # etcd logs only exist on hosts that are part of oo_etcd_to_config.
      - name: Get etcd logs
        command: >
          /usr/local/bin/master-logs etcd etcd
        register: control_plane_logs_etcd
        when: inventory_hostname in groups['oo_etcd_to_config']
        ignore_errors: true

      # Print the etcd logs gathered just above (not the controllers logs).
      - debug:
          msg: "{{ control_plane_logs_etcd.stdout_lines }}"
        when: inventory_hostname in groups['oo_etcd_to_config']

      - name: Report control plane errors
        fail:
          msg: Control plane pods didn't pass health check
  # Statically include the master API readiness check.
  - import_tasks: check_master_api_is_ready.yml

  # Delete the client's cache directory so the list of APIs is refreshed.
  - name: Remove oc cache to refresh a list of APIs
    file:
      state: absent
      path: "~/.kube/cache"