openshift_cert_expiry.py 33 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839
  1. #!/usr/bin/python
  2. # -*- coding: utf-8 -*-
  3. # pylint: disable=line-too-long,invalid-name
  4. """For details on this module see DOCUMENTATION (below)"""
  5. import base64
  6. import datetime
  7. import io
  8. import os
  9. import subprocess
  10. import yaml
  11. # pylint import-error disabled because pylint cannot find the package
  12. # when installed in a virtualenv
  13. from ansible.module_utils.six.moves import configparser # pylint: disable=import-error
  14. from ansible.module_utils.basic import AnsibleModule
  15. try:
  16. # You can comment this import out and include a 'pass' in this
  17. # block if you're manually testing this module on a NON-ATOMIC
  18. # HOST (or any host that just doesn't have PyOpenSSL
  19. # available). That will force the `load_and_handle_cert` function
  20. # to use the Fake OpenSSL classes.
  21. import OpenSSL.crypto
  22. HAS_OPENSSL = True
  23. except ImportError:
  24. # Some platforms (such as RHEL Atomic) may not have the Python
  25. # OpenSSL library installed. In this case we will use a manual
  26. # work-around to parse each certificate.
  27. #
  28. # Check for 'OpenSSL.crypto' in `sys.modules` later.
  29. HAS_OPENSSL = False
  30. DOCUMENTATION = '''
  31. ---
  32. module: openshift_cert_expiry
  33. short_description: Check OpenShift Container Platform (OCP) and Kube certificate expirations on a cluster
  34. description:
  35. - The M(openshift_cert_expiry) module has two basic functions: to flag certificates which will expire in a set window of time from now, and to notify you about certificates which have already expired.
  36. - When the module finishes, a summary of the examination is returned. Each certificate in the summary has a C(health) key with a value of one of the following:
  37. - C(ok) - not expired, and outside of the expiration C(warning_days) window.
  38. - C(warning) - not expired, but will expire between now and the C(warning_days) window.
  39. - C(expired) - an expired certificate.
  40. - Certificate flagging follow this logic:
  41. - If the expiration date is before now then the certificate is classified as C(expired).
  42. - The certificates time to live (expiration date - now) is calculated, if that time window is less than C(warning_days) the certificate is classified as C(warning).
  43. - All other conditions are classified as C(ok).
  44. - The following keys are ALSO present in the certificate summary:
  45. - C(cert_cn) - The common name of the certificate (additional CNs present in SAN extensions are omitted)
  46. - C(days_remaining) - The number of days until the certificate expires.
  47. - C(expiry) - The date the certificate expires on.
  48. - C(path) - The full path to the certificate on the examined host.
  49. version_added: "1.0"
  50. options:
  51. config_base:
  52. description:
  53. - Base path to OCP system settings.
  54. required: false
  55. default: /etc/origin
  56. warning_days:
  57. description:
  58. - Flag certificates which will expire in C(warning_days) days from now.
  59. required: false
  60. default: 30
  61. show_all:
  62. description:
  63. - Enable this option to show analysis of ALL certificates examined by this module.
  64. - By default only certificates which have expired, or will expire within the C(warning_days) window will be reported.
  65. required: false
  66. default: false
  67. author: "Tim Bielawa (@tbielawa) <tbielawa@redhat.com>"
  68. '''
  69. EXAMPLES = '''
  70. # Default invocation, only notify about expired certificates or certificates which will expire within 30 days from now
  71. - openshift_cert_expiry:
  72. # Expand the warning window to show certificates expiring within a year from now
  73. - openshift_cert_expiry: warning_days=365
  74. # Show expired, soon to expire (now + 30 days), and all other certificates examined
  75. - openshift_cert_expiry: show_all=true
  76. '''
  77. class FakeOpenSSLCertificate(object):
  78. """This provides a rough mock of what you get from
  79. `OpenSSL.crypto.load_certificate()`. This is a work-around for
  80. platforms missing the Python OpenSSL library.
  81. """
  82. def __init__(self, cert_string):
  83. """`cert_string` is a certificate in the form you get from running a
  84. .crt through 'openssl x509 -in CERT.cert -text'"""
  85. self.cert_string = cert_string
  86. self.serial = None
  87. self.subject = None
  88. self.extensions = []
  89. self.not_after = None
  90. self._parse_cert()
  91. def _parse_cert(self):
  92. """Manually parse the certificate line by line"""
  93. self.extensions = []
  94. PARSING_ALT_NAMES = False
  95. PARSING_HEX_SERIAL = False
  96. for line in self.cert_string.split('\n'):
  97. l = line.strip()
  98. if PARSING_ALT_NAMES:
  99. # We're parsing a 'Subject Alternative Name' line
  100. self.extensions.append(
  101. FakeOpenSSLCertificateSANExtension(l))
  102. PARSING_ALT_NAMES = False
  103. continue
  104. if PARSING_HEX_SERIAL:
  105. # Hex serials arrive colon-delimited
  106. serial_raw = l.replace(':', '')
  107. # Convert to decimal
  108. self.serial = int('0x' + serial_raw, base=16)
  109. PARSING_HEX_SERIAL = False
  110. continue
  111. # parse out the bits that we can
  112. if l.startswith('Serial Number:'):
  113. # Decimal format:
  114. # Serial Number: 11 (0xb)
  115. # => 11
  116. # Hex Format (large serials):
  117. # Serial Number:
  118. # 0a:de:eb:24:04:75:ab:56:39:14:e9:5a:22:e2:85:bf
  119. # => 14449739080294792594019643629255165375
  120. if l.endswith(':'):
  121. PARSING_HEX_SERIAL = True
  122. continue
  123. self.serial = int(l.split()[-2])
  124. elif l.startswith('Not After :'):
  125. # Not After : Feb 7 18:19:35 2019 GMT
  126. # => strptime(str, '%b %d %H:%M:%S %Y %Z')
  127. # => strftime('%Y%m%d%H%M%SZ')
  128. # => 20190207181935Z
  129. not_after_raw = l.partition(' : ')[-1]
  130. # Last item: ('Not After', ' : ', 'Feb 7 18:19:35 2019 GMT')
  131. not_after_parsed = datetime.datetime.strptime(not_after_raw, '%b %d %H:%M:%S %Y %Z')
  132. self.not_after = not_after_parsed.strftime('%Y%m%d%H%M%SZ')
  133. elif l.startswith('X509v3 Subject Alternative Name:'):
  134. PARSING_ALT_NAMES = True
  135. continue
  136. elif l.startswith('Subject:'):
  137. # O = system:nodes, CN = system:node:m01.example.com
  138. self.subject = FakeOpenSSLCertificateSubjects(l.partition(': ')[-1])
  139. def get_serial_number(self):
  140. """Return the serial number of the cert"""
  141. return self.serial
  142. def get_subject(self):
  143. """Subjects must implement get_components() and return dicts or
  144. tuples. An 'openssl x509 -in CERT.cert -text' with 'Subject':
  145. Subject: Subject: O=system:nodes, CN=system:node:m01.example.com
  146. might return: [('O=system', 'nodes'), ('CN=system', 'node:m01.example.com')]
  147. """
  148. return self.subject
  149. def get_extension(self, i):
  150. """Extensions must implement get_short_name() and return the string
  151. 'subjectAltName'"""
  152. return self.extensions[i]
  153. def get_extension_count(self):
  154. """ get_extension_count """
  155. return len(self.extensions)
  156. def get_notAfter(self):
  157. """Returns a date stamp as a string in the form
  158. '20180922170439Z'. strptime the result with format param:
  159. '%Y%m%d%H%M%SZ'."""
  160. return self.not_after
  161. class FakeOpenSSLCertificateSANExtension(object): # pylint: disable=too-few-public-methods
  162. """Mocks what happens when `get_extension` is called on a certificate
  163. object"""
  164. def __init__(self, san_string):
  165. """With `san_string` as you get from:
  166. $ openssl x509 -in certificate.crt -text
  167. """
  168. self.san_string = san_string
  169. self.short_name = 'subjectAltName'
  170. def get_short_name(self):
  171. """Return the 'type' of this extension. It's always the same though
  172. because we only care about subjectAltName's"""
  173. return self.short_name
  174. def __str__(self):
  175. """Return this extension and the value as a simple string"""
  176. return self.san_string
  177. # pylint: disable=too-few-public-methods
  178. class FakeOpenSSLCertificateSubjects(object):
  179. """Mocks what happens when `get_subject` is called on a certificate
  180. object"""
  181. def __init__(self, subject_string):
  182. """With `subject_string` as you get from:
  183. $ openssl x509 -in certificate.crt -text
  184. """
  185. self.subjects = []
  186. for s in subject_string.split(', '):
  187. name, _, value = s.partition(' = ')
  188. self.subjects.append((name, value))
  189. def get_components(self):
  190. """Returns a list of tuples"""
  191. return self.subjects
  192. ######################################################################
  193. def filter_paths(path_list):
  194. """`path_list` - A list of file paths to check. Only files which exist
  195. will be returned
  196. """
  197. return [p for p in path_list if os.path.exists(os.path.realpath(p))]
  198. # pylint: disable=too-many-locals,too-many-branches
  199. #
  200. # TODO: Break this function down into smaller chunks
  201. def load_and_handle_cert(cert_string, now, base64decode=False, ans_module=None):
  202. """Load a certificate, split off the good parts, and return some
  203. useful data
  204. Params:
  205. - `cert_string` (string) - a certificate loaded into a string object
  206. - `now` (datetime) - a datetime object of the time to calculate the certificate 'time_remaining' against
  207. - `base64decode` (bool) - run base64.b64decode() on the input
  208. - `ans_module` (AnsibleModule) - The AnsibleModule object for this module (so we can raise errors)
  209. Returns:
  210. A tuple of the form:
  211. (cert_subject, cert_expiry_date, time_remaining, cert_serial_number)
  212. """
  213. if base64decode:
  214. _cert_string = base64.b64decode(cert_string).decode('utf-8')
  215. else:
  216. _cert_string = cert_string
  217. # Disable this. We 'redefine' the type because we are working
  218. # around a missing library on the target host.
  219. #
  220. # pylint: disable=redefined-variable-type
  221. if HAS_OPENSSL:
  222. # No work-around required
  223. cert_loaded = OpenSSL.crypto.load_certificate(
  224. OpenSSL.crypto.FILETYPE_PEM, _cert_string)
  225. else:
  226. # Missing library, work-around required. Run the 'openssl'
  227. # command on it to decode it
  228. cmd = 'openssl x509 -text'
  229. try:
  230. openssl_proc = subprocess.Popen(cmd.split(),
  231. stdout=subprocess.PIPE,
  232. stdin=subprocess.PIPE)
  233. except OSError:
  234. ans_module.fail_json(msg="Error: The 'OpenSSL' python library and CLI command were not found on the target host. Unable to parse any certificates. This host will not be included in generated reports.")
  235. else:
  236. openssl_decoded = openssl_proc.communicate(_cert_string.encode('utf-8'))[0].decode('utf-8')
  237. cert_loaded = FakeOpenSSLCertificate(openssl_decoded)
  238. ######################################################################
  239. # Read all possible names from the cert
  240. cert_subjects = []
  241. for name, value in cert_loaded.get_subject().get_components():
  242. if isinstance(name, bytes) or isinstance(value, bytes):
  243. name = name.decode('utf-8')
  244. value = value.decode('utf-8')
  245. cert_subjects.append('{}:{}'.format(name, value))
  246. # To read SANs from a cert we must read the subjectAltName
  247. # extension from the X509 Object. What makes this more difficult
  248. # is that pyOpenSSL does not give extensions as an iterable
  249. san = None
  250. for i in range(cert_loaded.get_extension_count()):
  251. ext = cert_loaded.get_extension(i)
  252. if ext.get_short_name() == 'subjectAltName':
  253. san = ext
  254. if san is not None:
  255. # The X509Extension object for subjectAltName prints as a
  256. # string with the alt names separated by a comma and a
  257. # space. Split the string by ', ' and then add our new names
  258. # to the list of existing names
  259. cert_subjects.extend(str(san).split(', '))
  260. cert_subject = ', '.join(cert_subjects)
  261. ######################################################################
  262. # Grab the expiration date
  263. not_after = cert_loaded.get_notAfter()
  264. # example get_notAfter() => 20180922170439Z
  265. if isinstance(not_after, bytes):
  266. not_after = not_after.decode('utf-8')
  267. cert_expiry_date = datetime.datetime.strptime(
  268. not_after,
  269. '%Y%m%d%H%M%SZ')
  270. time_remaining = cert_expiry_date - now
  271. return (cert_subject, cert_expiry_date, time_remaining, cert_loaded.get_serial_number())
  272. def classify_cert(cert_meta, now, time_remaining, expire_window, cert_list):
  273. """Given metadata about a certificate under examination, classify it
  274. into one of three categories, 'ok', 'warning', and 'expired'.
  275. Params:
  276. - `cert_meta` dict - A dict with certificate metadata. Required fields
  277. include: 'cert_cn', 'path', 'expiry', 'days_remaining', 'health'.
  278. - `now` (datetime) - a datetime object of the time to calculate the certificate 'time_remaining' against
  279. - `time_remaining` (datetime.timedelta) - a timedelta for how long until the cert expires
  280. - `expire_window` (datetime.timedelta) - a timedelta for how long the warning window is
  281. - `cert_list` list - A list to shove the classified cert into
  282. Return:
  283. - `cert_list` - The updated list of classified certificates
  284. """
  285. expiry_str = str(cert_meta['expiry'])
  286. # Categorization
  287. if cert_meta['expiry'] < now:
  288. # This already expired, must NOTIFY
  289. cert_meta['health'] = 'expired'
  290. elif time_remaining < expire_window:
  291. # WARN about this upcoming expirations
  292. cert_meta['health'] = 'warning'
  293. else:
  294. # Not expired or about to expire
  295. cert_meta['health'] = 'ok'
  296. cert_meta['expiry'] = expiry_str
  297. cert_meta['serial_hex'] = hex(int(cert_meta['serial']))
  298. cert_list.append(cert_meta)
  299. return cert_list
  300. def tabulate_summary(certificates, kubeconfigs, etcd_certs, router_certs, registry_certs):
  301. """Calculate the summary text for when the module finishes
  302. running. This includes counts of each classification and what have
  303. you.
  304. Params:
  305. - `certificates` (list of dicts) - Processed `expire_check_result`
  306. dicts with filled in `health` keys for system certificates.
  307. - `kubeconfigs` - as above for kubeconfigs
  308. - `etcd_certs` - as above for etcd certs
  309. Return:
  310. - `summary_results` (dict) - Counts of each cert type classification
  311. and total items examined.
  312. """
  313. items = certificates + kubeconfigs + etcd_certs + router_certs + registry_certs
  314. summary_results = {
  315. 'system_certificates': len(certificates),
  316. 'kubeconfig_certificates': len(kubeconfigs),
  317. 'etcd_certificates': len(etcd_certs),
  318. 'router_certs': len(router_certs),
  319. 'registry_certs': len(registry_certs),
  320. 'total': len(items),
  321. 'ok': 0,
  322. 'warning': 0,
  323. 'expired': 0
  324. }
  325. summary_results['expired'] = len([c for c in items if c['health'] == 'expired'])
  326. summary_results['warning'] = len([c for c in items if c['health'] == 'warning'])
  327. summary_results['ok'] = len([c for c in items if c['health'] == 'ok'])
  328. return summary_results
  329. ######################################################################
  330. # This is our module MAIN function after all, so there's bound to be a
  331. # lot of code bundled up into one block
  332. #
  333. # Reason: These checks are disabled because the issue was introduced
  334. # during a period where the pylint checks weren't enabled for this file
  335. # Status: temporarily disabled pending future refactoring
  336. # pylint: disable=too-many-locals,too-many-statements,too-many-branches
  337. def main():
  338. """This module examines certificates (in various forms) which compose
  339. an OpenShift Container Platform cluster
  340. """
  341. module = AnsibleModule(
  342. argument_spec=dict(
  343. config_base=dict(
  344. required=False,
  345. default="/etc/origin",
  346. type='str'),
  347. warning_days=dict(
  348. required=False,
  349. default=30,
  350. type='int'),
  351. show_all=dict(
  352. required=False,
  353. default=False,
  354. type='bool')
  355. ),
  356. supports_check_mode=True,
  357. )
  358. # Basic scaffolding for OpenShift specific certs
  359. openshift_base_config_path = os.path.realpath(module.params['config_base'])
  360. openshift_master_config_path = os.path.join(openshift_base_config_path,
  361. "master", "master-config.yaml")
  362. openshift_node_config_path = os.path.join(openshift_base_config_path,
  363. "node", "node-config.yaml")
  364. openshift_cert_check_paths = [
  365. openshift_master_config_path,
  366. openshift_node_config_path,
  367. ]
  368. # Paths for Kubeconfigs. Additional kubeconfigs are conditionally
  369. # checked later in the code
  370. master_kube_configs = ['admin', 'openshift-master',
  371. 'openshift-node', 'openshift-router',
  372. 'openshift-registry']
  373. kubeconfig_paths = []
  374. for m_kube_config in master_kube_configs:
  375. kubeconfig_paths.append(
  376. os.path.join(openshift_base_config_path, "master", m_kube_config + ".kubeconfig")
  377. )
  378. # Validate some paths we have the ability to do ahead of time
  379. openshift_cert_check_paths = filter_paths(openshift_cert_check_paths)
  380. kubeconfig_paths = filter_paths(kubeconfig_paths)
  381. # etcd, where do you hide your certs? Used when parsing etcd.conf
  382. etcd_cert_params = [
  383. "ETCD_CA_FILE",
  384. "ETCD_CERT_FILE",
  385. "ETCD_PEER_CA_FILE",
  386. "ETCD_PEER_CERT_FILE",
  387. ]
  388. # Expiry checking stuff
  389. now = datetime.datetime.now()
  390. # todo, catch exception for invalid input and return a fail_json
  391. warning_days = int(module.params['warning_days'])
  392. expire_window = datetime.timedelta(days=warning_days)
  393. # Module stuff
  394. #
  395. # The results of our cert checking to return from the task call
  396. check_results = {}
  397. check_results['meta'] = {}
  398. check_results['meta']['warning_days'] = warning_days
  399. check_results['meta']['checked_at_time'] = str(now)
  400. check_results['meta']['warn_before_date'] = str(now + expire_window)
  401. check_results['meta']['show_all'] = str(module.params['show_all'])
  402. # All the analyzed certs accumulate here
  403. ocp_certs = []
  404. ######################################################################
  405. # Sure, why not? Let's enable check mode.
  406. if module.check_mode:
  407. check_results['ocp_certs'] = []
  408. module.exit_json(
  409. check_results=check_results,
  410. msg="Checked 0 total certificates. Expired/Warning/OK: 0/0/0. Warning window: %s days" % module.params['warning_days'],
  411. rc=0,
  412. changed=False
  413. )
  414. ######################################################################
  415. # Check for OpenShift Container Platform specific certs
  416. ######################################################################
  417. for os_cert in filter_paths(openshift_cert_check_paths):
  418. # Open up that config file and locate the cert and CA
  419. with io.open(os_cert, 'r', encoding='utf-8') as fp:
  420. cert_meta = {}
  421. cfg = yaml.load(fp)
  422. # cert files are specified in parsed `fp` as relative to the path
  423. # of the original config file. 'master-config.yaml' with certFile
  424. # = 'foo.crt' implies that 'foo.crt' is in the same
  425. # directory. certFile = '../foo.crt' is in the parent directory.
  426. cfg_path = os.path.dirname(fp.name)
  427. cert_meta['certFile'] = os.path.join(cfg_path, cfg['servingInfo']['certFile'])
  428. cert_meta['clientCA'] = os.path.join(cfg_path, cfg['servingInfo']['clientCA'])
  429. ######################################################################
  430. # Load the certificate and the CA, parse their expiration dates into
  431. # datetime objects so we can manipulate them later
  432. for v in cert_meta.values():
  433. with io.open(v, 'r', encoding='utf-8') as fp:
  434. cert = fp.read()
  435. (cert_subject,
  436. cert_expiry_date,
  437. time_remaining,
  438. cert_serial) = load_and_handle_cert(cert, now, ans_module=module)
  439. expire_check_result = {
  440. 'cert_cn': cert_subject,
  441. 'path': fp.name,
  442. 'expiry': cert_expiry_date,
  443. 'days_remaining': time_remaining.days,
  444. 'health': None,
  445. 'serial': cert_serial
  446. }
  447. classify_cert(expire_check_result, now, time_remaining, expire_window, ocp_certs)
  448. ######################################################################
  449. # /Check for OpenShift Container Platform specific certs
  450. ######################################################################
  451. ######################################################################
  452. # Check service Kubeconfigs
  453. ######################################################################
  454. kubeconfigs = []
  455. # There may be additional kubeconfigs to check, but their naming
  456. # is less predictable than the ones we've already assembled.
  457. try:
  458. # Try to read the standard 'node-config.yaml' file to check if
  459. # this host is a node.
  460. with io.open(openshift_node_config_path, 'r', encoding='utf-8') as fp:
  461. cfg = yaml.load(fp)
  462. # OK, the config file exists, therefore this is a
  463. # node. Nodes have their own kubeconfig files to
  464. # communicate with the master API. Let's read the relative
  465. # path to that file from the node config.
  466. node_masterKubeConfig = cfg['masterKubeConfig']
  467. # As before, the path to the 'masterKubeConfig' file is
  468. # relative to `fp`
  469. cfg_path = os.path.dirname(fp.name)
  470. node_kubeconfig = os.path.join(cfg_path, node_masterKubeConfig)
  471. with io.open(node_kubeconfig, 'r', encoding='utf8') as fp:
  472. # Read in the nodes kubeconfig file and grab the good stuff
  473. cfg = yaml.load(fp)
  474. c = cfg['users'][0]['user']['client-certificate-data']
  475. (cert_subject,
  476. cert_expiry_date,
  477. time_remaining,
  478. cert_serial) = load_and_handle_cert(c, now, base64decode=True, ans_module=module)
  479. expire_check_result = {
  480. 'cert_cn': cert_subject,
  481. 'path': fp.name,
  482. 'expiry': cert_expiry_date,
  483. 'days_remaining': time_remaining.days,
  484. 'health': None,
  485. 'serial': cert_serial
  486. }
  487. classify_cert(expire_check_result, now, time_remaining, expire_window, kubeconfigs)
  488. except IOError:
  489. # This is not a node
  490. pass
  491. for kube in filter_paths(kubeconfig_paths):
  492. with io.open(kube, 'r', encoding='utf-8') as fp:
  493. # TODO: Maybe consider catching exceptions here?
  494. cfg = yaml.load(fp)
  495. # Per conversation, "the kubeconfigs you care about:
  496. # admin, router, registry should all be single
  497. # value". Following that advice we only grab the data for
  498. # the user at index 0 in the 'users' list. There should
  499. # not be more than one user.
  500. c = cfg['users'][0]['user']['client-certificate-data']
  501. (cert_subject,
  502. cert_expiry_date,
  503. time_remaining,
  504. cert_serial) = load_and_handle_cert(c, now, base64decode=True, ans_module=module)
  505. expire_check_result = {
  506. 'cert_cn': cert_subject,
  507. 'path': fp.name,
  508. 'expiry': cert_expiry_date,
  509. 'days_remaining': time_remaining.days,
  510. 'health': None,
  511. 'serial': cert_serial
  512. }
  513. classify_cert(expire_check_result, now, time_remaining, expire_window, kubeconfigs)
  514. ######################################################################
  515. # /Check service Kubeconfigs
  516. ######################################################################
  517. ######################################################################
  518. # Check etcd certs
  519. #
  520. # Two things to check: 'external' etcd, and embedded etcd.
  521. ######################################################################
  522. # FIRST: The 'external' etcd
  523. #
  524. # Some values may be duplicated, make this a set for now so we
  525. # unique them all
  526. etcd_certs_to_check = set([])
  527. etcd_certs = []
  528. etcd_cert_params.append('dne')
  529. try:
  530. with io.open('/etc/etcd/etcd.conf', 'r', encoding='utf-8') as fp:
  531. # Add dummy header section.
  532. config = io.StringIO()
  533. config.write(u'[ETCD]\n')
  534. config.write(fp.read().replace('%', '%%'))
  535. config.seek(0, os.SEEK_SET)
  536. etcd_config = configparser.ConfigParser()
  537. etcd_config.readfp(config)
  538. for param in etcd_cert_params:
  539. try:
  540. etcd_certs_to_check.add(etcd_config.get('ETCD', param))
  541. except configparser.NoOptionError:
  542. # That parameter does not exist, oh well...
  543. pass
  544. except IOError:
  545. # No etcd to see here, move along
  546. pass
  547. for etcd_cert in filter_paths(etcd_certs_to_check):
  548. with io.open(etcd_cert, 'r', encoding='utf-8') as fp:
  549. c = fp.read()
  550. (cert_subject,
  551. cert_expiry_date,
  552. time_remaining,
  553. cert_serial) = load_and_handle_cert(c, now, ans_module=module)
  554. expire_check_result = {
  555. 'cert_cn': cert_subject,
  556. 'path': fp.name,
  557. 'expiry': cert_expiry_date,
  558. 'days_remaining': time_remaining.days,
  559. 'health': None,
  560. 'serial': cert_serial
  561. }
  562. classify_cert(expire_check_result, now, time_remaining, expire_window, etcd_certs)
  563. ######################################################################
  564. # Now the embedded etcd
  565. ######################################################################
  566. try:
  567. with io.open('/etc/origin/master/master-config.yaml', 'r', encoding='utf-8') as fp:
  568. cfg = yaml.load(fp)
  569. except IOError:
  570. # Not present
  571. pass
  572. else:
  573. if cfg.get('etcdConfig', {}).get('servingInfo', {}).get('certFile', None) is not None:
  574. # This is embedded
  575. etcd_crt_name = cfg['etcdConfig']['servingInfo']['certFile']
  576. else:
  577. # Not embedded
  578. etcd_crt_name = None
  579. if etcd_crt_name is not None:
  580. # etcd_crt_name is relative to the location of the
  581. # master-config.yaml file
  582. cfg_path = os.path.dirname(fp.name)
  583. etcd_cert = os.path.join(cfg_path, etcd_crt_name)
  584. with open(etcd_cert, 'r') as etcd_fp:
  585. (cert_subject,
  586. cert_expiry_date,
  587. time_remaining,
  588. cert_serial) = load_and_handle_cert(etcd_fp.read(), now, ans_module=module)
  589. expire_check_result = {
  590. 'cert_cn': cert_subject,
  591. 'path': etcd_fp.name,
  592. 'expiry': cert_expiry_date,
  593. 'days_remaining': time_remaining.days,
  594. 'health': None,
  595. 'serial': cert_serial
  596. }
  597. classify_cert(expire_check_result, now, time_remaining, expire_window, etcd_certs)
  598. ######################################################################
  599. # /Check etcd certs
  600. ######################################################################
  601. ######################################################################
  602. # Check router/registry certs
  603. #
  604. # These are saved as secrets in etcd. That means that we can not
  605. # simply read a file to grab the data. Instead we're going to
  606. # subprocess out to the 'oc get' command. On non-masters this
  607. # command will fail, that is expected so we catch that exception.
  608. ######################################################################
  609. router_certs = []
  610. registry_certs = []
  611. ######################################################################
  612. # First the router certs
  613. try:
  614. router_secrets_raw = subprocess.Popen('oc get -n default secret router-certs -o yaml'.split(),
  615. stdout=subprocess.PIPE)
  616. router_ds = yaml.load(router_secrets_raw.communicate()[0])
  617. router_c = router_ds['data']['tls.crt']
  618. router_path = router_ds['metadata']['selfLink']
  619. except TypeError:
  620. # YAML couldn't load the result, this is not a master
  621. pass
  622. except OSError:
  623. # The OC command doesn't exist here. Move along.
  624. pass
  625. else:
  626. (cert_subject,
  627. cert_expiry_date,
  628. time_remaining,
  629. cert_serial) = load_and_handle_cert(router_c, now, base64decode=True, ans_module=module)
  630. expire_check_result = {
  631. 'cert_cn': cert_subject,
  632. 'path': router_path,
  633. 'expiry': cert_expiry_date,
  634. 'days_remaining': time_remaining.days,
  635. 'health': None,
  636. 'serial': cert_serial
  637. }
  638. classify_cert(expire_check_result, now, time_remaining, expire_window, router_certs)
  639. ######################################################################
  640. # Now for registry
  641. try:
  642. registry_secrets_raw = subprocess.Popen('oc get -n default secret registry-certificates -o yaml'.split(),
  643. stdout=subprocess.PIPE)
  644. registry_ds = yaml.load(registry_secrets_raw.communicate()[0])
  645. registry_c = registry_ds['data']['registry.crt']
  646. registry_path = registry_ds['metadata']['selfLink']
  647. except TypeError:
  648. # YAML couldn't load the result, this is not a master
  649. pass
  650. except OSError:
  651. # The OC command doesn't exist here. Move along.
  652. pass
  653. else:
  654. (cert_subject,
  655. cert_expiry_date,
  656. time_remaining,
  657. cert_serial) = load_and_handle_cert(registry_c, now, base64decode=True, ans_module=module)
  658. expire_check_result = {
  659. 'cert_cn': cert_subject,
  660. 'path': registry_path,
  661. 'expiry': cert_expiry_date,
  662. 'days_remaining': time_remaining.days,
  663. 'health': None,
  664. 'serial': cert_serial
  665. }
  666. classify_cert(expire_check_result, now, time_remaining, expire_window, registry_certs)
  667. ######################################################################
  668. # /Check router/registry certs
  669. ######################################################################
  670. res = tabulate_summary(ocp_certs, kubeconfigs, etcd_certs, router_certs, registry_certs)
  671. msg = "Checked {count} total certificates. Expired/Warning/OK: {exp}/{warn}/{ok}. Warning window: {window} days".format(
  672. count=res['total'],
  673. exp=res['expired'],
  674. warn=res['warning'],
  675. ok=res['ok'],
  676. window=int(module.params['warning_days']),
  677. )
  678. # By default we only return detailed information about expired or
  679. # warning certificates. If show_all is true then we will print all
  680. # the certificates examined.
  681. if not module.params['show_all']:
  682. check_results['ocp_certs'] = [crt for crt in ocp_certs if crt['health'] in ['expired', 'warning']]
  683. check_results['kubeconfigs'] = [crt for crt in kubeconfigs if crt['health'] in ['expired', 'warning']]
  684. check_results['etcd'] = [crt for crt in etcd_certs if crt['health'] in ['expired', 'warning']]
  685. check_results['registry'] = [crt for crt in registry_certs if crt['health'] in ['expired', 'warning']]
  686. check_results['router'] = [crt for crt in router_certs if crt['health'] in ['expired', 'warning']]
  687. else:
  688. check_results['ocp_certs'] = ocp_certs
  689. check_results['kubeconfigs'] = kubeconfigs
  690. check_results['etcd'] = etcd_certs
  691. check_results['registry'] = registry_certs
  692. check_results['router'] = router_certs
  693. # Sort the final results to report in order of ascending safety
  694. # time. That is to say, the certificates which will expire sooner
  695. # will be at the front of the list and certificates which will
  696. # expire later are at the end. Router and registry certs should be
  697. # limited to just 1 result, so don't bother sorting those.
  698. def cert_key(item):
  699. ''' return the days_remaining key '''
  700. return item['days_remaining']
  701. check_results['ocp_certs'] = sorted(check_results['ocp_certs'], key=cert_key)
  702. check_results['kubeconfigs'] = sorted(check_results['kubeconfigs'], key=cert_key)
  703. check_results['etcd'] = sorted(check_results['etcd'], key=cert_key)
  704. # This module will never change anything, but we might want to
  705. # change the return code parameter if there is some catastrophic
  706. # error we noticed earlier
  707. module.exit_json(
  708. check_results=check_results,
  709. summary=res,
  710. msg=msg,
  711. rc=0,
  712. changed=False
  713. )
  714. if __name__ == '__main__':
  715. main()