openshift_cert_expiry.py 33 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859
  1. #!/usr/bin/python
  2. # -*- coding: utf-8 -*-
  3. # pylint: disable=line-too-long,invalid-name
  4. """For details on this module see DOCUMENTATION (below)"""
  5. import datetime
  6. import io
  7. import os
  8. import subprocess
  9. import yaml
  10. # pylint import-error disabled because pylint cannot find the package
  11. # when installed in a virtualenv
  12. from ansible.module_utils.six.moves import configparser # pylint: disable=import-error
  13. from ansible.module_utils.basic import AnsibleModule
  14. try:
  15. # You can comment this import out and include a 'pass' in this
  16. # block if you're manually testing this module on a NON-ATOMIC
  17. # HOST (or any host that just doesn't have PyOpenSSL
  18. # available). That will force the `load_and_handle_cert` function
  19. # to use the Fake OpenSSL classes.
  20. import OpenSSL.crypto
  21. HAS_OPENSSL = True
  22. except ImportError:
  23. # Some platforms (such as RHEL Atomic) may not have the Python
  24. # OpenSSL library installed. In this case we will use a manual
  25. # work-around to parse each certificate.
  26. #
  27. # Check for 'OpenSSL.crypto' in `sys.modules` later.
  28. HAS_OPENSSL = False
  29. DOCUMENTATION = '''
  30. ---
  31. module: openshift_cert_expiry
  32. short_description: Check OpenShift Container Platform (OCP) and Kube certificate expirations on a cluster
  33. description:
  34. - The M(openshift_cert_expiry) module has two basic functions: to flag certificates which will expire in a set window of time from now, and to notify you about certificates which have already expired.
  35. - When the module finishes, a summary of the examination is returned. Each certificate in the summary has a C(health) key with a value of one of the following:
  36. - C(ok) - not expired, and outside of the expiration C(warning_days) window.
  37. - C(warning) - not expired, but will expire between now and the C(warning_days) window.
  38. - C(expired) - an expired certificate.
  39. - Certificate flagging follow this logic:
  40. - If the expiration date is before now then the certificate is classified as C(expired).
  41. - The certificates time to live (expiration date - now) is calculated, if that time window is less than C(warning_days) the certificate is classified as C(warning).
  42. - All other conditions are classified as C(ok).
  43. - The following keys are ALSO present in the certificate summary:
  44. - C(cert_cn) - The common name of the certificate (additional CNs present in SAN extensions are omitted)
  45. - C(days_remaining) - The number of days until the certificate expires.
  46. - C(expiry) - The date the certificate expires on.
  47. - C(path) - The full path to the certificate on the examined host.
  48. version_added: "1.0"
  49. options:
  50. config_base:
  51. description:
  52. - Base path to OCP system settings.
  53. required: false
  54. default: /etc/origin
  55. warning_days:
  56. description:
  57. - Flag certificates which will expire in C(warning_days) days from now.
  58. required: false
  59. default: 30
  60. show_all:
  61. description:
  62. - Enable this option to show analysis of ALL certificates examined by this module.
  63. - By default only certificates which have expired, or will expire within the C(warning_days) window will be reported.
  64. required: false
  65. default: false
  66. author: "Tim Bielawa (@tbielawa) <tbielawa@redhat.com>"
  67. '''
  68. EXAMPLES = '''
  69. # Default invocation, only notify about expired certificates or certificates which will expire within 30 days from now
  70. - openshift_cert_expiry:
  71. # Expand the warning window to show certificates expiring within a year from now
  72. - openshift_cert_expiry: warning_days=365
  73. # Show expired, soon to expire (now + 30 days), and all other certificates examined
  74. - openshift_cert_expiry: show_all=true
  75. '''
  76. class FakeOpenSSLCertificate(object):
  77. """This provides a rough mock of what you get from
  78. `OpenSSL.crypto.load_certificate()`. This is a work-around for
  79. platforms missing the Python OpenSSL library.
  80. """
  81. def __init__(self, cert_string):
  82. """`cert_string` is a certificate in the form you get from running a
  83. .crt through 'openssl x509 -in CERT.cert -text'"""
  84. self.cert_string = cert_string
  85. self.serial = None
  86. self.subject = None
  87. self.extensions = []
  88. self.not_after = None
  89. self._parse_cert()
  90. def _parse_cert(self):
  91. """Manually parse the certificate line by line"""
  92. self.extensions = []
  93. PARSING_ALT_NAMES = False
  94. PARSING_HEX_SERIAL = False
  95. for line in self.cert_string.split('\n'):
  96. l = line.strip()
  97. if PARSING_ALT_NAMES:
  98. # We're parsing a 'Subject Alternative Name' line
  99. self.extensions.append(
  100. FakeOpenSSLCertificateSANExtension(l))
  101. PARSING_ALT_NAMES = False
  102. continue
  103. if PARSING_HEX_SERIAL:
  104. # Hex serials arrive colon-delimited
  105. serial_raw = l.replace(':', '')
  106. # Convert to decimal
  107. self.serial = int('0x' + serial_raw, base=16)
  108. PARSING_HEX_SERIAL = False
  109. continue
  110. # parse out the bits that we can
  111. if l.startswith('Serial Number:'):
  112. # Decimal format:
  113. # Serial Number: 11 (0xb)
  114. # => 11
  115. # Hex Format (large serials):
  116. # Serial Number:
  117. # 0a:de:eb:24:04:75:ab:56:39:14:e9:5a:22:e2:85:bf
  118. # => 14449739080294792594019643629255165375
  119. if l.endswith(':'):
  120. PARSING_HEX_SERIAL = True
  121. continue
  122. self.serial = int(l.split()[-2])
  123. elif l.startswith('Not After :'):
  124. # Not After : Feb 7 18:19:35 2019 GMT
  125. # => strptime(str, '%b %d %H:%M:%S %Y %Z')
  126. # => strftime('%Y%m%d%H%M%SZ')
  127. # => 20190207181935Z
  128. not_after_raw = l.partition(' : ')[-1]
  129. # Last item: ('Not After', ' : ', 'Feb 7 18:19:35 2019 GMT')
  130. not_after_parsed = datetime.datetime.strptime(not_after_raw, '%b %d %H:%M:%S %Y %Z')
  131. self.not_after = not_after_parsed.strftime('%Y%m%d%H%M%SZ')
  132. elif l.startswith('X509v3 Subject Alternative Name:'):
  133. PARSING_ALT_NAMES = True
  134. continue
  135. elif l.startswith('Subject:'):
  136. # O = system:nodes, CN = system:node:m01.example.com
  137. self.subject = FakeOpenSSLCertificateSubjects(l.partition(': ')[-1])
  138. def get_serial_number(self):
  139. """Return the serial number of the cert"""
  140. return self.serial
  141. def get_subject(self):
  142. """Subjects must implement get_components() and return dicts or
  143. tuples. An 'openssl x509 -in CERT.cert -text' with 'Subject':
  144. Subject: Subject: O=system:nodes, CN=system:node:m01.example.com
  145. might return: [('O=system', 'nodes'), ('CN=system', 'node:m01.example.com')]
  146. """
  147. return self.subject
  148. def get_extension(self, i):
  149. """Extensions must implement get_short_name() and return the string
  150. 'subjectAltName'"""
  151. return self.extensions[i]
  152. def get_extension_count(self):
  153. """ get_extension_count """
  154. return len(self.extensions)
  155. def get_notAfter(self):
  156. """Returns a date stamp as a string in the form
  157. '20180922170439Z'. strptime the result with format param:
  158. '%Y%m%d%H%M%SZ'."""
  159. return self.not_after
  160. class FakeOpenSSLCertificateSANExtension(object): # pylint: disable=too-few-public-methods
  161. """Mocks what happens when `get_extension` is called on a certificate
  162. object"""
  163. def __init__(self, san_string):
  164. """With `san_string` as you get from:
  165. $ openssl x509 -in certificate.crt -text
  166. """
  167. self.san_string = san_string
  168. self.short_name = 'subjectAltName'
  169. def get_short_name(self):
  170. """Return the 'type' of this extension. It's always the same though
  171. because we only care about subjectAltName's"""
  172. return self.short_name
  173. def __str__(self):
  174. """Return this extension and the value as a simple string"""
  175. return self.san_string
  176. # pylint: disable=too-few-public-methods
  177. class FakeOpenSSLCertificateSubjects(object):
  178. """Mocks what happens when `get_subject` is called on a certificate
  179. object"""
  180. def __init__(self, subject_string):
  181. """With `subject_string` as you get from:
  182. $ openssl x509 -in certificate.crt -text
  183. """
  184. self.subjects = []
  185. for s in subject_string.split(', '):
  186. name, _, value = s.partition(' = ')
  187. self.subjects.append((name, value))
  188. def get_components(self):
  189. """Returns a list of tuples"""
  190. return self.subjects
  191. # We only need this for one thing, we don't care if it doesn't have
  192. # that many public methods
  193. #
  194. # pylint: disable=too-few-public-methods
  195. class FakeSecHead(object):
  196. """etcd does not begin their config file with an opening [section] as
  197. required by the Python ConfigParser module. We hack around it by
  198. slipping one in ourselves prior to parsing.
  199. Source: Alex Martelli - http://stackoverflow.com/a/2819788/6490583
  200. """
  201. def __init__(self, fp):
  202. self.fp = fp
  203. self.sechead = '[ETCD]\n'
  204. def readline(self):
  205. """Make this look like a file-type object"""
  206. if self.sechead:
  207. try:
  208. return self.sechead
  209. finally:
  210. self.sechead = None
  211. else:
  212. return self.fp.readline()
  213. ######################################################################
  214. def filter_paths(path_list):
  215. """`path_list` - A list of file paths to check. Only files which exist
  216. will be returned
  217. """
  218. return [p for p in path_list if os.path.exists(os.path.realpath(p))]
  219. # pylint: disable=too-many-locals,too-many-branches
  220. #
  221. # TODO: Break this function down into smaller chunks
  222. def load_and_handle_cert(cert_string, now, base64decode=False, ans_module=None):
  223. """Load a certificate, split off the good parts, and return some
  224. useful data
  225. Params:
  226. - `cert_string` (string) - a certificate loaded into a string object
  227. - `now` (datetime) - a datetime object of the time to calculate the certificate 'time_remaining' against
  228. - `base64decode` (bool) - run .decode('base64') on the input?
  229. - `ans_module` (AnsibleModule) - The AnsibleModule object for this module (so we can raise errors)
  230. Returns:
  231. A tuple of the form:
  232. (cert_subject, cert_expiry_date, time_remaining, cert_serial_number)
  233. """
  234. if base64decode:
  235. _cert_string = cert_string.decode('base-64')
  236. else:
  237. _cert_string = cert_string
  238. # Disable this. We 'redefine' the type because we are working
  239. # around a missing library on the target host.
  240. #
  241. # pylint: disable=redefined-variable-type
  242. if HAS_OPENSSL:
  243. # No work-around required
  244. cert_loaded = OpenSSL.crypto.load_certificate(
  245. OpenSSL.crypto.FILETYPE_PEM, _cert_string)
  246. else:
  247. # Missing library, work-around required. Run the 'openssl'
  248. # command on it to decode it
  249. cmd = 'openssl x509 -text'
  250. try:
  251. openssl_proc = subprocess.Popen(cmd.split(),
  252. stdout=subprocess.PIPE,
  253. stdin=subprocess.PIPE)
  254. except OSError:
  255. ans_module.fail_json(msg="Error: The 'OpenSSL' python library and CLI command were not found on the target host. Unable to parse any certificates. This host will not be included in generated reports.")
  256. else:
  257. openssl_decoded = openssl_proc.communicate(_cert_string.encode('utf-8'))[0].decode('utf-8')
  258. cert_loaded = FakeOpenSSLCertificate(openssl_decoded)
  259. ######################################################################
  260. # Read all possible names from the cert
  261. cert_subjects = []
  262. for name, value in cert_loaded.get_subject().get_components():
  263. cert_subjects.append('{}:{}'.format(name, value))
  264. # To read SANs from a cert we must read the subjectAltName
  265. # extension from the X509 Object. What makes this more difficult
  266. # is that pyOpenSSL does not give extensions as an iterable
  267. san = None
  268. for i in range(cert_loaded.get_extension_count()):
  269. ext = cert_loaded.get_extension(i)
  270. if ext.get_short_name() == 'subjectAltName':
  271. san = ext
  272. if san is not None:
  273. # The X509Extension object for subjectAltName prints as a
  274. # string with the alt names separated by a comma and a
  275. # space. Split the string by ', ' and then add our new names
  276. # to the list of existing names
  277. cert_subjects.extend(str(san).split(', '))
  278. cert_subject = ', '.join(cert_subjects)
  279. ######################################################################
  280. # Grab the expiration date
  281. not_after = cert_loaded.get_notAfter()
  282. # example get_notAfter() => 20180922170439Z
  283. if isinstance(not_after, bytes):
  284. not_after = not_after.decode('utf-8')
  285. cert_expiry_date = datetime.datetime.strptime(
  286. not_after,
  287. '%Y%m%d%H%M%SZ')
  288. time_remaining = cert_expiry_date - now
  289. return (cert_subject, cert_expiry_date, time_remaining, cert_loaded.get_serial_number())
  290. def classify_cert(cert_meta, now, time_remaining, expire_window, cert_list):
  291. """Given metadata about a certificate under examination, classify it
  292. into one of three categories, 'ok', 'warning', and 'expired'.
  293. Params:
  294. - `cert_meta` dict - A dict with certificate metadata. Required fields
  295. include: 'cert_cn', 'path', 'expiry', 'days_remaining', 'health'.
  296. - `now` (datetime) - a datetime object of the time to calculate the certificate 'time_remaining' against
  297. - `time_remaining` (datetime.timedelta) - a timedelta for how long until the cert expires
  298. - `expire_window` (datetime.timedelta) - a timedelta for how long the warning window is
  299. - `cert_list` list - A list to shove the classified cert into
  300. Return:
  301. - `cert_list` - The updated list of classified certificates
  302. """
  303. expiry_str = str(cert_meta['expiry'])
  304. # Categorization
  305. if cert_meta['expiry'] < now:
  306. # This already expired, must NOTIFY
  307. cert_meta['health'] = 'expired'
  308. elif time_remaining < expire_window:
  309. # WARN about this upcoming expirations
  310. cert_meta['health'] = 'warning'
  311. else:
  312. # Not expired or about to expire
  313. cert_meta['health'] = 'ok'
  314. cert_meta['expiry'] = expiry_str
  315. cert_meta['serial_hex'] = hex(int(cert_meta['serial']))
  316. cert_list.append(cert_meta)
  317. return cert_list
  318. def tabulate_summary(certificates, kubeconfigs, etcd_certs, router_certs, registry_certs):
  319. """Calculate the summary text for when the module finishes
  320. running. This includes counts of each classification and what have
  321. you.
  322. Params:
  323. - `certificates` (list of dicts) - Processed `expire_check_result`
  324. dicts with filled in `health` keys for system certificates.
  325. - `kubeconfigs` - as above for kubeconfigs
  326. - `etcd_certs` - as above for etcd certs
  327. Return:
  328. - `summary_results` (dict) - Counts of each cert type classification
  329. and total items examined.
  330. """
  331. items = certificates + kubeconfigs + etcd_certs + router_certs + registry_certs
  332. summary_results = {
  333. 'system_certificates': len(certificates),
  334. 'kubeconfig_certificates': len(kubeconfigs),
  335. 'etcd_certificates': len(etcd_certs),
  336. 'router_certs': len(router_certs),
  337. 'registry_certs': len(registry_certs),
  338. 'total': len(items),
  339. 'ok': 0,
  340. 'warning': 0,
  341. 'expired': 0
  342. }
  343. summary_results['expired'] = len([c for c in items if c['health'] == 'expired'])
  344. summary_results['warning'] = len([c for c in items if c['health'] == 'warning'])
  345. summary_results['ok'] = len([c for c in items if c['health'] == 'ok'])
  346. return summary_results
  347. ######################################################################
  348. # This is our module MAIN function after all, so there's bound to be a
  349. # lot of code bundled up into one block
  350. #
  351. # Reason: These checks are disabled because the issue was introduced
  352. # during a period where the pylint checks weren't enabled for this file
  353. # Status: temporarily disabled pending future refactoring
  354. # pylint: disable=too-many-locals,too-many-statements,too-many-branches
  355. def main():
  356. """This module examines certificates (in various forms) which compose
  357. an OpenShift Container Platform cluster
  358. """
  359. module = AnsibleModule(
  360. argument_spec=dict(
  361. config_base=dict(
  362. required=False,
  363. default="/etc/origin",
  364. type='str'),
  365. warning_days=dict(
  366. required=False,
  367. default=30,
  368. type='int'),
  369. show_all=dict(
  370. required=False,
  371. default=False,
  372. type='bool')
  373. ),
  374. supports_check_mode=True,
  375. )
  376. # Basic scaffolding for OpenShift specific certs
  377. openshift_base_config_path = os.path.realpath(module.params['config_base'])
  378. openshift_master_config_path = os.path.join(openshift_base_config_path,
  379. "master", "master-config.yaml")
  380. openshift_node_config_path = os.path.join(openshift_base_config_path,
  381. "node", "node-config.yaml")
  382. openshift_cert_check_paths = [
  383. openshift_master_config_path,
  384. openshift_node_config_path,
  385. ]
  386. # Paths for Kubeconfigs. Additional kubeconfigs are conditionally
  387. # checked later in the code
  388. master_kube_configs = ['admin', 'openshift-master',
  389. 'openshift-node', 'openshift-router',
  390. 'openshift-registry']
  391. kubeconfig_paths = []
  392. for m_kube_config in master_kube_configs:
  393. kubeconfig_paths.append(
  394. os.path.join(openshift_base_config_path, "master", m_kube_config + ".kubeconfig")
  395. )
  396. # Validate some paths we have the ability to do ahead of time
  397. openshift_cert_check_paths = filter_paths(openshift_cert_check_paths)
  398. kubeconfig_paths = filter_paths(kubeconfig_paths)
  399. # etcd, where do you hide your certs? Used when parsing etcd.conf
  400. etcd_cert_params = [
  401. "ETCD_CA_FILE",
  402. "ETCD_CERT_FILE",
  403. "ETCD_PEER_CA_FILE",
  404. "ETCD_PEER_CERT_FILE",
  405. ]
  406. # Expiry checking stuff
  407. now = datetime.datetime.now()
  408. # todo, catch exception for invalid input and return a fail_json
  409. warning_days = int(module.params['warning_days'])
  410. expire_window = datetime.timedelta(days=warning_days)
  411. # Module stuff
  412. #
  413. # The results of our cert checking to return from the task call
  414. check_results = {}
  415. check_results['meta'] = {}
  416. check_results['meta']['warning_days'] = warning_days
  417. check_results['meta']['checked_at_time'] = str(now)
  418. check_results['meta']['warn_before_date'] = str(now + expire_window)
  419. check_results['meta']['show_all'] = str(module.params['show_all'])
  420. # All the analyzed certs accumulate here
  421. ocp_certs = []
  422. ######################################################################
  423. # Sure, why not? Let's enable check mode.
  424. if module.check_mode:
  425. check_results['ocp_certs'] = []
  426. module.exit_json(
  427. check_results=check_results,
  428. msg="Checked 0 total certificates. Expired/Warning/OK: 0/0/0. Warning window: %s days" % module.params['warning_days'],
  429. rc=0,
  430. changed=False
  431. )
  432. ######################################################################
  433. # Check for OpenShift Container Platform specific certs
  434. ######################################################################
  435. for os_cert in filter_paths(openshift_cert_check_paths):
  436. # Open up that config file and locate the cert and CA
  437. with io.open(os_cert, 'r', encoding='utf-8') as fp:
  438. cert_meta = {}
  439. cfg = yaml.load(fp)
  440. # cert files are specified in parsed `fp` as relative to the path
  441. # of the original config file. 'master-config.yaml' with certFile
  442. # = 'foo.crt' implies that 'foo.crt' is in the same
  443. # directory. certFile = '../foo.crt' is in the parent directory.
  444. cfg_path = os.path.dirname(fp.name)
  445. cert_meta['certFile'] = os.path.join(cfg_path, cfg['servingInfo']['certFile'])
  446. cert_meta['clientCA'] = os.path.join(cfg_path, cfg['servingInfo']['clientCA'])
  447. ######################################################################
  448. # Load the certificate and the CA, parse their expiration dates into
  449. # datetime objects so we can manipulate them later
  450. for _, v in cert_meta.items():
  451. with io.open(v, 'r', encoding='utf-8') as fp:
  452. cert = fp.read()
  453. (cert_subject,
  454. cert_expiry_date,
  455. time_remaining,
  456. cert_serial) = load_and_handle_cert(cert, now, ans_module=module)
  457. expire_check_result = {
  458. 'cert_cn': cert_subject,
  459. 'path': fp.name,
  460. 'expiry': cert_expiry_date,
  461. 'days_remaining': time_remaining.days,
  462. 'health': None,
  463. 'serial': cert_serial
  464. }
  465. classify_cert(expire_check_result, now, time_remaining, expire_window, ocp_certs)
  466. ######################################################################
  467. # /Check for OpenShift Container Platform specific certs
  468. ######################################################################
  469. ######################################################################
  470. # Check service Kubeconfigs
  471. ######################################################################
  472. kubeconfigs = []
  473. # There may be additional kubeconfigs to check, but their naming
  474. # is less predictable than the ones we've already assembled.
  475. try:
  476. # Try to read the standard 'node-config.yaml' file to check if
  477. # this host is a node.
  478. with io.open(openshift_node_config_path, 'r', encoding='utf-8') as fp:
  479. cfg = yaml.load(fp)
  480. # OK, the config file exists, therefore this is a
  481. # node. Nodes have their own kubeconfig files to
  482. # communicate with the master API. Let's read the relative
  483. # path to that file from the node config.
  484. node_masterKubeConfig = cfg['masterKubeConfig']
  485. # As before, the path to the 'masterKubeConfig' file is
  486. # relative to `fp`
  487. cfg_path = os.path.dirname(fp.name)
  488. node_kubeconfig = os.path.join(cfg_path, node_masterKubeConfig)
  489. with io.open(node_kubeconfig, 'r', encoding='utf8') as fp:
  490. # Read in the nodes kubeconfig file and grab the good stuff
  491. cfg = yaml.load(fp)
  492. c = cfg['users'][0]['user']['client-certificate-data']
  493. (cert_subject,
  494. cert_expiry_date,
  495. time_remaining,
  496. cert_serial) = load_and_handle_cert(c, now, base64decode=True, ans_module=module)
  497. expire_check_result = {
  498. 'cert_cn': cert_subject,
  499. 'path': fp.name,
  500. 'expiry': cert_expiry_date,
  501. 'days_remaining': time_remaining.days,
  502. 'health': None,
  503. 'serial': cert_serial
  504. }
  505. classify_cert(expire_check_result, now, time_remaining, expire_window, kubeconfigs)
  506. except IOError:
  507. # This is not a node
  508. pass
  509. for kube in filter_paths(kubeconfig_paths):
  510. with io.open(kube, 'r', encoding='utf-8') as fp:
  511. # TODO: Maybe consider catching exceptions here?
  512. cfg = yaml.load(fp)
  513. # Per conversation, "the kubeconfigs you care about:
  514. # admin, router, registry should all be single
  515. # value". Following that advice we only grab the data for
  516. # the user at index 0 in the 'users' list. There should
  517. # not be more than one user.
  518. c = cfg['users'][0]['user']['client-certificate-data']
  519. (cert_subject,
  520. cert_expiry_date,
  521. time_remaining,
  522. cert_serial) = load_and_handle_cert(c, now, base64decode=True, ans_module=module)
  523. expire_check_result = {
  524. 'cert_cn': cert_subject,
  525. 'path': fp.name,
  526. 'expiry': cert_expiry_date,
  527. 'days_remaining': time_remaining.days,
  528. 'health': None,
  529. 'serial': cert_serial
  530. }
  531. classify_cert(expire_check_result, now, time_remaining, expire_window, kubeconfigs)
  532. ######################################################################
  533. # /Check service Kubeconfigs
  534. ######################################################################
  535. ######################################################################
  536. # Check etcd certs
  537. #
  538. # Two things to check: 'external' etcd, and embedded etcd.
  539. ######################################################################
  540. # FIRST: The 'external' etcd
  541. #
  542. # Some values may be duplicated, make this a set for now so we
  543. # unique them all
  544. etcd_certs_to_check = set([])
  545. etcd_certs = []
  546. etcd_cert_params.append('dne')
  547. try:
  548. with io.open('/etc/etcd/etcd.conf', 'r', encoding='utf-8') as fp:
  549. etcd_config = configparser.ConfigParser()
  550. # Reason: This check is disabled because the issue was introduced
  551. # during a period where the pylint checks weren't enabled for this file
  552. # Status: temporarily disabled pending future refactoring
  553. # pylint: disable=deprecated-method
  554. etcd_config.readfp(FakeSecHead(fp))
  555. for param in etcd_cert_params:
  556. try:
  557. etcd_certs_to_check.add(etcd_config.get('ETCD', param))
  558. except configparser.NoOptionError:
  559. # That parameter does not exist, oh well...
  560. pass
  561. except IOError:
  562. # No etcd to see here, move along
  563. pass
  564. for etcd_cert in filter_paths(etcd_certs_to_check):
  565. with io.open(etcd_cert, 'r', encoding='utf-8') as fp:
  566. c = fp.read()
  567. (cert_subject,
  568. cert_expiry_date,
  569. time_remaining,
  570. cert_serial) = load_and_handle_cert(c, now, ans_module=module)
  571. expire_check_result = {
  572. 'cert_cn': cert_subject,
  573. 'path': fp.name,
  574. 'expiry': cert_expiry_date,
  575. 'days_remaining': time_remaining.days,
  576. 'health': None,
  577. 'serial': cert_serial
  578. }
  579. classify_cert(expire_check_result, now, time_remaining, expire_window, etcd_certs)
  580. ######################################################################
  581. # Now the embedded etcd
  582. ######################################################################
  583. try:
  584. with io.open('/etc/origin/master/master-config.yaml', 'r', encoding='utf-8') as fp:
  585. cfg = yaml.load(fp)
  586. except IOError:
  587. # Not present
  588. pass
  589. else:
  590. if cfg.get('etcdConfig', {}).get('servingInfo', {}).get('certFile', None) is not None:
  591. # This is embedded
  592. etcd_crt_name = cfg['etcdConfig']['servingInfo']['certFile']
  593. else:
  594. # Not embedded
  595. etcd_crt_name = None
  596. if etcd_crt_name is not None:
  597. # etcd_crt_name is relative to the location of the
  598. # master-config.yaml file
  599. cfg_path = os.path.dirname(fp.name)
  600. etcd_cert = os.path.join(cfg_path, etcd_crt_name)
  601. with open(etcd_cert, 'r') as etcd_fp:
  602. (cert_subject,
  603. cert_expiry_date,
  604. time_remaining,
  605. cert_serial) = load_and_handle_cert(etcd_fp.read(), now, ans_module=module)
  606. expire_check_result = {
  607. 'cert_cn': cert_subject,
  608. 'path': etcd_fp.name,
  609. 'expiry': cert_expiry_date,
  610. 'days_remaining': time_remaining.days,
  611. 'health': None,
  612. 'serial': cert_serial
  613. }
  614. classify_cert(expire_check_result, now, time_remaining, expire_window, etcd_certs)
  615. ######################################################################
  616. # /Check etcd certs
  617. ######################################################################
  618. ######################################################################
  619. # Check router/registry certs
  620. #
  621. # These are saved as secrets in etcd. That means that we can not
  622. # simply read a file to grab the data. Instead we're going to
  623. # subprocess out to the 'oc get' command. On non-masters this
  624. # command will fail, that is expected so we catch that exception.
  625. ######################################################################
  626. router_certs = []
  627. registry_certs = []
  628. ######################################################################
  629. # First the router certs
  630. try:
  631. router_secrets_raw = subprocess.Popen('oc get -n default secret router-certs -o yaml'.split(),
  632. stdout=subprocess.PIPE)
  633. router_ds = yaml.load(router_secrets_raw.communicate()[0])
  634. router_c = router_ds['data']['tls.crt']
  635. router_path = router_ds['metadata']['selfLink']
  636. except TypeError:
  637. # YAML couldn't load the result, this is not a master
  638. pass
  639. except OSError:
  640. # The OC command doesn't exist here. Move along.
  641. pass
  642. else:
  643. (cert_subject,
  644. cert_expiry_date,
  645. time_remaining,
  646. cert_serial) = load_and_handle_cert(router_c, now, base64decode=True, ans_module=module)
  647. expire_check_result = {
  648. 'cert_cn': cert_subject,
  649. 'path': router_path,
  650. 'expiry': cert_expiry_date,
  651. 'days_remaining': time_remaining.days,
  652. 'health': None,
  653. 'serial': cert_serial
  654. }
  655. classify_cert(expire_check_result, now, time_remaining, expire_window, router_certs)
  656. ######################################################################
  657. # Now for registry
  658. try:
  659. registry_secrets_raw = subprocess.Popen('oc get -n default secret registry-certificates -o yaml'.split(),
  660. stdout=subprocess.PIPE)
  661. registry_ds = yaml.load(registry_secrets_raw.communicate()[0])
  662. registry_c = registry_ds['data']['registry.crt']
  663. registry_path = registry_ds['metadata']['selfLink']
  664. except TypeError:
  665. # YAML couldn't load the result, this is not a master
  666. pass
  667. except OSError:
  668. # The OC command doesn't exist here. Move along.
  669. pass
  670. else:
  671. (cert_subject,
  672. cert_expiry_date,
  673. time_remaining,
  674. cert_serial) = load_and_handle_cert(registry_c, now, base64decode=True, ans_module=module)
  675. expire_check_result = {
  676. 'cert_cn': cert_subject,
  677. 'path': registry_path,
  678. 'expiry': cert_expiry_date,
  679. 'days_remaining': time_remaining.days,
  680. 'health': None,
  681. 'serial': cert_serial
  682. }
  683. classify_cert(expire_check_result, now, time_remaining, expire_window, registry_certs)
  684. ######################################################################
  685. # /Check router/registry certs
  686. ######################################################################
  687. res = tabulate_summary(ocp_certs, kubeconfigs, etcd_certs, router_certs, registry_certs)
  688. msg = "Checked {count} total certificates. Expired/Warning/OK: {exp}/{warn}/{ok}. Warning window: {window} days".format(
  689. count=res['total'],
  690. exp=res['expired'],
  691. warn=res['warning'],
  692. ok=res['ok'],
  693. window=int(module.params['warning_days']),
  694. )
  695. # By default we only return detailed information about expired or
  696. # warning certificates. If show_all is true then we will print all
  697. # the certificates examined.
  698. if not module.params['show_all']:
  699. check_results['ocp_certs'] = [crt for crt in ocp_certs if crt['health'] in ['expired', 'warning']]
  700. check_results['kubeconfigs'] = [crt for crt in kubeconfigs if crt['health'] in ['expired', 'warning']]
  701. check_results['etcd'] = [crt for crt in etcd_certs if crt['health'] in ['expired', 'warning']]
  702. check_results['registry'] = [crt for crt in registry_certs if crt['health'] in ['expired', 'warning']]
  703. check_results['router'] = [crt for crt in router_certs if crt['health'] in ['expired', 'warning']]
  704. else:
  705. check_results['ocp_certs'] = ocp_certs
  706. check_results['kubeconfigs'] = kubeconfigs
  707. check_results['etcd'] = etcd_certs
  708. check_results['registry'] = registry_certs
  709. check_results['router'] = router_certs
  710. # Sort the final results to report in order of ascending safety
  711. # time. That is to say, the certificates which will expire sooner
  712. # will be at the front of the list and certificates which will
  713. # expire later are at the end. Router and registry certs should be
  714. # limited to just 1 result, so don't bother sorting those.
  def cert_key(item):
      """Sort key for certificate check results.

      Args:
          item: a certificate result dict that holds a 'days_remaining'
              entry.

      Returns:
          The value stored under 'days_remaining', so that sorting with
          this key puts the certificates closest to expiry first.

      Raises:
          KeyError: if `item` has no 'days_remaining' entry.
      """
      return item['days_remaining']
  718. check_results['ocp_certs'] = sorted(check_results['ocp_certs'], key=cert_key)
  719. check_results['kubeconfigs'] = sorted(check_results['kubeconfigs'], key=cert_key)
  720. check_results['etcd'] = sorted(check_results['etcd'], key=cert_key)
  721. # This module will never change anything, but we might want to
  722. # change the return code parameter if there is some catastrophic
  723. # error we noticed earlier
  724. module.exit_json(
  725. check_results=check_results,
  726. summary=res,
  727. msg=msg,
  728. rc=0,
  729. changed=False
  730. )
  # Script entry point: only invoke main() when this file is executed
  # directly, not when it is imported.
  if __name__ == '__main__':
      main()