cluster 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407
  1. #!/usr/bin/env python2
  2. # vim: expandtab:tabstop=4:shiftwidth=4
  3. import argparse
  4. import ConfigParser
  5. import os
  6. import sys
  7. import subprocess
  8. import traceback
  9. class Cluster(object):
  10. """
  11. Provide Command, Control and Configuration (c3) Interface for OpenShift Clusters
  12. """
  13. def __init__(self):
  14. # setup ansible ssh environment
  15. if 'ANSIBLE_SSH_ARGS' not in os.environ:
  16. os.environ['ANSIBLE_SSH_ARGS'] = (
  17. '-o ForwardAgent=yes '
  18. '-o StrictHostKeyChecking=no '
  19. '-o UserKnownHostsFile=/dev/null '
  20. '-o ControlMaster=auto '
  21. '-o ControlPersist=600s '
  22. )
  23. # Because of `UserKnownHostsFile=/dev/null`
  24. # our `.ssh/known_hosts` file most probably misses the ssh host public keys
  25. # of our servers.
  26. # In that case, ansible serializes the execution of ansible modules
  27. # because we might be interactively prompted to accept the ssh host public keys.
  28. # Because of `StrictHostKeyChecking=no` we know that we won't be prompted
  29. # So, we don't want our modules execution to be serialized.
  30. os.environ['ANSIBLE_HOST_KEY_CHECKING'] = 'False'
  31. # TODO: A more secure way to proceed would consist in dynamically
  32. # retrieving the ssh host public keys from the IaaS interface
  33. if 'ANSIBLE_SSH_PIPELINING' not in os.environ:
  34. os.environ['ANSIBLE_SSH_PIPELINING'] = 'True'
  35. def get_deployment_type(self, args):
  36. """
  37. Get the deployment_type based on the environment variables and the
  38. command line arguments
  39. :param args: command line arguments provided by the user
  40. :return: string representing the deployment type
  41. """
  42. deployment_type = 'origin'
  43. if args.deployment_type:
  44. deployment_type = args.deployment_type
  45. elif 'OS_DEPLOYMENT_TYPE' in os.environ:
  46. deployment_type = os.environ['OS_DEPLOYMENT_TYPE']
  47. return deployment_type
  48. def create(self, args):
  49. """
  50. Create an OpenShift cluster for given provider
  51. :param args: command line arguments provided by user
  52. """
  53. cluster = {'cluster_id': args.cluster_id,
  54. 'deployment_type': self.get_deployment_type(args)}
  55. playbook = "playbooks/{0}/openshift-cluster/launch.yml".format(args.provider)
  56. inventory = self.setup_provider(args.provider)
  57. cluster['num_masters'] = args.masters
  58. cluster['num_nodes'] = args.nodes
  59. cluster['num_infra'] = args.infra
  60. cluster['num_etcd'] = args.etcd
  61. cluster['cluster_env'] = args.env
  62. self.action(args, inventory, cluster, playbook)
  63. def add_nodes(self, args):
  64. """
  65. Add nodes to an existing cluster for given provider
  66. :param args: command line arguments provided by user
  67. """
  68. cluster = {'cluster_id': args.cluster_id,
  69. 'deployment_type': self.get_deployment_type(args),
  70. }
  71. playbook = "playbooks/{0}/openshift-cluster/add_nodes.yml".format(args.provider)
  72. inventory = self.setup_provider(args.provider)
  73. cluster['num_nodes'] = args.nodes
  74. cluster['num_infra'] = args.infra
  75. cluster['cluster_env'] = args.env
  76. self.action(args, inventory, cluster, playbook)
  77. def terminate(self, args):
  78. """
  79. Destroy OpenShift cluster
  80. :param args: command line arguments provided by user
  81. """
  82. cluster = {'cluster_id': args.cluster_id,
  83. 'deployment_type': self.get_deployment_type(args),
  84. 'cluster_env': args.env,
  85. }
  86. playbook = "playbooks/{0}/openshift-cluster/terminate.yml".format(args.provider)
  87. inventory = self.setup_provider(args.provider)
  88. self.action(args, inventory, cluster, playbook)
  89. def list(self, args):
  90. """
  91. List VMs in cluster
  92. :param args: command line arguments provided by user
  93. """
  94. cluster = {'cluster_id': args.cluster_id,
  95. 'deployment_type': self.get_deployment_type(args),
  96. 'cluster_env': args.env,
  97. }
  98. playbook = "playbooks/{0}/openshift-cluster/list.yml".format(args.provider)
  99. inventory = self.setup_provider(args.provider)
  100. self.action(args, inventory, cluster, playbook)
  101. def config(self, args):
  102. """
  103. Configure or reconfigure OpenShift across clustered VMs
  104. :param args: command line arguments provided by user
  105. """
  106. cluster = {'cluster_id': args.cluster_id,
  107. 'deployment_type': self.get_deployment_type(args),
  108. 'cluster_env': args.env,
  109. }
  110. playbook = "playbooks/{0}/openshift-cluster/config.yml".format(args.provider)
  111. inventory = self.setup_provider(args.provider)
  112. self.action(args, inventory, cluster, playbook)
  113. def update(self, args):
  114. """
  115. Update to latest OpenShift across clustered VMs
  116. :param args: command line arguments provided by user
  117. """
  118. cluster = {'cluster_id': args.cluster_id,
  119. 'deployment_type': self.get_deployment_type(args),
  120. 'cluster_env': args.env,
  121. }
  122. playbook = "playbooks/{0}/openshift-cluster/update.yml".format(args.provider)
  123. inventory = self.setup_provider(args.provider)
  124. self.action(args, inventory, cluster, playbook)
  125. def service(self, args):
  126. """
  127. Make the same service call across all nodes in the cluster
  128. :param args: command line arguments provided by user
  129. """
  130. cluster = {'cluster_id': args.cluster_id,
  131. 'deployment_type': self.get_deployment_type(args),
  132. 'new_cluster_state': args.state,
  133. 'cluster_env': args.env,
  134. }
  135. playbook = "playbooks/{0}/openshift-cluster/service.yml".format(args.provider)
  136. inventory = self.setup_provider(args.provider)
  137. self.action(args, inventory, cluster, playbook)
  138. def setup_provider(self, provider):
  139. """
  140. Setup ansible playbook environment
  141. :param provider: command line arguments provided by user
  142. :return: path to inventory for given provider
  143. """
  144. config = ConfigParser.ConfigParser()
  145. if 'gce' == provider:
  146. gce_ini_default_path = os.path.join('inventory/gce/hosts/gce.ini')
  147. gce_ini_path = os.environ.get('GCE_INI_PATH', gce_ini_default_path)
  148. if os.path.exists(gce_ini_path):
  149. config.readfp(open(gce_ini_path))
  150. for key in config.options('gce'):
  151. os.environ[key] = config.get('gce', key)
  152. inventory = '-i inventory/gce/hosts'
  153. elif 'aws' == provider:
  154. config.readfp(open('inventory/aws/hosts/ec2.ini'))
  155. for key in config.options('ec2'):
  156. os.environ[key] = config.get('ec2', key)
  157. inventory = '-i inventory/aws/hosts'
  158. key_vars = ['AWS_ACCESS_KEY_ID', 'AWS_SECRET_ACCESS_KEY']
  159. key_missing = [key for key in key_vars if key not in os.environ]
  160. boto_conf_files = ['~/.aws/credentials', '~/.boto']
  161. conf_exists = lambda conf: os.path.isfile(os.path.expanduser(conf))
  162. boto_configs = [conf for conf in boto_conf_files if conf_exists(conf)]
  163. if len(key_missing) > 0 and len(boto_configs) == 0:
  164. raise ValueError("PROVIDER aws requires {0} environment variable(s). See README_AWS.md".format(key_missing))
  165. elif 'libvirt' == provider:
  166. inventory = '-i inventory/libvirt/hosts'
  167. elif 'openstack' == provider:
  168. inventory = '-i inventory/openstack/hosts'
  169. else:
  170. # this code should never be reached
  171. raise ValueError("invalid PROVIDER {0}".format(provider))
  172. return inventory
  173. def action(self, args, inventory, cluster, playbook):
  174. """
  175. Build ansible-playbook command line and execute
  176. :param args: command line arguments provided by user
  177. :param inventory: derived provider library
  178. :param cluster: cluster variables for kubernetes
  179. :param playbook: ansible playbook to execute
  180. """
  181. verbose = ''
  182. if args.verbose > 0:
  183. verbose = '-{0}'.format('v' * args.verbose)
  184. if args.option:
  185. for opt in args.option:
  186. k, v = opt.split('=', 1)
  187. cluster['cli_' + k] = v
  188. ansible_extra_vars = '-e \'{0}\''.format(
  189. ' '.join(['%s=%s' % (key, value) for (key, value) in cluster.items()])
  190. )
  191. command = 'ansible-playbook {0} {1} {2} {3}'.format(
  192. verbose, inventory, ansible_extra_vars, playbook
  193. )
  194. if args.profile:
  195. command = 'ANSIBLE_CALLBACK_PLUGINS=ansible-profile/callback_plugins ' + command
  196. if args.verbose > 1:
  197. command = 'time {0}'.format(command)
  198. if args.verbose > 0:
  199. sys.stderr.write('RUN [{0}]\n'.format(command))
  200. sys.stderr.flush()
  201. try:
  202. subprocess.check_call(command, shell=True)
  203. except subprocess.CalledProcessError as exc:
  204. raise ActionFailed("ACTION [{0}] failed: {1}"
  205. .format(args.action, exc))
  206. class ActionFailed(Exception):
  207. """
  208. Raised when action failed.
  209. """
  210. pass
  211. if __name__ == '__main__':
  212. """
  213. User command to invoke ansible playbooks in a "known" configuration
  214. Reads ~/.openshift-ansible for default configuration items
  215. [DEFAULT]
  216. validate_cluster_ids = False
  217. cluster_ids = marketing,sales
  218. providers = gce,aws,libvirt,openstack
  219. """
  220. warning = ("================================================================================\n"
  221. "ATTENTION: You are running a community supported utility that has not been\n"
  222. "tested by Red Hat. Visit https://docs.openshift.com for supported installation\n"
  223. "instructions.\n"
  224. "================================================================================\n\n")
  225. sys.stderr.write(warning)
  226. cluster_config = ConfigParser.SafeConfigParser({
  227. 'cluster_ids': 'marketing,sales',
  228. 'validate_cluster_ids': 'False',
  229. 'providers': 'gce,aws,libvirt,openstack',
  230. })
  231. path = os.path.expanduser("~/.openshift-ansible")
  232. if os.path.isfile(path):
  233. cluster_config.read(path)
  234. cluster = Cluster()
  235. parser = argparse.ArgumentParser(
  236. formatter_class=argparse.RawDescriptionHelpFormatter,
  237. description='Python wrapper to ensure proper configuration for OpenShift ansible playbooks',
  238. epilog='''\
  239. This wrapper is overriding the following ansible variables:
  240. * ANSIBLE_SSH_ARGS:
  241. If not set in the environment, this wrapper will use the following value:
  242. `-o ForwardAgent=yes -o StrictHostKeyChecking=no -o UserKnownHostsFile=/dev/null -o ControlMaster=auto -o ControlPersist=600s`
  243. If set in the environment, the environment variable value is left untouched and used.
  244. * ANSIBLE_SSH_PIPELINING:
  245. If not set in the environment, this wrapper will set it to `True`.
  246. If you experience issue with Ansible ssh pipelining, you can disable it by explicitely set this environment variable to `False`.
  247. '''
  248. )
  249. parser.add_argument('-v', '--verbose', action='count',
  250. help='Multiple -v options increase the verbosity')
  251. parser.add_argument('--version', action='version', version='%(prog)s 0.3')
  252. meta_parser = argparse.ArgumentParser(add_help=False)
  253. providers = cluster_config.get('DEFAULT', 'providers').split(',')
  254. meta_parser.add_argument('provider', choices=providers, help='provider')
  255. if cluster_config.get('DEFAULT', 'validate_cluster_ids').lower() in ("yes", "true", "1"):
  256. meta_parser.add_argument('cluster_id', choices=cluster_config.get('DEFAULT', 'cluster_ids').split(','),
  257. help='prefix for cluster VM names')
  258. else:
  259. meta_parser.add_argument('cluster_id', help='prefix for cluster VM names')
  260. meta_parser.add_argument('-t', '--deployment-type',
  261. choices=['origin', 'atomic-enterprise', 'openshift-enterprise'],
  262. help='Deployment type. (default: origin)')
  263. meta_parser.add_argument('-o', '--option', action='append',
  264. help='options')
  265. meta_parser.add_argument('--env', default='dev', type=str,
  266. help='environment for the cluster. Defaults to \'dev\'.')
  267. meta_parser.add_argument('-p', '--profile', action='store_true',
  268. help='Enable playbook profiling')
  269. action_parser = parser.add_subparsers(dest='action', title='actions',
  270. description='Choose from valid actions')
  271. create_parser = action_parser.add_parser('create', help='Create a cluster',
  272. parents=[meta_parser])
  273. create_parser.add_argument('-m', '--masters', default=1, type=int,
  274. help='number of masters to create in cluster')
  275. create_parser.add_argument('-n', '--nodes', default=2, type=int,
  276. help='number of nodes to create in cluster')
  277. create_parser.add_argument('-i', '--infra', default=1, type=int,
  278. help='number of infra nodes to create in cluster')
  279. create_parser.add_argument('-e', '--etcd', default=0, type=int,
  280. help='number of external etcd hosts to create in cluster')
  281. create_parser.set_defaults(func=cluster.create)
  282. create_parser = action_parser.add_parser('add-nodes', help='Add nodes to a cluster',
  283. parents=[meta_parser])
  284. create_parser.add_argument('-n', '--nodes', default=1, type=int,
  285. help='number of nodes to add to the cluster')
  286. create_parser.add_argument('-i', '--infra', default=1, type=int,
  287. help='number of infra nodes to add to the cluster')
  288. create_parser.set_defaults(func=cluster.add_nodes)
  289. config_parser = action_parser.add_parser('config',
  290. help='Configure or reconfigure a cluster',
  291. parents=[meta_parser])
  292. config_parser.set_defaults(func=cluster.config)
  293. terminate_parser = action_parser.add_parser('terminate',
  294. help='Destroy a cluster',
  295. parents=[meta_parser])
  296. terminate_parser.add_argument('-f', '--force', action='store_true',
  297. help='Destroy cluster without confirmation')
  298. terminate_parser.set_defaults(func=cluster.terminate)
  299. update_parser = action_parser.add_parser('update',
  300. help='Update OpenShift across cluster',
  301. parents=[meta_parser])
  302. update_parser.add_argument('-f', '--force', action='store_true',
  303. help='Update cluster without confirmation')
  304. update_parser.set_defaults(func=cluster.update)
  305. list_parser = action_parser.add_parser('list', help='List VMs in cluster',
  306. parents=[meta_parser])
  307. list_parser.set_defaults(func=cluster.list)
  308. service_parser = action_parser.add_parser('service', help='service for openshift across cluster',
  309. parents=[meta_parser])
  310. # choices are the only ones valid for the ansible service module: http://docs.ansible.com/service_module.html
  311. service_parser.add_argument('state', choices=['started', 'stopped', 'restarted', 'reloaded'],
  312. help='make service call across cluster')
  313. service_parser.set_defaults(func=cluster.service)
  314. args = parser.parse_args()
  315. if 'terminate' == args.action and not args.force:
  316. answer = raw_input("This will destroy the ENTIRE {0} cluster. Are you sure? [y/N] ".format(args.cluster_id))
  317. if answer not in ['y', 'Y']:
  318. sys.stderr.write('\nACTION [terminate] aborted by user!\n')
  319. exit(1)
  320. if 'update' == args.action and not args.force:
  321. answer = raw_input(
  322. "This is destructive and could corrupt {0} cluster. Continue? [y/N] ".format(args.cluster_id))
  323. if answer not in ['y', 'Y']:
  324. sys.stderr.write('\nACTION [update] aborted by user!\n')
  325. exit(1)
  326. try:
  327. args.func(args)
  328. except Exception as exc:
  329. if args.verbose:
  330. traceback.print_exc(file=sys.stderr)
  331. else:
  332. print >>sys.stderr, exc
  333. exit(1)