cluster 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424
  1. #!/usr/bin/env python2
  2. import argparse
  3. import ConfigParser
  4. import os
  5. import sys
  6. import subprocess
  7. import traceback
  8. class Cluster(object):
  9. """
  10. Provide Command, Control and Configuration (c3) Interface for OpenShift Clusters
  11. """
  12. def __init__(self):
  13. # setup ansible ssh environment
  14. if 'ANSIBLE_SSH_ARGS' not in os.environ:
  15. os.environ['ANSIBLE_SSH_ARGS'] = (
  16. '-o ForwardAgent=yes '
  17. '-o StrictHostKeyChecking=no '
  18. '-o UserKnownHostsFile=/dev/null '
  19. '-o ControlMaster=auto '
  20. '-o ControlPersist=600s '
  21. )
  22. # Because of `UserKnownHostsFile=/dev/null`
  23. # our `.ssh/known_hosts` file most probably misses the ssh host public keys
  24. # of our servers.
  25. # In that case, ansible serializes the execution of ansible modules
  26. # because we might be interactively prompted to accept the ssh host public keys.
  27. # Because of `StrictHostKeyChecking=no` we know that we won't be prompted
  28. # So, we don't want our modules execution to be serialized.
  29. os.environ['ANSIBLE_HOST_KEY_CHECKING'] = 'False'
  30. # TODO: A more secure way to proceed would consist in dynamically
  31. # retrieving the ssh host public keys from the IaaS interface
  32. if 'ANSIBLE_SSH_PIPELINING' not in os.environ:
  33. os.environ['ANSIBLE_SSH_PIPELINING'] = 'True'
  34. def get_deployment_type(self, args):
  35. """
  36. Get the deployment_type based on the environment variables and the
  37. command line arguments
  38. :param args: command line arguments provided by the user
  39. :return: string representing the deployment type
  40. """
  41. deployment_type = 'origin'
  42. if args.deployment_type:
  43. deployment_type = args.deployment_type
  44. elif 'OS_DEPLOYMENT_TYPE' in os.environ:
  45. deployment_type = os.environ['OS_DEPLOYMENT_TYPE']
  46. return deployment_type
  47. def create(self, args):
  48. """
  49. Create an OpenShift cluster for given provider
  50. :param args: command line arguments provided by user
  51. """
  52. cluster = {'cluster_id': args.cluster_id,
  53. 'deployment_type': self.get_deployment_type(args)}
  54. playbook = "playbooks/{0}/openshift-cluster/launch.yml".format(args.provider)
  55. inventory = self.setup_provider(args.provider)
  56. cluster['num_masters'] = args.masters
  57. cluster['num_nodes'] = args.nodes
  58. cluster['num_infra'] = args.infra
  59. cluster['num_etcd'] = args.etcd
  60. cluster['cluster_env'] = args.env
  61. if args.cloudprovider and args.provider == 'openstack':
  62. cluster['openshift_cloudprovider_kind'] = 'openstack'
  63. cluster['openshift_cloudprovider_openstack_auth_url'] = os.getenv('OS_AUTH_URL')
  64. cluster['openshift_cloudprovider_openstack_username'] = os.getenv('OS_USERNAME')
  65. cluster['openshift_cloudprovider_openstack_password'] = os.getenv('OS_PASSWORD')
  66. if 'OS_USER_DOMAIN_ID' in os.environ:
  67. cluster['openshift_cloudprovider_openstack_domain_id'] = os.getenv('OS_USER_DOMAIN_ID')
  68. if 'OS_USER_DOMAIN_NAME' in os.environ:
  69. cluster['openshift_cloudprovider_openstack_domain_name'] = os.getenv('OS_USER_DOMAIN_NAME')
  70. if 'OS_PROJECT_ID' in os.environ or 'OS_TENANT_ID' in os.environ:
  71. cluster['openshift_cloudprovider_openstack_tenant_id'] = os.getenv('OS_PROJECT_ID',os.getenv('OS_TENANT_ID'))
  72. if 'OS_PROJECT_NAME' is os.environ or 'OS_TENANT_NAME' in os.environ:
  73. cluster['openshift_cloudprovider_openstack_tenant_name'] = os.getenv('OS_PROJECT_NAME',os.getenv('OS_TENANT_NAME'))
  74. if 'OS_REGION_NAME' in os.environ:
  75. cluster['openshift_cloudprovider_openstack_region'] = os.getenv('OS_REGION_NAME')
  76. self.action(args, inventory, cluster, playbook)
  77. def add_nodes(self, args):
  78. """
  79. Add nodes to an existing cluster for given provider
  80. :param args: command line arguments provided by user
  81. """
  82. cluster = {'cluster_id': args.cluster_id,
  83. 'deployment_type': self.get_deployment_type(args),
  84. }
  85. playbook = "playbooks/{0}/openshift-cluster/add_nodes.yml".format(args.provider)
  86. inventory = self.setup_provider(args.provider)
  87. cluster['num_nodes'] = args.nodes
  88. cluster['num_infra'] = args.infra
  89. cluster['cluster_env'] = args.env
  90. self.action(args, inventory, cluster, playbook)
  91. def terminate(self, args):
  92. """
  93. Destroy OpenShift cluster
  94. :param args: command line arguments provided by user
  95. """
  96. cluster = {'cluster_id': args.cluster_id,
  97. 'deployment_type': self.get_deployment_type(args),
  98. 'cluster_env': args.env,
  99. }
  100. playbook = "playbooks/{0}/openshift-cluster/terminate.yml".format(args.provider)
  101. inventory = self.setup_provider(args.provider)
  102. self.action(args, inventory, cluster, playbook)
  103. def list(self, args):
  104. """
  105. List VMs in cluster
  106. :param args: command line arguments provided by user
  107. """
  108. cluster = {'cluster_id': args.cluster_id,
  109. 'deployment_type': self.get_deployment_type(args),
  110. 'cluster_env': args.env,
  111. }
  112. playbook = "playbooks/{0}/openshift-cluster/list.yml".format(args.provider)
  113. inventory = self.setup_provider(args.provider)
  114. self.action(args, inventory, cluster, playbook)
  115. def config(self, args):
  116. """
  117. Configure or reconfigure OpenShift across clustered VMs
  118. :param args: command line arguments provided by user
  119. """
  120. cluster = {'cluster_id': args.cluster_id,
  121. 'deployment_type': self.get_deployment_type(args),
  122. 'cluster_env': args.env,
  123. }
  124. playbook = "playbooks/{0}/openshift-cluster/config.yml".format(args.provider)
  125. inventory = self.setup_provider(args.provider)
  126. self.action(args, inventory, cluster, playbook)
  127. def update(self, args):
  128. """
  129. Update to latest OpenShift across clustered VMs
  130. :param args: command line arguments provided by user
  131. """
  132. cluster = {'cluster_id': args.cluster_id,
  133. 'deployment_type': self.get_deployment_type(args),
  134. 'cluster_env': args.env,
  135. }
  136. playbook = "playbooks/{0}/openshift-cluster/update.yml".format(args.provider)
  137. inventory = self.setup_provider(args.provider)
  138. self.action(args, inventory, cluster, playbook)
  139. def service(self, args):
  140. """
  141. Make the same service call across all nodes in the cluster
  142. :param args: command line arguments provided by user
  143. """
  144. cluster = {'cluster_id': args.cluster_id,
  145. 'deployment_type': self.get_deployment_type(args),
  146. 'new_cluster_state': args.state,
  147. 'cluster_env': args.env,
  148. }
  149. playbook = "playbooks/{0}/openshift-cluster/service.yml".format(args.provider)
  150. inventory = self.setup_provider(args.provider)
  151. self.action(args, inventory, cluster, playbook)
  152. def setup_provider(self, provider):
  153. """
  154. Setup ansible playbook environment
  155. :param provider: command line arguments provided by user
  156. :return: path to inventory for given provider
  157. """
  158. config = ConfigParser.ConfigParser()
  159. if 'gce' == provider:
  160. gce_ini_default_path = os.path.join('inventory/gce/hosts/gce.ini')
  161. gce_ini_path = os.environ.get('GCE_INI_PATH', gce_ini_default_path)
  162. if os.path.exists(gce_ini_path):
  163. config.readfp(open(gce_ini_path))
  164. for key in config.options('gce'):
  165. os.environ[key] = config.get('gce', key)
  166. inventory = '-i inventory/gce/hosts'
  167. elif 'aws' == provider:
  168. config.readfp(open('inventory/aws/hosts/ec2.ini'))
  169. for key in config.options('ec2'):
  170. os.environ[key] = config.get('ec2', key)
  171. inventory = '-i inventory/aws/hosts'
  172. key_vars = ['AWS_ACCESS_KEY_ID', 'AWS_SECRET_ACCESS_KEY']
  173. key_missing = [key for key in key_vars if key not in os.environ]
  174. boto_conf_files = ['~/.aws/credentials', '~/.boto']
  175. conf_exists = lambda conf: os.path.isfile(os.path.expanduser(conf))
  176. boto_configs = [conf for conf in boto_conf_files if conf_exists(conf)]
  177. if len(key_missing) > 0 and len(boto_configs) == 0:
  178. raise ValueError("PROVIDER aws requires {0} environment variable(s). See README_AWS.md".format(key_missing))
  179. elif 'libvirt' == provider:
  180. inventory = '-i inventory/libvirt/hosts'
  181. elif 'openstack' == provider:
  182. inventory = '-i inventory/openstack/hosts'
  183. else:
  184. # this code should never be reached
  185. raise ValueError("invalid PROVIDER {0}".format(provider))
  186. return inventory
  187. def action(self, args, inventory, cluster, playbook):
  188. """
  189. Build ansible-playbook command line and execute
  190. :param args: command line arguments provided by user
  191. :param inventory: derived provider library
  192. :param cluster: cluster variables for kubernetes
  193. :param playbook: ansible playbook to execute
  194. """
  195. verbose = ''
  196. if args.verbose > 0:
  197. verbose = '-{0}'.format('v' * args.verbose)
  198. if args.option:
  199. for opt in args.option:
  200. k, v = opt.split('=', 1)
  201. cluster['cli_' + k] = v
  202. ansible_extra_vars = '-e \'{0}\''.format(
  203. ' '.join(['%s=%s' % (key, value) for (key, value) in cluster.items()])
  204. )
  205. command = 'ansible-playbook {0} {1} {2} {3}'.format(
  206. verbose, inventory, ansible_extra_vars, playbook
  207. )
  208. if args.profile:
  209. command = 'ANSIBLE_CALLBACK_PLUGINS=ansible-profile/callback_plugins ' + command
  210. if args.verbose > 1:
  211. command = 'time {0}'.format(command)
  212. if args.verbose > 0:
  213. sys.stderr.write('RUN [{0}]\n'.format(command))
  214. sys.stderr.flush()
  215. try:
  216. subprocess.check_call(command, shell=True)
  217. except subprocess.CalledProcessError as exc:
  218. raise ActionFailed("ACTION [{0}] failed: {1}"
  219. .format(args.action, exc))
  220. class ActionFailed(Exception):
  221. """
  222. Raised when action failed.
  223. """
  224. pass
  225. if __name__ == '__main__':
  226. """
  227. User command to invoke ansible playbooks in a "known" configuration
  228. Reads ~/.openshift-ansible for default configuration items
  229. [DEFAULT]
  230. validate_cluster_ids = False
  231. cluster_ids = marketing,sales
  232. providers = gce,aws,libvirt,openstack
  233. """
  234. warning = ("================================================================================\n"
  235. "ATTENTION: You are running a community supported utility that has not been\n"
  236. "tested by Red Hat. Visit https://docs.openshift.com for supported installation\n"
  237. "instructions.\n"
  238. "================================================================================\n\n")
  239. sys.stderr.write(warning)
  240. cluster_config = ConfigParser.SafeConfigParser({
  241. 'cluster_ids': 'marketing,sales',
  242. 'validate_cluster_ids': 'False',
  243. 'providers': 'gce,aws,libvirt,openstack',
  244. })
  245. path = os.path.expanduser("~/.openshift-ansible")
  246. if os.path.isfile(path):
  247. cluster_config.read(path)
  248. cluster = Cluster()
  249. parser = argparse.ArgumentParser(
  250. formatter_class=argparse.RawDescriptionHelpFormatter,
  251. description='Python wrapper to ensure proper configuration for OpenShift ansible playbooks',
  252. epilog='''\
  253. This wrapper is overriding the following ansible variables:
  254. * ANSIBLE_SSH_ARGS:
  255. If not set in the environment, this wrapper will use the following value:
  256. `-o ForwardAgent=yes -o StrictHostKeyChecking=no -o UserKnownHostsFile=/dev/null -o ControlMaster=auto -o ControlPersist=600s`
  257. If set in the environment, the environment variable value is left untouched and used.
  258. * ANSIBLE_SSH_PIPELINING:
  259. If not set in the environment, this wrapper will set it to `True`.
  260. If you experience issues with Ansible SSH pipelining, you can disable it by explicitly setting this environment variable to `False`.
  261. '''
  262. )
  263. parser.add_argument('-v', '--verbose', action='count',
  264. help='Multiple -v options increase the verbosity')
  265. parser.add_argument('--version', action='version', version='%(prog)s 0.3')
  266. meta_parser = argparse.ArgumentParser(add_help=False)
  267. providers = cluster_config.get('DEFAULT', 'providers').split(',')
  268. meta_parser.add_argument('provider', choices=providers, help='provider')
  269. if cluster_config.get('DEFAULT', 'validate_cluster_ids').lower() in ("yes", "true", "1"):
  270. meta_parser.add_argument('cluster_id', choices=cluster_config.get('DEFAULT', 'cluster_ids').split(','),
  271. help='prefix for cluster VM names')
  272. else:
  273. meta_parser.add_argument('cluster_id', help='prefix for cluster VM names')
  274. meta_parser.add_argument('-t', '--deployment-type',
  275. choices=['origin', 'atomic-enterprise', 'openshift-enterprise'],
  276. help='Deployment type. (default: origin)')
  277. meta_parser.add_argument('-o', '--option', action='append',
  278. help='options')
  279. meta_parser.add_argument('--env', default='dev', type=str,
  280. help='environment for the cluster. Defaults to \'dev\'.')
  281. meta_parser.add_argument('-p', '--profile', action='store_true',
  282. help='Enable playbook profiling')
  283. action_parser = parser.add_subparsers(dest='action', title='actions',
  284. description='Choose from valid actions')
  285. create_parser = action_parser.add_parser('create', help='Create a cluster',
  286. parents=[meta_parser])
  287. create_parser.add_argument('-c', '--cloudprovider', action='store_true',
  288. help='Enable the cloudprovider')
  289. create_parser.add_argument('-m', '--masters', default=1, type=int,
  290. help='number of masters to create in cluster')
  291. create_parser.add_argument('-n', '--nodes', default=2, type=int,
  292. help='number of nodes to create in cluster')
  293. create_parser.add_argument('-i', '--infra', default=1, type=int,
  294. help='number of infra nodes to create in cluster')
  295. create_parser.add_argument('-e', '--etcd', default=0, type=int,
  296. help='number of external etcd hosts to create in cluster')
  297. create_parser.set_defaults(func=cluster.create)
  298. create_parser = action_parser.add_parser('add-nodes', help='Add nodes to a cluster',
  299. parents=[meta_parser])
  300. create_parser.add_argument('-n', '--nodes', default=1, type=int,
  301. help='number of nodes to add to the cluster')
  302. create_parser.add_argument('-i', '--infra', default=1, type=int,
  303. help='number of infra nodes to add to the cluster')
  304. create_parser.set_defaults(func=cluster.add_nodes)
  305. config_parser = action_parser.add_parser('config',
  306. help='Configure or reconfigure a cluster',
  307. parents=[meta_parser])
  308. config_parser.set_defaults(func=cluster.config)
  309. terminate_parser = action_parser.add_parser('terminate',
  310. help='Destroy a cluster',
  311. parents=[meta_parser])
  312. terminate_parser.add_argument('-f', '--force', action='store_true',
  313. help='Destroy cluster without confirmation')
  314. terminate_parser.set_defaults(func=cluster.terminate)
  315. update_parser = action_parser.add_parser('update',
  316. help='Update OpenShift across cluster',
  317. parents=[meta_parser])
  318. update_parser.add_argument('-f', '--force', action='store_true',
  319. help='Update cluster without confirmation')
  320. update_parser.set_defaults(func=cluster.update)
  321. list_parser = action_parser.add_parser('list', help='List VMs in cluster',
  322. parents=[meta_parser])
  323. list_parser.set_defaults(func=cluster.list)
  324. service_parser = action_parser.add_parser('service', help='service for openshift across cluster',
  325. parents=[meta_parser])
  326. # choices are the only ones valid for the ansible service module: http://docs.ansible.com/service_module.html
  327. service_parser.add_argument('state', choices=['started', 'stopped', 'restarted', 'reloaded'],
  328. help='make service call across cluster')
  329. service_parser.set_defaults(func=cluster.service)
  330. args = parser.parse_args()
  331. if 'terminate' == args.action and not args.force:
  332. answer = raw_input("This will destroy the ENTIRE {0} cluster. Are you sure? [y/N] ".format(args.cluster_id))
  333. if answer not in ['y', 'Y']:
  334. sys.stderr.write('\nACTION [terminate] aborted by user!\n')
  335. exit(1)
  336. if 'update' == args.action and not args.force:
  337. answer = raw_input(
  338. "This is destructive and could corrupt {0} cluster. Continue? [y/N] ".format(args.cluster_id))
  339. if answer not in ['y', 'Y']:
  340. sys.stderr.write('\nACTION [update] aborted by user!\n')
  341. exit(1)
  342. try:
  343. args.func(args)
  344. except Exception as exc:
  345. if args.verbose:
  346. traceback.print_exc(file=sys.stderr)
  347. else:
  348. print >>sys.stderr, exc
  349. exit(1)