gce.py 17 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477
  1. #!/usr/bin/env python2
  2. # pylint: skip-file
  3. # Copyright 2013 Google Inc.
  4. #
  5. # This file is part of Ansible
  6. #
  7. # Ansible is free software: you can redistribute it and/or modify
  8. # it under the terms of the GNU General Public License as published by
  9. # the Free Software Foundation, either version 3 of the License, or
  10. # (at your option) any later version.
  11. #
  12. # Ansible is distributed in the hope that it will be useful,
  13. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  14. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  15. # GNU General Public License for more details.
  16. #
  17. # You should have received a copy of the GNU General Public License
  18. # along with Ansible. If not, see <http://www.gnu.org/licenses/>.
  19. '''
  20. GCE external inventory script
  21. =================================
  22. Generates inventory that Ansible can understand by making API requests
  23. Google Compute Engine via the libcloud library. Full install/configuration
  24. instructions for the gce* modules can be found in the comments of
  25. ansible/test/gce_tests.py.
  26. When run against a specific host, this script returns the following variables
  27. based on the data obtained from the libcloud Node object:
  28. - gce_uuid
  29. - gce_id
  30. - gce_image
  31. - gce_machine_type
  32. - gce_private_ip
  33. - gce_public_ip
  34. - gce_name
  35. - gce_description
  36. - gce_status
  37. - gce_zone
  38. - gce_tags
  39. - gce_metadata
  40. - gce_network
  41. When run in --list mode, instances are grouped by the following categories:
  42. - zone:
  43. zone group name examples are us-central1-b, europe-west1-a, etc.
  44. - instance tags:
  45. An entry is created for each tag. For example, if you have two instances
  46. with a common tag called 'foo', they will both be grouped together under
  47. the 'tag_foo' name.
  48. - network name:
  49. the name of the network is appended to 'network_' (e.g. the 'default'
  50. network will result in a group named 'network_default')
  51. - machine type
  52. types follow a pattern like n1-standard-4, g1-small, etc.
  53. - running status:
  54. group name prefixed with 'status_' (e.g. status_running, status_stopped,..)
  55. - image:
  56. when using an ephemeral/scratch disk, this will be set to the image name
  57. used when creating the instance (e.g. debian-7-wheezy-v20130816). when
  58. your instance was created with a root persistent disk it will be set to
  59. 'persistent_disk' since there is no current way to determine the image.
  60. Examples:
  61. Execute uname on all instances in the us-central1-a zone
  62. $ ansible -i gce.py us-central1-a -m shell -a "/bin/uname -a"
  63. Use the GCE inventory script to print out instance specific information
  64. $ contrib/inventory/gce.py --host my_instance
  65. Author: Eric Johnson <erjohnso@google.com>
  66. Contributors: Matt Hite <mhite@hotmail.com>, Tom Melendez <supertom@google.com>
  67. Version: 0.0.3
  68. '''
  69. __requires__ = ['pycrypto>=2.6']
  70. try:
  71. import pkg_resources
  72. except ImportError:
  73. # Use pkg_resources to find the correct versions of libraries and set
  74. # sys.path appropriately when there are multiversion installs. We don't
  75. # fail here as there is code that better expresses the errors where the
  76. # library is used.
  77. pass
  78. USER_AGENT_PRODUCT="Ansible-gce_inventory_plugin"
  79. USER_AGENT_VERSION="v2"
  80. import sys
  81. import os
  82. import argparse
  83. from time import time
  84. import ConfigParser
  85. import logging
  86. logging.getLogger('libcloud.common.google').addHandler(logging.NullHandler())
  87. try:
  88. import json
  89. except ImportError:
  90. import simplejson as json
  91. try:
  92. from libcloud.compute.types import Provider
  93. from libcloud.compute.providers import get_driver
  94. _ = Provider.GCE
  95. except:
  96. sys.exit("GCE inventory script requires libcloud >= 0.13")
  97. class CloudInventoryCache(object):
  98. def __init__(self, cache_name='ansible-cloud-cache', cache_path='/tmp',
  99. cache_max_age=300):
  100. cache_dir = os.path.expanduser(cache_path)
  101. if not os.path.exists(cache_dir):
  102. os.makedirs(cache_dir)
  103. self.cache_path_cache = os.path.join(cache_dir, cache_name)
  104. self.cache_max_age = cache_max_age
  105. def is_valid(self, max_age=None):
  106. ''' Determines if the cache files have expired, or if it is still valid '''
  107. if max_age is None:
  108. max_age = self.cache_max_age
  109. if os.path.isfile(self.cache_path_cache):
  110. mod_time = os.path.getmtime(self.cache_path_cache)
  111. current_time = time()
  112. if (mod_time + max_age) > current_time:
  113. return True
  114. return False
  115. def get_all_data_from_cache(self, filename=''):
  116. ''' Reads the JSON inventory from the cache file. Returns Python dictionary. '''
  117. data = ''
  118. if not filename:
  119. filename = self.cache_path_cache
  120. with open(filename, 'r') as cache:
  121. data = cache.read()
  122. return json.loads(data)
  123. def write_to_cache(self, data, filename=''):
  124. ''' Writes data to file as JSON. Returns True. '''
  125. if not filename:
  126. filename = self.cache_path_cache
  127. json_data = json.dumps(data)
  128. with open(filename, 'w') as cache:
  129. cache.write(json_data)
  130. return True
  131. class GceInventory(object):
  132. def __init__(self):
  133. # Cache object
  134. self.cache = None
  135. # dictionary containing inventory read from disk
  136. self.inventory = {}
  137. # Read settings and parse CLI arguments
  138. self.parse_cli_args()
  139. self.config = self.get_config()
  140. self.driver = self.get_gce_driver()
  141. self.ip_type = self.get_inventory_options()
  142. if self.ip_type:
  143. self.ip_type = self.ip_type.lower()
  144. # Cache management
  145. start_inventory_time = time()
  146. cache_used = False
  147. if self.args.refresh_cache or not self.cache.is_valid():
  148. self.do_api_calls_update_cache()
  149. else:
  150. self.load_inventory_from_cache()
  151. cache_used = True
  152. self.inventory['_meta']['stats'] = {'use_cache': True}
  153. self.inventory['_meta']['stats'] = {
  154. 'inventory_load_time': time() - start_inventory_time,
  155. 'cache_used': cache_used
  156. }
  157. # Just display data for specific host
  158. if self.args.host:
  159. print(self.json_format_dict(
  160. self.inventory['_meta']['hostvars'][self.args.host],
  161. pretty=self.args.pretty))
  162. else:
  163. # Otherwise, assume user wants all instances grouped
  164. zones = self.parse_env_zones()
  165. print(self.json_format_dict(self.inventory,
  166. pretty=self.args.pretty))
  167. sys.exit(0)
  168. def get_config(self):
  169. """
  170. Reads the settings from the gce.ini file.
  171. Populates a SafeConfigParser object with defaults and
  172. attempts to read an .ini-style configuration from the filename
  173. specified in GCE_INI_PATH. If the environment variable is
  174. not present, the filename defaults to gce.ini in the current
  175. working directory.
  176. """
  177. gce_ini_default_path = os.path.join(
  178. os.path.dirname(os.path.realpath(__file__)), "gce.ini")
  179. gce_ini_path = os.environ.get('GCE_INI_PATH', gce_ini_default_path)
  180. # Create a ConfigParser.
  181. # This provides empty defaults to each key, so that environment
  182. # variable configuration (as opposed to INI configuration) is able
  183. # to work.
  184. config = ConfigParser.SafeConfigParser(defaults={
  185. 'gce_service_account_email_address': '',
  186. 'gce_service_account_pem_file_path': '',
  187. 'gce_project_id': '',
  188. 'libcloud_secrets': '',
  189. 'inventory_ip_type': '',
  190. 'cache_path': '~/.ansible/tmp',
  191. 'cache_max_age': '300'
  192. })
  193. if 'gce' not in config.sections():
  194. config.add_section('gce')
  195. if 'inventory' not in config.sections():
  196. config.add_section('inventory')
  197. if 'cache' not in config.sections():
  198. config.add_section('cache')
  199. config.read(gce_ini_path)
  200. #########
  201. # Section added for processing ini settings
  202. #########
  203. # Set the instance_states filter based on config file options
  204. self.instance_states = []
  205. if config.has_option('gce', 'instance_states'):
  206. states = config.get('gce', 'instance_states')
  207. # Ignore if instance_states is an empty string.
  208. if states:
  209. self.instance_states = states.split(',')
  210. # Caching
  211. cache_path = config.get('cache', 'cache_path')
  212. cache_max_age = config.getint('cache', 'cache_max_age')
  213. # TOOD(supertom): support project-specific caches
  214. cache_name = 'ansible-gce.cache'
  215. self.cache = CloudInventoryCache(cache_path=cache_path,
  216. cache_max_age=cache_max_age,
  217. cache_name=cache_name)
  218. return config
  219. def get_inventory_options(self):
  220. """Determine inventory options. Environment variables always
  221. take precedence over configuration files."""
  222. ip_type = self.config.get('inventory', 'inventory_ip_type')
  223. # If the appropriate environment variables are set, they override
  224. # other configuration
  225. ip_type = os.environ.get('INVENTORY_IP_TYPE', ip_type)
  226. return ip_type
  227. def get_gce_driver(self):
  228. """Determine the GCE authorization settings and return a
  229. libcloud driver.
  230. """
  231. # Attempt to get GCE params from a configuration file, if one
  232. # exists.
  233. secrets_path = self.config.get('gce', 'libcloud_secrets')
  234. secrets_found = False
  235. try:
  236. import secrets
  237. args = list(getattr(secrets, 'GCE_PARAMS', []))
  238. kwargs = getattr(secrets, 'GCE_KEYWORD_PARAMS', {})
  239. secrets_found = True
  240. except:
  241. pass
  242. if not secrets_found and secrets_path:
  243. if not secrets_path.endswith('secrets.py'):
  244. err = "Must specify libcloud secrets file as "
  245. err += "/absolute/path/to/secrets.py"
  246. sys.exit(err)
  247. sys.path.append(os.path.dirname(secrets_path))
  248. try:
  249. import secrets
  250. args = list(getattr(secrets, 'GCE_PARAMS', []))
  251. kwargs = getattr(secrets, 'GCE_KEYWORD_PARAMS', {})
  252. secrets_found = True
  253. except:
  254. pass
  255. if not secrets_found:
  256. args = [
  257. self.config.get('gce','gce_service_account_email_address'),
  258. self.config.get('gce','gce_service_account_pem_file_path')
  259. ]
  260. kwargs = {'project': self.config.get('gce', 'gce_project_id')}
  261. # If the appropriate environment variables are set, they override
  262. # other configuration; process those into our args and kwargs.
  263. args[0] = os.environ.get('GCE_EMAIL', args[0])
  264. args[1] = os.environ.get('GCE_PEM_FILE_PATH', args[1])
  265. kwargs['project'] = os.environ.get('GCE_PROJECT', kwargs['project'])
  266. # Retrieve and return the GCE driver.
  267. gce = get_driver(Provider.GCE)(*args, **kwargs)
  268. gce.connection.user_agent_append(
  269. '%s/%s' % (USER_AGENT_PRODUCT, USER_AGENT_VERSION),
  270. )
  271. return gce
  272. def parse_env_zones(self):
  273. '''returns a list of comma separated zones parsed from the GCE_ZONE environment variable.
  274. If provided, this will be used to filter the results of the grouped_instances call'''
  275. import csv
  276. reader = csv.reader([os.environ.get('GCE_ZONE',"")], skipinitialspace=True)
  277. zones = [r for r in reader]
  278. return [z for z in zones[0]]
  279. def parse_cli_args(self):
  280. ''' Command line argument processing '''
  281. parser = argparse.ArgumentParser(
  282. description='Produce an Ansible Inventory file based on GCE')
  283. parser.add_argument('--list', action='store_true', default=True,
  284. help='List instances (default: True)')
  285. parser.add_argument('--host', action='store',
  286. help='Get all information about an instance')
  287. parser.add_argument('--pretty', action='store_true', default=False,
  288. help='Pretty format (default: False)')
  289. parser.add_argument(
  290. '--refresh-cache', action='store_true', default=False,
  291. help='Force refresh of cache by making API requests (default: False - use cache files)')
  292. self.args = parser.parse_args()
  293. def node_to_dict(self, inst):
  294. md = {}
  295. if inst is None:
  296. return {}
  297. if 'items' in inst.extra['metadata']:
  298. for entry in inst.extra['metadata']['items']:
  299. md[entry['key']] = entry['value']
  300. net = inst.extra['networkInterfaces'][0]['network'].split('/')[-1]
  301. # default to exernal IP unless user has specified they prefer internal
  302. if self.ip_type == 'internal':
  303. ssh_host = inst.private_ips[0]
  304. else:
  305. ssh_host = inst.public_ips[0] if len(inst.public_ips) >= 1 else inst.private_ips[0]
  306. return {
  307. 'gce_uuid': inst.uuid,
  308. 'gce_id': inst.id,
  309. 'gce_image': inst.image,
  310. 'gce_machine_type': inst.size,
  311. 'gce_private_ip': inst.private_ips[0],
  312. 'gce_public_ip': inst.public_ips[0] if len(inst.public_ips) >= 1 else None,
  313. 'gce_name': inst.name,
  314. 'gce_description': inst.extra['description'],
  315. 'gce_status': inst.extra['status'],
  316. 'gce_zone': inst.extra['zone'].name,
  317. 'gce_tags': inst.extra['tags'],
  318. 'gce_metadata': md,
  319. 'gce_network': net,
  320. # Hosts don't have a public name, so we add an IP
  321. 'ansible_ssh_host': ssh_host
  322. }
  323. def load_inventory_from_cache(self):
  324. ''' Loads inventory from JSON on disk. '''
  325. try:
  326. self.inventory = self.cache.get_all_data_from_cache()
  327. hosts = self.inventory['_meta']['hostvars']
  328. except Exception as e:
  329. print(
  330. "Invalid inventory file %s. Please rebuild with -refresh-cache option."
  331. % (self.cache.cache_path_cache))
  332. raise
  333. def do_api_calls_update_cache(self):
  334. ''' Do API calls and save data in cache. '''
  335. zones = self.parse_env_zones()
  336. data = self.group_instances(zones)
  337. self.cache.write_to_cache(data)
  338. self.inventory = data
  339. def list_nodes(self):
  340. all_nodes = []
  341. params, more_results = {'maxResults': 500}, True
  342. while more_results:
  343. self.driver.connection.gce_params=params
  344. all_nodes.extend(self.driver.list_nodes())
  345. more_results = 'pageToken' in params
  346. return all_nodes
  347. def group_instances(self, zones=None):
  348. '''Group all instances'''
  349. groups = {}
  350. meta = {}
  351. meta["hostvars"] = {}
  352. for node in self.list_nodes():
  353. # This check filters on the desired instance states defined in the
  354. # config file with the instance_states config option.
  355. #
  356. # If the instance_states list is _empty_ then _ALL_ states are returned.
  357. #
  358. # If the instance_states list is _populated_ then check the current
  359. # state against the instance_states list
  360. if self.instance_states and not node.extra['status'] in self.instance_states:
  361. continue
  362. name = node.name
  363. meta["hostvars"][name] = self.node_to_dict(node)
  364. zone = node.extra['zone'].name
  365. # To avoid making multiple requests per zone
  366. # we list all nodes and then filter the results
  367. if zones and zone not in zones:
  368. continue
  369. if zone in groups: groups[zone].append(name)
  370. else: groups[zone] = [name]
  371. tags = node.extra['tags']
  372. for t in tags:
  373. if t.startswith('group-'):
  374. tag = t[6:]
  375. else:
  376. tag = 'tag_%s' % t
  377. if tag in groups: groups[tag].append(name)
  378. else: groups[tag] = [name]
  379. net = node.extra['networkInterfaces'][0]['network'].split('/')[-1]
  380. net = 'network_%s' % net
  381. if net in groups: groups[net].append(name)
  382. else: groups[net] = [name]
  383. machine_type = node.size
  384. if machine_type in groups: groups[machine_type].append(name)
  385. else: groups[machine_type] = [name]
  386. image = node.image and node.image or 'persistent_disk'
  387. if image in groups: groups[image].append(name)
  388. else: groups[image] = [name]
  389. status = node.extra['status']
  390. stat = 'status_%s' % status.lower()
  391. if stat in groups: groups[stat].append(name)
  392. else: groups[stat] = [name]
  393. groups["_meta"] = meta
  394. return groups
  395. def json_format_dict(self, data, pretty=False):
  396. ''' Converts a dict to a JSON object and dumps it as a formatted
  397. string '''
  398. if pretty:
  399. return json.dumps(data, sort_keys=True, indent=2)
  400. else:
  401. return json.dumps(data)
  402. # Run the script
  403. if __name__ == '__main__':
  404. GceInventory()