ec2.py 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610
  1. #!/usr/bin/env python
  2. '''
  3. EC2 external inventory script
  4. =================================
  5. Generates inventory that Ansible can understand by making API requests to
  6. AWS EC2 using the Boto library.
  7. NOTE: This script assumes Ansible is being executed where the environment
  8. variables needed for Boto have already been set:
  9. export AWS_ACCESS_KEY_ID='AK123'
  10. export AWS_SECRET_ACCESS_KEY='abc123'
  11. This script also assumes there is an ec2.ini file alongside it. To specify a
  12. different path to ec2.ini, define the EC2_INI_PATH environment variable:
  13. export EC2_INI_PATH=/path/to/my_ec2.ini
  14. If you're using Eucalyptus, you need to set the above variables and
  15. you also need to define:
  16. export EC2_URL=http://hostname_of_your_cc:port/services/Eucalyptus
  17. For more details, see: http://docs.pythonboto.org/en/latest/boto_config_tut.html
  18. When run against a specific host, this script returns the following variables:
  19. - ec2_ami_launch_index
  20. - ec2_architecture
  21. - ec2_association
  22. - ec2_attachTime
  23. - ec2_attachment
  24. - ec2_attachmentId
  25. - ec2_client_token
  26. - ec2_deleteOnTermination
  27. - ec2_description
  28. - ec2_deviceIndex
  29. - ec2_dns_name
  30. - ec2_eventsSet
  31. - ec2_group_name
  32. - ec2_hypervisor
  33. - ec2_id
  34. - ec2_image_id
  35. - ec2_instanceState
  36. - ec2_instance_type
  37. - ec2_ipOwnerId
  38. - ec2_ip_address
  39. - ec2_item
  40. - ec2_kernel
  41. - ec2_key_name
  42. - ec2_launch_time
  43. - ec2_monitored
  44. - ec2_monitoring
  45. - ec2_networkInterfaceId
  46. - ec2_ownerId
  47. - ec2_persistent
  48. - ec2_placement
  49. - ec2_platform
  50. - ec2_previous_state
  51. - ec2_private_dns_name
  52. - ec2_private_ip_address
  53. - ec2_publicIp
  54. - ec2_public_dns_name
  55. - ec2_ramdisk
  56. - ec2_reason
  57. - ec2_region
  58. - ec2_requester_id
  59. - ec2_root_device_name
  60. - ec2_root_device_type
  61. - ec2_security_group_ids
  62. - ec2_security_group_names
  63. - ec2_shutdown_state
  64. - ec2_sourceDestCheck
  65. - ec2_spot_instance_request_id
  66. - ec2_state
  67. - ec2_state_code
  68. - ec2_state_reason
  69. - ec2_status
  70. - ec2_subnet_id
  71. - ec2_tenancy
  72. - ec2_virtualization_type
  73. - ec2_vpc_id
  74. These variables are pulled out of a boto.ec2.instance object. There is a lack of
  75. consistency with variable spellings (camelCase and underscores) since this
  76. just loops through all variables the object exposes. It is preferred to use the
  77. ones with underscores when multiple exist.
  78. In addition, if an instance has AWS Tags associated with it, each tag is a new
  79. variable named:
  80. - ec2_tag_[Key] = [Value]
  81. Security groups are comma-separated in 'ec2_security_group_ids' and
  82. 'ec2_security_group_names'.
  83. '''
  84. # (c) 2012, Peter Sankauskas
  85. #
  86. # This file is part of Ansible,
  87. #
  88. # Ansible is free software: you can redistribute it and/or modify
  89. # it under the terms of the GNU General Public License as published by
  90. # the Free Software Foundation, either version 3 of the License, or
  91. # (at your option) any later version.
  92. #
  93. # Ansible is distributed in the hope that it will be useful,
  94. # but WITHOUT ANY WARRANTY; without even the implied warranty of
  95. # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
  96. # GNU General Public License for more details.
  97. #
  98. # You should have received a copy of the GNU General Public License
  99. # along with Ansible. If not, see <http://www.gnu.org/licenses/>.
  100. ######################################################################
  101. import sys
  102. import os
  103. import argparse
  104. import re
  105. from time import time
  106. import boto
  107. from boto import ec2
  108. from boto import rds
  109. from boto import route53
  110. import ConfigParser
  111. try:
  112. import json
  113. except ImportError:
  114. import simplejson as json
  115. class Ec2Inventory(object):
  116. def _empty_inventory(self):
  117. return {"_meta" : {"hostvars" : {}}}
  118. def __init__(self):
  119. ''' Main execution path '''
  120. # Inventory grouped by instance IDs, tags, security groups, regions,
  121. # and availability zones
  122. self.inventory = self._empty_inventory()
  123. # Index of hostname (address) to instance ID
  124. self.index = {}
  125. # Read settings and parse CLI arguments
  126. self.read_settings()
  127. self.parse_cli_args()
  128. # Cache
  129. if self.args.refresh_cache:
  130. self.do_api_calls_update_cache()
  131. elif not self.is_cache_valid():
  132. self.do_api_calls_update_cache()
  133. # Data to print
  134. if self.args.host:
  135. data_to_print = self.get_host_info()
  136. elif self.args.list:
  137. # Display list of instances for inventory
  138. if self.inventory == self._empty_inventory():
  139. data_to_print = self.get_inventory_from_cache()
  140. else:
  141. data_to_print = self.json_format_dict(self.inventory, True)
  142. print data_to_print
  143. def is_cache_valid(self):
  144. ''' Determines if the cache files have expired, or if it is still valid '''
  145. if os.path.isfile(self.cache_path_cache):
  146. mod_time = os.path.getmtime(self.cache_path_cache)
  147. current_time = time()
  148. if (mod_time + self.cache_max_age) > current_time:
  149. if os.path.isfile(self.cache_path_index):
  150. return True
  151. return False
  152. def read_settings(self):
  153. ''' Reads the settings from the ec2.ini file '''
  154. config = ConfigParser.SafeConfigParser()
  155. ec2_default_ini_path = os.path.join(os.path.dirname(os.path.realpath(__file__)), 'ec2.ini')
  156. ec2_ini_path = os.environ.get('EC2_INI_PATH', ec2_default_ini_path)
  157. config.read(ec2_ini_path)
  158. # is eucalyptus?
  159. self.eucalyptus_host = None
  160. self.eucalyptus = False
  161. if config.has_option('ec2', 'eucalyptus'):
  162. self.eucalyptus = config.getboolean('ec2', 'eucalyptus')
  163. if self.eucalyptus and config.has_option('ec2', 'eucalyptus_host'):
  164. self.eucalyptus_host = config.get('ec2', 'eucalyptus_host')
  165. # Regions
  166. self.regions = []
  167. configRegions = config.get('ec2', 'regions')
  168. configRegions_exclude = config.get('ec2', 'regions_exclude')
  169. if (configRegions == 'all'):
  170. if self.eucalyptus_host:
  171. self.regions.append(boto.connect_euca(host=self.eucalyptus_host).region.name)
  172. else:
  173. for regionInfo in ec2.regions():
  174. if regionInfo.name not in configRegions_exclude:
  175. self.regions.append(regionInfo.name)
  176. else:
  177. self.regions = configRegions.split(",")
  178. # Destination addresses
  179. self.destination_variable = config.get('ec2', 'destination_variable')
  180. self.vpc_destination_variable = config.get('ec2', 'vpc_destination_variable')
  181. # Route53
  182. self.route53_enabled = config.getboolean('ec2', 'route53')
  183. self.route53_excluded_zones = []
  184. if config.has_option('ec2', 'route53_excluded_zones'):
  185. self.route53_excluded_zones.extend(
  186. config.get('ec2', 'route53_excluded_zones', '').split(','))
  187. # Cache related
  188. cache_dir = os.path.expanduser(config.get('ec2', 'cache_path'))
  189. if not os.path.exists(cache_dir):
  190. os.makedirs(cache_dir)
  191. self.cache_path_cache = cache_dir + "/ansible-ec2.cache"
  192. self.cache_path_index = cache_dir + "/ansible-ec2.index"
  193. self.cache_max_age = config.getint('ec2', 'cache_max_age')
  194. def parse_cli_args(self):
  195. ''' Command line argument processing '''
  196. parser = argparse.ArgumentParser(description='Produce an Ansible Inventory file based on EC2')
  197. parser.add_argument('--list', action='store_true', default=True,
  198. help='List instances (default: True)')
  199. parser.add_argument('--host', action='store',
  200. help='Get all the variables about a specific instance')
  201. parser.add_argument('--refresh-cache', action='store_true', default=False,
  202. help='Force refresh of cache by making API requests to EC2 (default: False - use cache files)')
  203. self.args = parser.parse_args()
  204. def do_api_calls_update_cache(self):
  205. ''' Do API calls to each region, and save data in cache files '''
  206. if self.route53_enabled:
  207. self.get_route53_records()
  208. for region in self.regions:
  209. self.get_instances_by_region(region)
  210. self.get_rds_instances_by_region(region)
  211. self.write_to_cache(self.inventory, self.cache_path_cache)
  212. self.write_to_cache(self.index, self.cache_path_index)
  213. def get_instances_by_region(self, region):
  214. ''' Makes an AWS EC2 API call to the list of instances in a particular
  215. region '''
  216. try:
  217. if self.eucalyptus:
  218. conn = boto.connect_euca(host=self.eucalyptus_host)
  219. conn.APIVersion = '2010-08-31'
  220. else:
  221. conn = ec2.connect_to_region(region)
  222. # connect_to_region will fail "silently" by returning None if the region name is wrong or not supported
  223. if conn is None:
  224. print("region name: %s likely not supported, or AWS is down. connection to region failed." % region)
  225. sys.exit(1)
  226. reservations = conn.get_all_instances()
  227. for reservation in reservations:
  228. for instance in reservation.instances:
  229. self.add_instance(instance, region)
  230. except boto.exception.BotoServerError, e:
  231. if not self.eucalyptus:
  232. print "Looks like AWS is down again:"
  233. print e
  234. sys.exit(1)
  235. def get_rds_instances_by_region(self, region):
  236. ''' Makes an AWS API call to the list of RDS instances in a particular
  237. region '''
  238. try:
  239. conn = rds.connect_to_region(region)
  240. if conn:
  241. instances = conn.get_all_dbinstances()
  242. for instance in instances:
  243. self.add_rds_instance(instance, region)
  244. except boto.exception.BotoServerError, e:
  245. if not e.reason == "Forbidden":
  246. print "Looks like AWS RDS is down: "
  247. print e
  248. sys.exit(1)
  249. def get_instance(self, region, instance_id):
  250. ''' Gets details about a specific instance '''
  251. if self.eucalyptus:
  252. conn = boto.connect_euca(self.eucalyptus_host)
  253. conn.APIVersion = '2010-08-31'
  254. else:
  255. conn = ec2.connect_to_region(region)
  256. # connect_to_region will fail "silently" by returning None if the region name is wrong or not supported
  257. if conn is None:
  258. print("region name: %s likely not supported, or AWS is down. connection to region failed." % region)
  259. sys.exit(1)
  260. reservations = conn.get_all_instances([instance_id])
  261. for reservation in reservations:
  262. for instance in reservation.instances:
  263. return instance
  264. def add_instance(self, instance, region):
  265. ''' Adds an instance to the inventory and index, as long as it is
  266. addressable '''
  267. # Only want running instances
  268. if instance.state != 'running':
  269. return
  270. # Select the best destination address
  271. if instance.subnet_id:
  272. dest = getattr(instance, self.vpc_destination_variable)
  273. else:
  274. dest = getattr(instance, self.destination_variable)
  275. if not dest:
  276. # Skip instances we cannot address (e.g. private VPC subnet)
  277. return
  278. # Add to index
  279. self.index[dest] = [region, instance.id]
  280. # Inventory: Group by instance ID (always a group of 1)
  281. self.inventory[instance.id] = [dest]
  282. # Inventory: Group by region
  283. self.push(self.inventory, region, dest)
  284. # Inventory: Group by availability zone
  285. self.push(self.inventory, instance.placement, dest)
  286. # Inventory: Group by instance type
  287. self.push(self.inventory, self.to_safe('type_' + instance.instance_type), dest)
  288. # Inventory: Group by key pair
  289. if instance.key_name:
  290. self.push(self.inventory, self.to_safe('key_' + instance.key_name), dest)
  291. # Inventory: Group by security group
  292. try:
  293. for group in instance.groups:
  294. key = self.to_safe("security_group_" + group.name)
  295. self.push(self.inventory, key, dest)
  296. except AttributeError:
  297. print 'Package boto seems a bit older.'
  298. print 'Please upgrade boto >= 2.3.0.'
  299. sys.exit(1)
  300. # Inventory: Group by tag keys
  301. for k, v in instance.tags.iteritems():
  302. key = self.to_safe("tag_" + k + "=" + v)
  303. self.push(self.inventory, key, dest)
  304. # Inventory: Group by Route53 domain names if enabled
  305. if self.route53_enabled:
  306. route53_names = self.get_instance_route53_names(instance)
  307. for name in route53_names:
  308. self.push(self.inventory, name, dest)
  309. # Global Tag: tag all EC2 instances
  310. self.push(self.inventory, 'ec2', dest)
  311. self.inventory["_meta"]["hostvars"][dest] = self.get_host_info_dict_from_instance(instance)
  312. def add_rds_instance(self, instance, region):
  313. ''' Adds an RDS instance to the inventory and index, as long as it is
  314. addressable '''
  315. # Only want available instances
  316. if instance.status != 'available':
  317. return
  318. # Select the best destination address
  319. #if instance.subnet_id:
  320. #dest = getattr(instance, self.vpc_destination_variable)
  321. #else:
  322. #dest = getattr(instance, self.destination_variable)
  323. dest = instance.endpoint[0]
  324. if not dest:
  325. # Skip instances we cannot address (e.g. private VPC subnet)
  326. return
  327. # Add to index
  328. self.index[dest] = [region, instance.id]
  329. # Inventory: Group by instance ID (always a group of 1)
  330. self.inventory[instance.id] = [dest]
  331. # Inventory: Group by region
  332. self.push(self.inventory, region, dest)
  333. # Inventory: Group by availability zone
  334. self.push(self.inventory, instance.availability_zone, dest)
  335. # Inventory: Group by instance type
  336. self.push(self.inventory, self.to_safe('type_' + instance.instance_class), dest)
  337. # Inventory: Group by security group
  338. try:
  339. if instance.security_group:
  340. key = self.to_safe("security_group_" + instance.security_group.name)
  341. self.push(self.inventory, key, dest)
  342. except AttributeError:
  343. print 'Package boto seems a bit older.'
  344. print 'Please upgrade boto >= 2.3.0.'
  345. sys.exit(1)
  346. # Inventory: Group by engine
  347. self.push(self.inventory, self.to_safe("rds_" + instance.engine), dest)
  348. # Inventory: Group by parameter group
  349. self.push(self.inventory, self.to_safe("rds_parameter_group_" + instance.parameter_group.name), dest)
  350. # Global Tag: all RDS instances
  351. self.push(self.inventory, 'rds', dest)
  352. def get_route53_records(self):
  353. ''' Get and store the map of resource records to domain names that
  354. point to them. '''
  355. r53_conn = route53.Route53Connection()
  356. all_zones = r53_conn.get_zones()
  357. route53_zones = [ zone for zone in all_zones if zone.name[:-1]
  358. not in self.route53_excluded_zones ]
  359. self.route53_records = {}
  360. for zone in route53_zones:
  361. rrsets = r53_conn.get_all_rrsets(zone.id)
  362. for record_set in rrsets:
  363. record_name = record_set.name
  364. if record_name.endswith('.'):
  365. record_name = record_name[:-1]
  366. for resource in record_set.resource_records:
  367. self.route53_records.setdefault(resource, set())
  368. self.route53_records[resource].add(record_name)
  369. def get_instance_route53_names(self, instance):
  370. ''' Check if an instance is referenced in the records we have from
  371. Route53. If it is, return the list of domain names pointing to said
  372. instance. If nothing points to it, return an empty list. '''
  373. instance_attributes = [ 'public_dns_name', 'private_dns_name',
  374. 'ip_address', 'private_ip_address' ]
  375. name_list = set()
  376. for attrib in instance_attributes:
  377. try:
  378. value = getattr(instance, attrib)
  379. except AttributeError:
  380. continue
  381. if value in self.route53_records:
  382. name_list.update(self.route53_records[value])
  383. return list(name_list)
  384. def get_host_info_dict_from_instance(self, instance):
  385. instance_vars = {}
  386. for key in vars(instance):
  387. value = getattr(instance, key)
  388. key = self.to_safe('ec2_' + key)
  389. # Handle complex types
  390. # state/previous_state changed to properties in boto in https://github.com/boto/boto/commit/a23c379837f698212252720d2af8dec0325c9518
  391. if key == 'ec2__state':
  392. instance_vars['ec2_state'] = instance.state or ''
  393. instance_vars['ec2_state_code'] = instance.state_code
  394. elif key == 'ec2__previous_state':
  395. instance_vars['ec2_previous_state'] = instance.previous_state or ''
  396. instance_vars['ec2_previous_state_code'] = instance.previous_state_code
  397. elif type(value) in [int, bool]:
  398. instance_vars[key] = value
  399. elif type(value) in [str, unicode]:
  400. instance_vars[key] = value.strip()
  401. elif type(value) == type(None):
  402. instance_vars[key] = ''
  403. elif key == 'ec2_region':
  404. instance_vars[key] = value.name
  405. elif key == 'ec2__placement':
  406. instance_vars['ec2_placement'] = value.zone
  407. elif key == 'ec2_tags':
  408. for k, v in value.iteritems():
  409. key = self.to_safe('ec2_tag_' + k)
  410. instance_vars[key] = v
  411. elif key == 'ec2_groups':
  412. group_ids = []
  413. group_names = []
  414. for group in value:
  415. group_ids.append(group.id)
  416. group_names.append(group.name)
  417. instance_vars["ec2_security_group_ids"] = ','.join(group_ids)
  418. instance_vars["ec2_security_group_names"] = ','.join(group_names)
  419. else:
  420. pass
  421. # TODO Product codes if someone finds them useful
  422. #print key
  423. #print type(value)
  424. #print value
  425. return instance_vars
  426. def get_host_info(self):
  427. ''' Get variables about a specific host '''
  428. if len(self.index) == 0:
  429. # Need to load index from cache
  430. self.load_index_from_cache()
  431. if not self.args.host in self.index:
  432. # try updating the cache
  433. self.do_api_calls_update_cache()
  434. if not self.args.host in self.index:
  435. # host migh not exist anymore
  436. return self.json_format_dict({}, True)
  437. (region, instance_id) = self.index[self.args.host]
  438. instance = self.get_instance(region, instance_id)
  439. return self.json_format_dict(self.get_host_info_dict_from_instance(instance), True)
  440. def push(self, my_dict, key, element):
  441. ''' Pushed an element onto an array that may not have been defined in
  442. the dict '''
  443. if key in my_dict:
  444. my_dict[key].append(element);
  445. else:
  446. my_dict[key] = [element]
  447. def get_inventory_from_cache(self):
  448. ''' Reads the inventory from the cache file and returns it as a JSON
  449. object '''
  450. cache = open(self.cache_path_cache, 'r')
  451. json_inventory = cache.read()
  452. return json_inventory
  453. def load_index_from_cache(self):
  454. ''' Reads the index from the cache file sets self.index '''
  455. cache = open(self.cache_path_index, 'r')
  456. json_index = cache.read()
  457. self.index = json.loads(json_index)
  458. def write_to_cache(self, data, filename):
  459. ''' Writes data in JSON format to a file '''
  460. json_data = self.json_format_dict(data, True)
  461. cache = open(filename, 'w')
  462. cache.write(json_data)
  463. cache.close()
  464. def to_safe(self, word):
  465. ''' Converts 'bad' characters in a string to underscores so they can be
  466. used as Ansible groups '''
  467. return re.sub("[^A-Za-z0-9\-]", "_", word)
  468. def json_format_dict(self, data, pretty=False):
  469. ''' Converts a dict to a JSON object and dumps it as a formatted
  470. string '''
  471. if pretty:
  472. return json.dumps(data, sort_keys=True, indent=2)
  473. else:
  474. return json.dumps(data)
  475. # Run the script
  476. Ec2Inventory()