2014-07-10 20:43:39 +02:00
|
|
|
#!/usr/bin/env python
|
|
|
|
|
|
|
|
"""
|
|
|
|
Collins external inventory script
|
|
|
|
=================================
|
|
|
|
|
|
|
|
Ansible has a feature where instead of reading from /etc/ansible/hosts
|
|
|
|
as a text file, it can query external programs to obtain the list
|
|
|
|
of hosts, groups the hosts are in, and even variables to assign to each host.
|
|
|
|
|
|
|
|
Collins is a hardware asset management system originally developed by
|
|
|
|
Tumblr for tracking new hardware as it built out its own datacenters. It
|
|
|
|
exposes a rich API for manipulating and querying one's hardware inventory,
|
|
|
|
which makes it an ideal 'single point of truth' for driving systems
|
|
|
|
automation like Ansible. Extensive documentation on Collins, including a quickstart,
|
|
|
|
API docs, and a full reference manual, can be found here:
|
|
|
|
|
|
|
|
http://tumblr.github.io/collins
|
|
|
|
|
|
|
|
This script adds support to Ansible for obtaining a dynamic inventory of
|
|
|
|
assets in your infrastructure, grouping them in Ansible by their useful attributes,
|
|
|
|
and binding all facts provided by Collins to each host so that they can be used to
|
|
|
|
drive automation. Some parts of this script were cribbed shamelessly from mdehaan's
|
|
|
|
Cobbler inventory script.
|
|
|
|
|
|
|
|
To use it, copy it to your repo and pass -i <collins script> to the ansible or
|
|
|
|
ansible-playbook command; if you'd like to use it by default, simply copy collins.ini
|
|
|
|
to /etc/ansible and this script to /etc/ansible/hosts.
|
|
|
|
|
|
|
|
Alongside the options set in collins.ini, there are several environment variables
|
|
|
|
that will be used instead of the configured values if they are set:
|
|
|
|
|
|
|
|
- COLLINS_USERNAME - specifies a username to use for Collins authentication
|
|
|
|
- COLLINS_PASSWORD - specifies a password to use for Collins authentication
|
|
|
|
- COLLINS_ASSET_TYPE - specifies a Collins asset type to use during querying;
|
|
|
|
this can be used to run Ansible automation against different asset classes than
|
|
|
|
server nodes, such as network switches and PDUs
|
|
|
|
- COLLINS_CONFIG - specifies an alternative location for collins.ini, defaults to
|
|
|
|
<location of collins.py>/collins.ini
|
|
|
|
|
|
|
|
If errors are encountered during operation, this script will return an exit code of
|
|
|
|
255; otherwise, it will return an exit code of 0.
|
|
|
|
|
2015-04-28 15:36:42 +02:00
|
|
|
Collins attributes are accessible as variables in ansible via the COLLINS['attribute_name'].
|
2015-02-06 15:06:09 +01:00
|
|
|
|
|
|
|
Tested against Ansible 1.8.2 and Collins 1.3.0.
|
2014-07-10 20:43:39 +02:00
|
|
|
"""
|
|
|
|
|
|
|
|
# (c) 2014, Steve Salevan <steve.salevan@gmail.com>
|
|
|
|
#
|
|
|
|
# This file is part of Ansible.
|
|
|
|
#
|
|
|
|
# Ansible is free software: you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
# the Free Software Foundation, either version 3 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
#
|
|
|
|
# Ansible is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with Ansible. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
######################################################################
|
|
|
|
|
|
|
|
|
|
|
|
import argparse
|
|
|
|
import base64
|
|
|
|
import ConfigParser
|
|
|
|
import logging
|
|
|
|
import os
|
|
|
|
import re
|
|
|
|
import sys
|
|
|
|
from time import time
|
|
|
|
import traceback
|
|
|
|
import urllib
|
|
|
|
import urllib2
|
|
|
|
|
|
|
|
try:
|
|
|
|
import json
|
|
|
|
except ImportError:
|
|
|
|
import simplejson as json
|
|
|
|
|
2015-09-03 08:23:27 +02:00
|
|
|
from six import iteritems
|
|
|
|
|
2014-07-10 20:43:39 +02:00
|
|
|
|
|
|
|
class CollinsDefaults(object):
|
|
|
|
ASSETS_API_ENDPOINT = '%s/api/assets'
|
|
|
|
SPECIAL_ATTRIBUTES = set([
|
|
|
|
'CREATED',
|
|
|
|
'DELETED',
|
|
|
|
'UPDATED',
|
|
|
|
'STATE',
|
|
|
|
])
|
|
|
|
LOG_FORMAT = '%(asctime)-15s %(message)s'
|
|
|
|
|
|
|
|
|
2014-07-10 21:32:39 +02:00
|
|
|
class Error(Exception):
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
|
|
|
class MaxRetriesError(Error):
|
|
|
|
pass
|
|
|
|
|
|
|
|
|
2014-07-10 20:43:39 +02:00
|
|
|
class CollinsInventory(object):
|
|
|
|
|
|
|
|
def __init__(self):
|
2014-07-10 21:32:39 +02:00
|
|
|
""" Constructs CollinsInventory object and reads all configuration. """
|
2014-07-10 20:43:39 +02:00
|
|
|
|
|
|
|
self.inventory = dict() # A list of groups and the hosts in that group
|
|
|
|
self.cache = dict() # Details about hosts in the inventory
|
|
|
|
|
|
|
|
# Read settings and parse CLI arguments
|
|
|
|
self.read_settings()
|
|
|
|
self.parse_cli_args()
|
|
|
|
|
|
|
|
logging.basicConfig(format=CollinsDefaults.LOG_FORMAT,
|
|
|
|
filename=self.log_location)
|
|
|
|
self.log = logging.getLogger('CollinsInventory')
|
|
|
|
|
2014-07-10 21:32:39 +02:00
|
|
|
def _asset_get_attribute(self, asset, attrib):
|
|
|
|
""" Returns a user-defined attribute from an asset if it exists; otherwise,
|
|
|
|
returns None. """
|
|
|
|
|
|
|
|
if 'ATTRIBS' in asset:
|
|
|
|
for attrib_block in asset['ATTRIBS'].keys():
|
|
|
|
if attrib in asset['ATTRIBS'][attrib_block]:
|
|
|
|
return asset['ATTRIBS'][attrib_block][attrib]
|
|
|
|
return None
|
|
|
|
|
|
|
|
def _asset_has_attribute(self, asset, attrib):
|
|
|
|
""" Returns whether a user-defined attribute is present on an asset. """
|
|
|
|
|
|
|
|
if 'ATTRIBS' in asset:
|
|
|
|
for attrib_block in asset['ATTRIBS'].keys():
|
|
|
|
if attrib in asset['ATTRIBS'][attrib_block]:
|
|
|
|
return True
|
|
|
|
return False
|
|
|
|
|
2014-07-10 20:43:39 +02:00
|
|
|
def run(self):
|
2014-07-10 21:32:39 +02:00
|
|
|
""" Main execution path """
|
|
|
|
|
2014-07-10 20:43:39 +02:00
|
|
|
# Updates cache if cache is not present or has expired.
|
|
|
|
successful = True
|
|
|
|
if self.args.refresh_cache:
|
|
|
|
successful = self.update_cache()
|
|
|
|
elif not self.is_cache_valid():
|
|
|
|
successful = self.update_cache()
|
|
|
|
else:
|
|
|
|
successful = self.load_inventory_from_cache()
|
|
|
|
successful &= self.load_cache_from_cache()
|
|
|
|
|
|
|
|
data_to_print = ""
|
|
|
|
|
|
|
|
# Data to print
|
|
|
|
if self.args.host:
|
|
|
|
data_to_print = self.get_host_info()
|
|
|
|
|
|
|
|
elif self.args.list:
|
|
|
|
# Display list of instances for inventory
|
|
|
|
data_to_print = self.json_format_dict(self.inventory, self.args.pretty)
|
|
|
|
|
|
|
|
else: # default action with no options
|
|
|
|
data_to_print = self.json_format_dict(self.inventory, self.args.pretty)
|
|
|
|
|
2015-08-28 08:18:13 +02:00
|
|
|
print(data_to_print)
|
2014-07-10 20:43:39 +02:00
|
|
|
return successful
|
|
|
|
|
|
|
|
def find_assets(self, attributes = {}, operation = 'AND'):
|
|
|
|
""" Obtains Collins assets matching the provided attributes. """
|
|
|
|
|
|
|
|
# Formats asset search query to locate assets matching attributes, using
|
|
|
|
# the CQL search feature as described here:
|
|
|
|
# http://tumblr.github.io/collins/recipes.html
|
|
|
|
attributes_query = [ '='.join(attr_pair)
|
2015-09-03 08:23:27 +02:00
|
|
|
for attr_pair in iteritems(attributes) ]
|
2014-07-10 20:43:39 +02:00
|
|
|
query_parameters = {
|
|
|
|
'details': ['True'],
|
|
|
|
'operation': [operation],
|
|
|
|
'query': attributes_query,
|
|
|
|
'remoteLookup': [str(self.query_remote_dcs)],
|
|
|
|
'size': [self.results_per_query],
|
|
|
|
'type': [self.collins_asset_type],
|
|
|
|
}
|
|
|
|
assets = []
|
|
|
|
cur_page = 0
|
|
|
|
num_retries = 0
|
|
|
|
# Locates all assets matching the provided query, exhausting pagination.
|
|
|
|
while True:
|
|
|
|
if num_retries == self.collins_max_retries:
|
2014-07-10 21:32:39 +02:00
|
|
|
raise MaxRetriesError("Maximum of %s retries reached; giving up" % \
|
2014-07-10 20:43:39 +02:00
|
|
|
self.collins_max_retries)
|
|
|
|
query_parameters['page'] = cur_page
|
|
|
|
query_url = "%s?%s" % (
|
|
|
|
(CollinsDefaults.ASSETS_API_ENDPOINT % self.collins_host),
|
|
|
|
urllib.urlencode(query_parameters, doseq=True)
|
|
|
|
)
|
|
|
|
request = urllib2.Request(query_url)
|
|
|
|
request.add_header('Authorization', self.basic_auth_header)
|
|
|
|
try:
|
|
|
|
response = urllib2.urlopen(request, timeout=self.collins_timeout_secs)
|
|
|
|
json_response = json.loads(response.read())
|
|
|
|
# Adds any assets found to the array of assets.
|
|
|
|
assets += json_response['data']['Data']
|
|
|
|
# If we've retrieved all of our assets, breaks out of the loop.
|
|
|
|
if len(json_response['data']['Data']) == 0:
|
|
|
|
break
|
|
|
|
cur_page += 1
|
|
|
|
num_retries = 0
|
|
|
|
except:
|
|
|
|
self.log.error("Error while communicating with Collins, retrying:\n%s",
|
|
|
|
traceback.format_exc())
|
|
|
|
num_retries += 1
|
|
|
|
return assets
|
|
|
|
|
|
|
|
def is_cache_valid(self):
|
|
|
|
""" Determines if the cache files have expired, or if it is still valid """
|
|
|
|
|
|
|
|
if os.path.isfile(self.cache_path_cache):
|
|
|
|
mod_time = os.path.getmtime(self.cache_path_cache)
|
|
|
|
current_time = time()
|
|
|
|
if (mod_time + self.cache_max_age) > current_time:
|
|
|
|
if os.path.isfile(self.cache_path_inventory):
|
|
|
|
return True
|
|
|
|
|
|
|
|
return False
|
|
|
|
|
|
|
|
def read_settings(self):
|
|
|
|
""" Reads the settings from the collins.ini file """
|
|
|
|
|
|
|
|
config_loc = os.getenv('COLLINS_CONFIG',
|
|
|
|
os.path.dirname(os.path.realpath(__file__)) + '/collins.ini')
|
|
|
|
|
|
|
|
config = ConfigParser.SafeConfigParser()
|
|
|
|
config.read(os.path.dirname(os.path.realpath(__file__)) + '/collins.ini')
|
|
|
|
|
|
|
|
self.collins_host = config.get('collins', 'host')
|
|
|
|
self.collins_username = os.getenv('COLLINS_USERNAME',
|
|
|
|
config.get('collins', 'username'))
|
|
|
|
self.collins_password = os.getenv('COLLINS_PASSWORD',
|
|
|
|
config.get('collins', 'password'))
|
|
|
|
self.collins_asset_type = os.getenv('COLLINS_ASSET_TYPE',
|
|
|
|
config.get('collins', 'asset_type'))
|
|
|
|
self.collins_timeout_secs = config.getint('collins', 'timeout_secs')
|
|
|
|
self.collins_max_retries = config.getint('collins', 'max_retries')
|
|
|
|
|
|
|
|
self.results_per_query = config.getint('collins', 'results_per_query')
|
|
|
|
self.ip_address_index = config.getint('collins', 'ip_address_index')
|
|
|
|
self.query_remote_dcs = config.getboolean('collins', 'query_remote_dcs')
|
|
|
|
self.prefer_hostnames = config.getboolean('collins', 'prefer_hostnames')
|
|
|
|
|
|
|
|
cache_path = config.get('collins', 'cache_path')
|
|
|
|
self.cache_path_cache = cache_path + \
|
|
|
|
'/ansible-collins-%s.cache' % self.collins_asset_type
|
|
|
|
self.cache_path_inventory = cache_path + \
|
|
|
|
'/ansible-collins-%s.index' % self.collins_asset_type
|
|
|
|
self.cache_max_age = config.getint('collins', 'cache_max_age')
|
|
|
|
|
|
|
|
log_path = config.get('collins', 'log_path')
|
|
|
|
self.log_location = log_path + '/ansible-collins.log'
|
|
|
|
self.basic_auth_header = "Basic %s" % base64.encodestring(
|
|
|
|
'%s:%s' % (self.collins_username, self.collins_password))[:-1]
|
|
|
|
|
|
|
|
def parse_cli_args(self):
|
|
|
|
""" Command line argument processing """
|
|
|
|
|
|
|
|
parser = argparse.ArgumentParser(
|
|
|
|
description='Produces an Ansible Inventory file based on Collins')
|
|
|
|
parser.add_argument('--list',
|
|
|
|
action='store_true', default=True, help='List instances (default: True)')
|
|
|
|
parser.add_argument('--host',
|
|
|
|
action='store', help='Get all the variables about a specific instance')
|
|
|
|
parser.add_argument('--refresh-cache',
|
|
|
|
action='store_true', default=False,
|
|
|
|
help='Force refresh of cache by making API requests to Collins ' \
|
|
|
|
'(default: False - use cache files)')
|
|
|
|
parser.add_argument('--pretty',
|
|
|
|
action='store_true', default=False, help='Pretty print all JSON output')
|
|
|
|
self.args = parser.parse_args()
|
|
|
|
|
|
|
|
def update_cache(self):
|
|
|
|
""" Make calls to Collins and saves the output in a cache """
|
|
|
|
|
|
|
|
self.cache = dict()
|
|
|
|
self.inventory = dict()
|
|
|
|
|
|
|
|
# Locates all server assets from Collins.
|
|
|
|
try:
|
|
|
|
server_assets = self.find_assets()
|
|
|
|
except:
|
|
|
|
self.log.error("Error while locating assets from Collins:\n%s",
|
|
|
|
traceback.format_exc())
|
|
|
|
return False
|
|
|
|
|
|
|
|
for asset in server_assets:
|
|
|
|
# Determines the index to retrieve the asset's IP address either by an
|
|
|
|
# attribute set on the Collins asset or the pre-configured value.
|
|
|
|
if self._asset_has_attribute(asset, 'ANSIBLE_IP_INDEX'):
|
|
|
|
ip_index = self._asset_get_attribute(asset, 'ANSIBLE_IP_INDEX')
|
|
|
|
try:
|
|
|
|
ip_index = int(ip_index)
|
|
|
|
except:
|
|
|
|
self.log.error(
|
|
|
|
"ANSIBLE_IP_INDEX attribute on asset %s not an integer: %s", asset,
|
|
|
|
ip_index)
|
|
|
|
else:
|
|
|
|
ip_index = self.ip_address_index
|
|
|
|
|
2015-02-06 15:06:09 +01:00
|
|
|
asset['COLLINS'] = {}
|
|
|
|
|
2014-07-10 20:43:39 +02:00
|
|
|
# Attempts to locate the asset's primary identifier (hostname or IP address),
|
|
|
|
# which will be used to index the asset throughout the Ansible inventory.
|
|
|
|
if self.prefer_hostnames and self._asset_has_attribute(asset, 'HOSTNAME'):
|
|
|
|
asset_identifier = self._asset_get_attribute(asset, 'HOSTNAME')
|
|
|
|
elif 'ADDRESSES' not in asset:
|
|
|
|
self.log.warning("No IP addresses found for asset '%s', skipping",
|
|
|
|
asset)
|
|
|
|
continue
|
|
|
|
elif len(asset['ADDRESSES']) < ip_index + 1:
|
|
|
|
self.log.warning(
|
|
|
|
"No IP address found at index %s for asset '%s', skipping",
|
|
|
|
ip_index, asset)
|
|
|
|
continue
|
|
|
|
else:
|
|
|
|
asset_identifier = asset['ADDRESSES'][ip_index]['ADDRESS']
|
|
|
|
|
|
|
|
# Adds an asset index to the Ansible inventory based upon unpacking
|
|
|
|
# the name of the asset's current STATE from its dictionary.
|
|
|
|
if 'STATE' in asset['ASSET'] and asset['ASSET']['STATE']:
|
2014-07-10 21:18:13 +02:00
|
|
|
state_inventory_key = self.to_safe(
|
|
|
|
'STATE-%s' % asset['ASSET']['STATE']['NAME'])
|
2014-07-10 20:43:39 +02:00
|
|
|
self.push(self.inventory, state_inventory_key, asset_identifier)
|
|
|
|
|
|
|
|
# Indexes asset by all user-defined Collins attributes.
|
|
|
|
if 'ATTRIBS' in asset:
|
|
|
|
for attrib_block in asset['ATTRIBS'].keys():
|
|
|
|
for attrib in asset['ATTRIBS'][attrib_block].keys():
|
2015-02-06 15:06:09 +01:00
|
|
|
asset['COLLINS'][attrib] = asset['ATTRIBS'][attrib_block][attrib]
|
|
|
|
attrib_key = self.to_safe('%s-%s' % (attrib, asset['ATTRIBS'][attrib_block][attrib]))
|
2014-07-10 20:43:39 +02:00
|
|
|
self.push(self.inventory, attrib_key, asset_identifier)
|
|
|
|
|
|
|
|
# Indexes asset by all built-in Collins attributes.
|
|
|
|
for attribute in asset['ASSET'].keys():
|
|
|
|
if attribute not in CollinsDefaults.SPECIAL_ATTRIBUTES:
|
|
|
|
attribute_val = asset['ASSET'][attribute]
|
|
|
|
if attribute_val is not None:
|
2014-07-10 21:18:13 +02:00
|
|
|
attrib_key = self.to_safe('%s-%s' % (attribute, attribute_val))
|
2014-07-10 20:43:39 +02:00
|
|
|
self.push(self.inventory, attrib_key, asset_identifier)
|
|
|
|
|
|
|
|
# Indexes asset by hardware product information.
|
|
|
|
if 'HARDWARE' in asset:
|
|
|
|
if 'PRODUCT' in asset['HARDWARE']['BASE']:
|
|
|
|
product = asset['HARDWARE']['BASE']['PRODUCT']
|
|
|
|
if product:
|
2014-07-10 21:18:13 +02:00
|
|
|
product_key = self.to_safe(
|
2014-07-10 20:43:39 +02:00
|
|
|
'HARDWARE-PRODUCT-%s' % asset['HARDWARE']['BASE']['PRODUCT'])
|
|
|
|
self.push(self.inventory, product_key, asset_identifier)
|
|
|
|
|
|
|
|
# Indexing now complete, adds the host details to the asset cache.
|
|
|
|
self.cache[asset_identifier] = asset
|
|
|
|
|
|
|
|
try:
|
|
|
|
self.write_to_cache(self.cache, self.cache_path_cache)
|
|
|
|
self.write_to_cache(self.inventory, self.cache_path_inventory)
|
|
|
|
except:
|
|
|
|
self.log.error("Error while writing to cache:\n%s", traceback.format_exc())
|
|
|
|
return False
|
|
|
|
return True
|
|
|
|
|
|
|
|
def push(self, dictionary, key, value):
|
2014-07-10 21:32:39 +02:00
|
|
|
""" Adds a value to a list at a dictionary key, creating the list if it doesn't
|
|
|
|
exist. """
|
|
|
|
|
2014-07-10 20:43:39 +02:00
|
|
|
if key not in dictionary:
|
|
|
|
dictionary[key] = []
|
|
|
|
dictionary[key].append(value)
|
|
|
|
|
|
|
|
def get_host_info(self):
|
|
|
|
""" Get variables about a specific host. """
|
|
|
|
|
|
|
|
if not self.cache or len(self.cache) == 0:
|
|
|
|
# Need to load index from cache
|
|
|
|
self.load_cache_from_cache()
|
|
|
|
|
|
|
|
if not self.args.host in self.cache:
|
|
|
|
# try updating the cache
|
|
|
|
self.update_cache()
|
|
|
|
|
|
|
|
if not self.args.host in self.cache:
|
|
|
|
# host might not exist anymore
|
|
|
|
return self.json_format_dict({}, self.args.pretty)
|
|
|
|
|
|
|
|
return self.json_format_dict(self.cache[self.args.host], self.args.pretty)
|
|
|
|
|
|
|
|
def load_inventory_from_cache(self):
|
|
|
|
""" Reads the index from the cache file sets self.index """
|
|
|
|
|
|
|
|
try:
|
|
|
|
cache = open(self.cache_path_inventory, 'r')
|
|
|
|
json_inventory = cache.read()
|
|
|
|
self.inventory = json.loads(json_inventory)
|
|
|
|
return True
|
|
|
|
except:
|
|
|
|
self.log.error("Error while loading inventory:\n%s",
|
|
|
|
traceback.format_exc())
|
|
|
|
self.inventory = {}
|
|
|
|
return False
|
|
|
|
|
|
|
|
def load_cache_from_cache(self):
|
|
|
|
""" Reads the cache from the cache file sets self.cache """
|
|
|
|
|
|
|
|
try:
|
|
|
|
cache = open(self.cache_path_cache, 'r')
|
|
|
|
json_cache = cache.read()
|
|
|
|
self.cache = json.loads(json_cache)
|
|
|
|
return True
|
|
|
|
except:
|
|
|
|
self.log.error("Error while loading host cache:\n%s",
|
|
|
|
traceback.format_exc())
|
|
|
|
self.cache = {}
|
|
|
|
return False
|
|
|
|
|
|
|
|
def write_to_cache(self, data, filename):
|
|
|
|
""" Writes data in JSON format to a specified file. """
|
|
|
|
|
|
|
|
json_data = self.json_format_dict(data, self.args.pretty)
|
|
|
|
cache = open(filename, 'w')
|
|
|
|
cache.write(json_data)
|
|
|
|
cache.close()
|
|
|
|
|
2014-07-10 21:18:13 +02:00
|
|
|
def to_safe(self, word):
|
|
|
|
""" Converts 'bad' characters in a string to underscores so they
|
|
|
|
can be used as Ansible groups """
|
|
|
|
|
|
|
|
return re.sub("[^A-Za-z0-9\-]", "_", word)
|
|
|
|
|
2014-07-10 20:43:39 +02:00
|
|
|
def json_format_dict(self, data, pretty=False):
|
|
|
|
""" Converts a dict to a JSON object and dumps it as a formatted string """
|
|
|
|
|
|
|
|
if pretty:
|
|
|
|
return json.dumps(data, sort_keys=True, indent=2)
|
|
|
|
else:
|
|
|
|
return json.dumps(data)
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ in '__main__':
|
|
|
|
inventory = CollinsInventory()
|
|
|
|
if inventory.run():
|
|
|
|
sys.exit(0)
|
|
|
|
else:
|
|
|
|
sys.exit(-1)
|