#!/usr/bin/python
# -*- coding: utf-8 -*-

# (c) 2012, Jan-Piet Mens <jpmens () gmail.com>
#
# This file is part of Ansible
#
# Ansible is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# Ansible is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with Ansible. If not, see <http://www.gnu.org/licenses/>.
#
# see examples/playbooks/get_url.yml
|
2012-07-20 12:57:15 +02:00
|
|
|
|
|
|
|
import datetime
import os
import shutil
import sys
import tempfile
|
|
|
|
|
2012-09-17 15:11:04 +02:00
|
|
|
# YAML description of this module: its purpose, options, an example and notes.
DOCUMENTATION = '''
---
module: get_url
short_description: Downloads files from HTTP, HTTPS, or FTP to node
description:
     - Downloads files from HTTP, HTTPS, or FTP to the remote server. The remote
       server I(must) have direct access to the remote resource.
version_added: "0.6"
options:
  url:
    description:
      - HTTP, HTTPS, or FTP URL in the form (http|https|ftp)://[user[:pass]]@host.domain[:port]/path
    required: true
    default: null
    aliases: []
  dest:
    description:
      - absolute path of where to download the file to.
      - If I(dest) is a directory, the basename of the file on the remote server will be used. If a directory, C(thirsty=yes) must also be set.
    required: true
    default: null
  thirsty:
    description:
      - if C(yes), will download the file every time and replace the
        file if the contents change. If C(no), the file will only be downloaded if
        the destination does not exist. Generally should be C(yes) only for small
        local files. Prior to 0.6, acts as if C(yes) by default.
    version_added: "0.7"
    required: false
    choices: [ "yes", "no" ]
    default: "no"
  others:
    description:
      - all arguments accepted by the M(file) module also work here
    required: false
examples:
   - code: "get_url: url=http://example.com/path/file.conf dest=/etc/foo.conf mode=0440"
     description: "Example from Ansible Playbooks"
notes:
    - This module doesn't yet support configuration for proxies.
# informational: requirements for nodes
requirements: [ urllib2, urlparse ]
author: Jan-Piet Mens
'''
|
|
|
|
|
2013-01-24 21:19:14 +01:00
|
|
|
# Probe for the URL libraries and remember the outcome in module-level flags;
# main() inspects these flags and reports a missing library via fail_json().
try:
    import urllib2
except ImportError:
    HAS_URLLIB2 = False
else:
    HAS_URLLIB2 = True

# urlparse and socket are probed together: a failure of either import
# clears HAS_URLPARSE.
try:
    import urlparse
    import socket
except ImportError:
    HAS_URLPARSE = False
else:
    HAS_URLPARSE = True
|
|
|
|
|
|
|
|
# ==============================================================
|
|
|
|
# url handling
|
|
|
|
|
|
|
|
def url_filename(url):
    """
    Return the final component of the path part of url.
    When that component is empty the name 'index.html' is returned instead.
    """
    path = urlparse.urlsplit(url)[2]
    name = os.path.basename(path)
    return name or 'index.html'
|
2012-07-20 12:57:15 +02:00
|
|
|
|
2012-07-22 17:08:16 +02:00
|
|
|
def url_do_get(module, url, dest):
    """
    Get url and return request and info
    Credits: http://stackoverflow.com/questions/7006574/how-to-download-file-from-ftp

    module -- only used to call module.fail_json() when the request fails
              with a urllib2.URLError that is not an HTTPError.
    url    -- URL to open; for http/https, credentials embedded in the
              network location are removed from the URL and supplied
              through an HTTP basic-auth handler instead.
    dest   -- local path; when it exists its mtime is sent as an
              If-Modified-Since header.

    Returns (r, info). r is the object returned by urllib2.urlopen(), or
    None when an HTTPError was raised. info is a dict holding url, dest,
    the response headers, msg and status (200 on success, the HTTP error
    code otherwise).
    """

    USERAGENT = 'ansible-httpget'
    info = dict(url=url, dest=dest)
    r = None

    parsed = urlparse.urlparse(url)
    # Only HTTP(S) credentials are moved into an auth handler: the FTP handler
    # of urllib2 reads user/password from the URL itself, so they must stay
    # there for ftp:// URLs.
    if parsed.scheme in ('http', 'https') and '@' in parsed.netloc:
        # split on the LAST '@' so a password containing '@' stays intact
        credentials, netloc = parsed.netloc.rsplit('@', 1)
        if ':' in credentials:
            # split on the FIRST ':' so a password containing ':' stays intact
            username, password = credentials.split(':', 1)
        else:
            # user name without password
            username, password = credentials, ''
        parsed = list(parsed)
        parsed[1] = netloc

        # this creates a password manager
        passman = urllib2.HTTPPasswordMgrWithDefaultRealm()
        # because we have put None at the start it will always
        # use this username/password combination for urls
        # for which netloc is a super-url
        passman.add_password(None, netloc, username, password)

        # create the AuthHandler
        authhandler = urllib2.HTTPBasicAuthHandler(passman)

        # NOTE: install_opener() replaces the process-wide default opener
        opener = urllib2.build_opener(authhandler)
        urllib2.install_opener(opener)
        # reconstruct url without credentials
        url = urlparse.urlunparse(parsed)

    request = urllib2.Request(url)
    request.add_header('User-agent', USERAGENT)

    if os.path.exists(dest):
        t = datetime.datetime.utcfromtimestamp(os.path.getmtime(dest))
        tstamp = t.strftime('%a, %d %b %Y %H:%M:%S +0000')
        request.add_header('If-Modified-Since', tstamp)

    # sys.exc_info() is used instead of "except X, e" / "except X as e" so
    # that this code parses on old and new interpreters alike.
    try:
        r = urllib2.urlopen(request)
        info.update(r.info())
        info.update(dict(msg="OK (%s bytes)" % r.headers.get('Content-Length', 'unknown'), status=200))
    except urllib2.HTTPError:
        e = sys.exc_info()[1]
        # Must not fail_json() here so caller can handle HTTP 304 unmodified
        info.update(dict(msg=str(e), status=e.code))
        return r, info
    except urllib2.URLError:
        e = sys.exc_info()[1]
        code = getattr(e, 'code', -1)
        module.fail_json(msg="Request failed: %s" % str(e), status_code=code)

    return r, info
|
|
|
|
|
2012-07-22 17:08:16 +02:00
|
|
|
def url_get(module, url, dest):
    """
    Download url into a temporary file.

    dest is not written here; it is passed on to url_do_get() and echoed in
    the exit/fail results.

    Return (tempfile, info about the request)

    Calls module.exit_json(changed=False) when the server answers 304, and
    module.fail_json() for any other non-200 status or when the content
    cannot be written to the temporary file.
    """

    req, info = url_do_get(module, url, dest)

    # TODO: should really handle 304, but how? src file could exist (and be newer) but empty
    if info['status'] == 304:
        module.exit_json(url=url, dest=dest, changed=False, msg=info.get('msg', ''))

    if info['status'] != 200:
        module.fail_json(msg="Request failed", status_code=info['status'], response=info['msg'], url=url, dest=dest)

    # create a temporary file and copy content to do md5-based replacement
    fd, tempname = tempfile.mkstemp()
    f = os.fdopen(fd, 'wb')
    try:
        try:
            shutil.copyfileobj(req, f)
        finally:
            # close() performs the final flush, so it is kept inside the outer
            # try: a late write error is reported like any other copy failure.
            try:
                f.close()
            finally:
                req.close()
    except Exception:
        err = sys.exc_info()[1]
        os.remove(tempname)
        module.fail_json(msg="failed to create temporary content file: %s" % str(err))
    return tempname, info
|
2012-07-20 12:57:15 +02:00
|
|
|
|
|
|
|
# ==============================================================
|
|
|
|
# main
|
|
|
|
|
|
|
|
def _discard_and_fail(module, tmpsrc, msg):
    """Remove the downloaded temporary file, then fail the module with msg."""
    os.remove(tmpsrc)
    module.fail_json(msg=msg)


def main():
    """
    Module entry point: download `url` to a temporary file and copy it to
    `dest` when the md5 sums differ, then apply the common file arguments.

    Exits through module.exit_json() / module.fail_json().
    """

    module = AnsibleModule(
        # not checking because of daisy chain to file module
        argument_spec = dict(
            url = dict(required=True),
            dest = dict(required=True),
            thirsty = dict(default='no', choices=BOOLEANS)
        ),
        add_file_common_args=True
    )

    # does this really happen on non-ancient python?
    # These checks need `module`, so they have to run after it is created.
    if not HAS_URLLIB2:
        module.fail_json(msg="urllib2 is not installed")
    if not HAS_URLPARSE:
        module.fail_json(msg="urlparse is not installed")

    url = module.params['url']
    dest = os.path.expanduser(module.params['dest'])
    thirsty = module.boolean(module.params['thirsty'])

    if os.path.isdir(dest):
        dest = os.path.join(dest, url_filename(url))

    if not thirsty and os.path.exists(dest):
        module.exit_json(msg="file already exists", dest=dest, url=url, changed=False)

    # download to tmpsrc
    tmpsrc, info = url_get(module, url, dest)
    md5sum_dest = None

    # raise an error if there is no tmpsrc file
    if not os.path.exists(tmpsrc):
        # nothing to remove here: the file does not exist
        module.fail_json(msg="Request failed", status_code=info['status'], response=info['msg'])
    if not os.access(tmpsrc, os.R_OK):
        _discard_and_fail(module, tmpsrc, "Source %s not readable" % (tmpsrc))
    md5sum_src = module.md5(tmpsrc)

    # check if there is no dest file
    if os.path.exists(dest):
        # raise an error if copy has no permission on dest
        if not os.access(dest, os.W_OK):
            _discard_and_fail(module, tmpsrc, "Destination %s not writable" % (dest))
        if not os.access(dest, os.R_OK):
            _discard_and_fail(module, tmpsrc, "Destination %s not readable" % (dest))
        md5sum_dest = module.md5(dest)
    else:
        if not os.access(os.path.dirname(dest), os.W_OK):
            _discard_and_fail(module, tmpsrc, "Destination %s not writable" % (os.path.dirname(dest)))

    if md5sum_src != md5sum_dest:
        try:
            shutil.copyfile(tmpsrc, dest)
        except Exception:
            err = sys.exc_info()[1]
            _discard_and_fail(module, tmpsrc, "failed to copy %s to %s: %s" % (tmpsrc, dest, str(err)))
        changed = True
    else:
        changed = False

    os.remove(tmpsrc)

    # allow file attribute changes
    module.params['path'] = dest
    file_args = module.load_file_common_arguments(module.params)
    file_args['path'] = dest
    changed = module.set_file_attributes_if_different(file_args, changed)

    # Mission complete
    # (src reports the temporary path, which has already been removed above)
    module.exit_json(url=url, dest=dest, src=tmpsrc, md5sum=md5sum_src,
        changed=changed, msg=info.get('msg', ''))
|
2012-07-20 12:57:15 +02:00
|
|
|
|
|
|
|
# this is magic, see lib/ansible/module_common.py
# The marker on the next line must be kept exactly as written. Names this file
# uses without defining or importing them (AnsibleModule, BOOLEANS) presumably
# come from whatever is substituted for the marker -- confirm in module_common.py.
#<<INCLUDE_ANSIBLE_MODULE_COMMON>>
# Entry point: main() is called unconditionally when this file is executed.
main()
|