1
0
Fork 0
mirror of https://github.com/ansible-collections/community.general.git synced 2024-09-14 20:13:21 +02:00

Revert PR #3575 since it causes problems related to exclude patterns (#3767)

* Revert PR #3575 since it causes problems related to exclude patterns

By using a different method for getting archive filelists, and extracting we introduced new problems related to excluding based on gtar patterns.

As a result files that would be excluded by gtar, would still be in the filelist. Implementing our own gtar compatible pattern exclusion mechanism is near to impossible (believe me, we looked at it...). The best way is to look at the original problem and deal with that, and ensure that extraction and filelists are done with the exact same tool and exact same options.

The solution is to decode the octal unicode representation in gtar's output back to unicode. Since gtar has no problem extracting these files in LANG=C, we simply has to compensate for it.

This reverts #3575 and fixes #11348.

* Implement codecs.escape_decode() instead of decode("string_escape") for python3
This commit is contained in:
Dag Wieers 2016-07-06 23:40:48 +02:00 committed by Matt Clay
parent a8059c68d0
commit 855ca9b204

View file

@ -5,7 +5,6 @@
# (c) 2013, Dylan Martin <dmartin@seattlecentral.edu> # (c) 2013, Dylan Martin <dmartin@seattlecentral.edu>
# (c) 2015, Toshio Kuratomi <tkuratomi@ansible.com> # (c) 2015, Toshio Kuratomi <tkuratomi@ansible.com>
# (c) 2016, Dag Wieers <dag@wieers.com> # (c) 2016, Dag Wieers <dag@wieers.com>
# (c) 2016, Virgil Dupras <hsoft@hardcoded.net>
# #
# This file is part of Ansible # This file is part of Ansible
# #
@ -123,9 +122,8 @@ import grp
import datetime import datetime
import time import time
import binascii import binascii
import codecs
from zipfile import ZipFile, BadZipfile from zipfile import ZipFile, BadZipfile
import tarfile
import subprocess
# String from tar that shows the tar contents are different from the # String from tar that shows the tar contents are different from the
# filesystem # filesystem
@ -552,23 +550,25 @@ class TgzArchive(object):
self.compress_mode = 'gz' self.compress_mode = 'gz'
self._files_in_archive = [] self._files_in_archive = []
def _get_tar_fileobj(self):
"""Returns a file object that can be read by ``tarfile.open()``."""
return open(self.src, 'rb')
@property @property
def files_in_archive(self, force_refresh=False): def files_in_archive(self, force_refresh=False):
if self._files_in_archive and not force_refresh: if self._files_in_archive and not force_refresh:
return self._files_in_archive return self._files_in_archive
# The use of Python's tarfile module here allows us to easily avoid tricky file encoding cmd = '%s -t%s' % (self.cmd_path, self.zipflag)
# problems. Ref #11348 if self.opts:
try: cmd += ' ' + ' '.join(self.opts)
tf = tarfile.open(fileobj=self._get_tar_fileobj(), mode='r:%s' % self.compress_mode) if self.excludes:
except Exception: cmd += ' --exclude="' + '" --exclude="'.join(self.excludes) + '"'
cmd += ' -f "%s"' % self.src
rc, out, err = self.module.run_command(cmd)
if rc != 0:
raise UnarchiveError('Unable to list files in the archive') raise UnarchiveError('Unable to list files in the archive')
for filename in tf.getnames(): for filename in out.splitlines():
# Compensate for locale-related problems in gtar output (octal unicode representation) #11348
# filename = filename.decode('string_escape')
filename = codecs.escape_decode(filename)[0]
if filename and filename not in self.excludes: if filename and filename not in self.excludes:
self._files_in_archive.append(filename) self._files_in_archive.append(filename)
return self._files_in_archive return self._files_in_archive
@ -673,19 +673,6 @@ class TarXzArchive(TgzArchive):
self.zipflag = 'J' self.zipflag = 'J'
self.compress_mode = '' self.compress_mode = ''
def _get_tar_fileobj(self):
# Python's tarfile module doesn't support xz compression so we have to manually uncompress
# it first.
xz_bin_path = self.module.get_bin_path('xz')
xz_stdout = tempfile.TemporaryFile()
# we don't use self.module.run_command() to avoid loading the whole archive in memory.
cmd = subprocess.Popen([xz_bin_path, '-dc', self.src], stdout=xz_stdout)
rc = cmd.wait()
if rc != 0:
raise UnarchiveError("Could not uncompress with xz")
xz_stdout.seek(0)
return xz_stdout
# try handlers in order and return the one that works or bail if none work # try handlers in order and return the one that works or bail if none work
def pick_handler(src, dest, file_args, module): def pick_handler(src, dest, file_args, module):