• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1"""distutils.archive_util
2
3Utility functions for creating archive files (tarballs, zip files,
4that sort of thing)."""
5
6__revision__ = "$Id$"
7
8import os
9from warnings import warn
10import sys
11
12from distutils.errors import DistutilsExecError
13from distutils.spawn import spawn
14from distutils.dir_util import mkpath
15from distutils import log
16
17try:
18    from pwd import getpwnam
19except ImportError:
20    getpwnam = None
21
22try:
23    from grp import getgrnam
24except ImportError:
25    getgrnam = None
26
27def _get_gid(name):
28    """Returns a gid, given a group name."""
29    if getgrnam is None or name is None:
30        return None
31    try:
32        result = getgrnam(name)
33    except KeyError:
34        result = None
35    if result is not None:
36        return result[2]
37    return None
38
39def _get_uid(name):
40    """Returns an uid, given a user name."""
41    if getpwnam is None or name is None:
42        return None
43    try:
44        result = getpwnam(name)
45    except KeyError:
46        result = None
47    if result is not None:
48        return result[2]
49    return None
50
51def make_tarball(base_name, base_dir, compress="gzip", verbose=0, dry_run=0,
52                 owner=None, group=None):
53    """Create a (possibly compressed) tar file from all the files under
54    'base_dir'.
55
56    'compress' must be "gzip" (the default), "compress", "bzip2", or None.
57    (compress will be deprecated in Python 3.2)
58
59    'owner' and 'group' can be used to define an owner and a group for the
60    archive that is being built. If not provided, the current owner and group
61    will be used.
62
63    The output tar file will be named 'base_dir' +  ".tar", possibly plus
64    the appropriate compression extension (".gz", ".bz2" or ".Z").
65
66    Returns the output filename.
67    """
68    tar_compression = {'gzip': 'gz', 'bzip2': 'bz2', None: '', 'compress': ''}
69    compress_ext = {'gzip': '.gz', 'bzip2': '.bz2', 'compress': '.Z'}
70
71    # flags for compression program, each element of list will be an argument
72    if compress is not None and compress not in compress_ext.keys():
73        raise ValueError, \
74              ("bad value for 'compress': must be None, 'gzip', 'bzip2' "
75               "or 'compress'")
76
77    archive_name = base_name + '.tar'
78    if compress != 'compress':
79        archive_name += compress_ext.get(compress, '')
80
81    mkpath(os.path.dirname(archive_name), dry_run=dry_run)
82
83    # creating the tarball
84    import tarfile  # late import so Python build itself doesn't break
85
86    log.info('Creating tar archive')
87
88    uid = _get_uid(owner)
89    gid = _get_gid(group)
90
91    def _set_uid_gid(tarinfo):
92        if gid is not None:
93            tarinfo.gid = gid
94            tarinfo.gname = group
95        if uid is not None:
96            tarinfo.uid = uid
97            tarinfo.uname = owner
98        return tarinfo
99
100    if not dry_run:
101        tar = tarfile.open(archive_name, 'w|%s' % tar_compression[compress])
102        try:
103            tar.add(base_dir, filter=_set_uid_gid)
104        finally:
105            tar.close()
106
107    # compression using `compress`
108    if compress == 'compress':
109        warn("'compress' will be deprecated.", PendingDeprecationWarning)
110        # the option varies depending on the platform
111        compressed_name = archive_name + compress_ext[compress]
112        if sys.platform == 'win32':
113            cmd = [compress, archive_name, compressed_name]
114        else:
115            cmd = [compress, '-f', archive_name]
116        spawn(cmd, dry_run=dry_run)
117        return compressed_name
118
119    return archive_name
120
121def make_zipfile(base_name, base_dir, verbose=0, dry_run=0):
122    """Create a zip file from all the files under 'base_dir'.
123
124    The output zip file will be named 'base_name' + ".zip".  Uses either the
125    "zipfile" Python module (if available) or the InfoZIP "zip" utility
126    (if installed and found on the default search path).  If neither tool is
127    available, raises DistutilsExecError.  Returns the name of the output zip
128    file.
129    """
130    try:
131        import zipfile
132    except ImportError:
133        zipfile = None
134
135    zip_filename = base_name + ".zip"
136    mkpath(os.path.dirname(zip_filename), dry_run=dry_run)
137
138    # If zipfile module is not available, try spawning an external
139    # 'zip' command.
140    if zipfile is None:
141        if verbose:
142            zipoptions = "-r"
143        else:
144            zipoptions = "-rq"
145
146        try:
147            spawn(["zip", zipoptions, zip_filename, base_dir],
148                  dry_run=dry_run)
149        except DistutilsExecError:
150            # XXX really should distinguish between "couldn't find
151            # external 'zip' command" and "zip failed".
152            raise DistutilsExecError, \
153                  ("unable to create zip file '%s': "
154                   "could neither import the 'zipfile' module nor "
155                   "find a standalone zip utility") % zip_filename
156
157    else:
158        log.info("creating '%s' and adding '%s' to it",
159                 zip_filename, base_dir)
160
161        if not dry_run:
162            zip = zipfile.ZipFile(zip_filename, "w",
163                                  compression=zipfile.ZIP_DEFLATED)
164
165            for dirpath, dirnames, filenames in os.walk(base_dir):
166                for name in filenames:
167                    path = os.path.normpath(os.path.join(dirpath, name))
168                    if os.path.isfile(path):
169                        zip.write(path, path)
170                        log.info("adding '%s'" % path)
171            zip.close()
172
173    return zip_filename
174
175ARCHIVE_FORMATS = {
176    'gztar': (make_tarball, [('compress', 'gzip')], "gzip'ed tar-file"),
177    'bztar': (make_tarball, [('compress', 'bzip2')], "bzip2'ed tar-file"),
178    'ztar':  (make_tarball, [('compress', 'compress')], "compressed tar file"),
179    'tar':   (make_tarball, [('compress', None)], "uncompressed tar file"),
180    'zip':   (make_zipfile, [],"ZIP file")
181    }
182
183def check_archive_formats(formats):
184    """Returns the first format from the 'format' list that is unknown.
185
186    If all formats are known, returns None
187    """
188    for format in formats:
189        if format not in ARCHIVE_FORMATS:
190            return format
191    return None
192
193def make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,
194                 dry_run=0, owner=None, group=None):
195    """Create an archive file (eg. zip or tar).
196
197    'base_name' is the name of the file to create, minus any format-specific
198    extension; 'format' is the archive format: one of "zip", "tar", "ztar",
199    or "gztar".
200
201    'root_dir' is a directory that will be the root directory of the
202    archive; ie. we typically chdir into 'root_dir' before creating the
203    archive.  'base_dir' is the directory where we start archiving from;
204    ie. 'base_dir' will be the common prefix of all files and
205    directories in the archive.  'root_dir' and 'base_dir' both default
206    to the current directory.  Returns the name of the archive file.
207
208    'owner' and 'group' are used when creating a tar archive. By default,
209    uses the current owner and group.
210    """
211    save_cwd = os.getcwd()
212    if root_dir is not None:
213        log.debug("changing into '%s'", root_dir)
214        base_name = os.path.abspath(base_name)
215        if not dry_run:
216            os.chdir(root_dir)
217
218    if base_dir is None:
219        base_dir = os.curdir
220
221    kwargs = {'dry_run': dry_run}
222
223    try:
224        format_info = ARCHIVE_FORMATS[format]
225    except KeyError:
226        raise ValueError, "unknown archive format '%s'" % format
227
228    func = format_info[0]
229    for arg, val in format_info[1]:
230        kwargs[arg] = val
231
232    if format != 'zip':
233        kwargs['owner'] = owner
234        kwargs['group'] = group
235
236    try:
237        filename = func(base_name, base_dir, **kwargs)
238    finally:
239        if root_dir is not None:
240            log.debug("changing back to '%s'", save_cwd)
241            os.chdir(save_cwd)
242
243    return filename
244