"""distutils.archive_util

Utility functions for creating archive files (tarballs, zip files,
that sort of thing)."""
5
Greg Wardaebf7062000-04-04 02:05:59 +00006__revision__ = "$Id$"
7
8import os
Tarek Ziadé9e5d2dc2009-05-28 12:53:54 +00009from warnings import warn
10import sys
11
Greg Wardaebf7062000-04-04 02:05:59 +000012from distutils.errors import DistutilsExecError
13from distutils.spawn import spawn
Greg Ward04e25a12000-08-22 01:48:54 +000014from distutils.dir_util import mkpath
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +000015from distutils import log
Greg Wardaebf7062000-04-04 02:05:59 +000016
# The pwd and grp modules cannot be imported on every platform.  When an
# import fails, the corresponding lookup function is set to None so that
# _get_uid() and _get_gid() can detect the missing support and return None.
try:
    from pwd import getpwnam
except ImportError:
    getpwnam = None

try:
    from grp import getgrnam
except ImportError:
    getgrnam = None
26
def _get_gid(name):
    """Returns a gid, given a group name.

    Returns None when 'name' is None, when getgrnam is unavailable (set to
    None at module level), or when no group called 'name' is found.
    """
    if getgrnam is None or name is None:
        return None
    try:
        result = getgrnam(name)
    except KeyError:
        # getgrnam reports an unknown group name with KeyError
        return None
    if result is None:
        return None
    # the gid is the third field of the group entry
    return result[2]
38
def _get_uid(name):
    """Returns an uid, given a user name.

    Returns None when 'name' is None, when getpwnam is unavailable (set to
    None at module level), or when no user called 'name' is found.
    """
    if getpwnam is None or name is None:
        return None
    try:
        result = getpwnam(name)
    except KeyError:
        # getpwnam reports an unknown user name with KeyError
        return None
    if result is None:
        return None
    # the uid is the third field of the password entry
    return result[2]
50
def make_tarball(base_name, base_dir, compress="gzip", verbose=0, dry_run=0,
                 owner=None, group=None):
    """Create a (possibly compressed) tar file from all the files under
    'base_dir'.

    'compress' must be "gzip" (the default), "compress", "bzip2", or None.
    (compress will be deprecated in Python 3.2)

    'owner' and 'group' can be used to define an owner and a group for the
    archive that is being built. If not provided, the current owner and group
    will be used.

    'verbose' is accepted but not used by this function.  When 'dry_run'
    is true no tar file is written; 'dry_run' is also forwarded to
    mkpath() and spawn().

    The output tar file will be named 'base_name' + ".tar", possibly plus
    the appropriate compression extension (".gz", ".bz2" or ".Z").

    Raises ValueError if 'compress' is not one of the accepted values.

    Returns the output filename.
    """
    # Mode suffix handed to tarfile.open().  "compress" maps to '' because
    # that compression is applied afterwards by an external program, so the
    # tar file itself is written uncompressed.
    tar_compression = {'gzip': 'gz', 'bzip2': 'bz2', None: '', 'compress': ''}
    compress_ext = {'gzip': '.gz', 'bzip2': '.bz2', 'compress': '.Z'}

    if compress is not None and compress not in compress_ext:
        raise ValueError(
            "bad value for 'compress': must be None, 'gzip', 'bzip2' "
            "or 'compress'")

    archive_name = base_name + '.tar'
    if compress != 'compress':
        # the ".Z" extension is only added once the external program ran
        archive_name += compress_ext.get(compress, '')

    mkpath(os.path.dirname(archive_name), dry_run=dry_run)

    # creating the tarball
    import tarfile  # late import so Python build itself doesn't break

    log.info('Creating tar archive')

    uid = _get_uid(owner)
    gid = _get_gid(group)

    def _set_uid_gid(tarinfo):
        # Override ownership only for the ids that could be resolved;
        # otherwise the values tarfile recorded are left untouched.
        if gid is not None:
            tarinfo.gid = gid
            tarinfo.gname = group
        if uid is not None:
            tarinfo.uid = uid
            tarinfo.uname = owner
        return tarinfo

    if not dry_run:
        tar = tarfile.open(archive_name, 'w|%s' % tar_compression[compress])
        try:
            tar.add(base_dir, filter=_set_uid_gid)
        finally:
            tar.close()

    # compression using `compress`
    if compress == 'compress':
        warn("'compress' will be deprecated.", PendingDeprecationWarning)
        # the option varies depending on the platform
        compressed_name = archive_name + compress_ext[compress]
        if sys.platform == 'win32':
            cmd = [compress, archive_name, compressed_name]
        else:
            cmd = [compress, '-f', archive_name]
        spawn(cmd, dry_run=dry_run)
        return compressed_name

    return archive_name
Greg Wardaebf7062000-04-04 02:05:59 +0000120
def make_zipfile(base_name, base_dir, verbose=0, dry_run=0):
    """Create a zip file from all the files under 'base_dir'.

    The output zip file will be named 'base_name' + ".zip".  Uses either the
    "zipfile" Python module (if available) or the InfoZIP "zip" utility
    (if installed and found on the default search path).  If neither tool is
    available, raises DistutilsExecError.  Returns the name of the output zip
    file.

    'verbose' only affects the options passed to the external "zip"
    utility.  When 'dry_run' is true no archive is written; 'dry_run' is
    also forwarded to mkpath() and spawn().
    """
    try:
        import zipfile
    except ImportError:
        zipfile = None

    zip_filename = base_name + ".zip"
    mkpath(os.path.dirname(zip_filename), dry_run=dry_run)

    # If zipfile module is not available, try spawning an external
    # 'zip' command.
    if zipfile is None:
        if verbose:
            zipoptions = "-r"
        else:
            zipoptions = "-rq"

        try:
            spawn(["zip", zipoptions, zip_filename, base_dir],
                  dry_run=dry_run)
        except DistutilsExecError:
            # XXX really should distinguish between "couldn't find
            # external 'zip' command" and "zip failed".
            raise DistutilsExecError(
                ("unable to create zip file '%s': "
                 "could neither import the 'zipfile' module nor "
                 "find a standalone zip utility") % zip_filename)

    else:
        log.info("creating '%s' and adding '%s' to it",
                 zip_filename, base_dir)

        if not dry_run:
            archive = zipfile.ZipFile(zip_filename, "w",
                                      compression=zipfile.ZIP_DEFLATED)
            # close the archive even if adding a file fails part-way
            try:
                for dirpath, dirnames, filenames in os.walk(base_dir):
                    for name in filenames:
                        path = os.path.normpath(os.path.join(dirpath, name))
                        # only entries that are files are stored
                        if os.path.isfile(path):
                            archive.write(path, path)
                            log.info("adding '%s'", path)
            finally:
                archive.close()

    return zip_filename
174
# Maps an archive format name to a 3-tuple:
#   (function that builds the archive,
#    list of (keyword, value) pairs passed to that function,
#    description of the format)
ARCHIVE_FORMATS = {
    'gztar': (make_tarball, [('compress', 'gzip')], "gzip'ed tar-file"),
    'bztar': (make_tarball, [('compress', 'bzip2')], "bzip2'ed tar-file"),
    'ztar':  (make_tarball, [('compress', 'compress')], "compressed tar file"),
    'tar':   (make_tarball, [('compress', None)], "uncompressed tar file"),
    'zip':   (make_zipfile, [], "ZIP file"),
    }
182
def check_archive_formats(formats):
    """Returns the first format from the 'formats' list that is unknown.

    A format is unknown when it is not a key of ARCHIVE_FORMATS.
    If all formats are known, returns None
    """
    for name in formats:
        if name not in ARCHIVE_FORMATS:
            return name
    return None
Greg Warddb807542000-04-22 03:09:56 +0000192
def make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,
                 dry_run=0, owner=None, group=None):
    """Create an archive file (eg. zip or tar).

    'base_name' is the name of the file to create, minus any format-specific
    extension; 'format' is the archive format: one of the keys of
    ARCHIVE_FORMATS ("zip", "tar", "ztar", "gztar" or "bztar").

    'root_dir' is a directory that will be the root directory of the
    archive; ie. we typically chdir into 'root_dir' before creating the
    archive.  'base_dir' is the directory where we start archiving from;
    ie. 'base_dir' will be the common prefix of all files and
    directories in the archive.  'root_dir' and 'base_dir' both default
    to the current directory.  Returns the name of the archive file.

    'owner' and 'group' are used when creating a tar archive. By default,
    uses the current owner and group.

    'verbose' is accepted but is not forwarded to the archive function;
    'dry_run' is forwarded to it.

    Raises ValueError if 'format' is not a key of ARCHIVE_FORMATS.
    """
    # Resolve the format before touching the working directory, so that an
    # unknown format cannot leave the process sitting in 'root_dir'.
    try:
        format_info = ARCHIVE_FORMATS[format]
    except KeyError:
        raise ValueError("unknown archive format '%s'" % format)

    save_cwd = os.getcwd()
    if root_dir is not None:
        log.debug("changing into '%s'", root_dir)
        # make the output path absolute before the working directory changes
        base_name = os.path.abspath(base_name)
        if not dry_run:
            os.chdir(root_dir)

    if base_dir is None:
        base_dir = os.curdir

    kwargs = {'dry_run': dry_run}

    func = format_info[0]
    for arg, val in format_info[1]:
        kwargs[arg] = val

    # make_zipfile() does not take 'owner' and 'group'
    if format != 'zip':
        kwargs['owner'] = owner
        kwargs['group'] = group

    try:
        filename = func(base_name, base_dir, **kwargs)
    finally:
        if root_dir is not None:
            log.debug("changing back to '%s'", save_cwd)
            os.chdir(save_cwd)

    return filename