blob: 6688119bde4c5e5efdcf255abdec18f4232ecf42 [file] [log] [blame]
Tarek Ziadéc3399782010-02-23 05:39:18 +00001"""Utility functions for copying and archiving files and directory trees.
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00002
Guido van Rossum959fa011999-08-18 20:03:17 +00003XXX The functions here don't copy the resource fork or other metadata on Mac.
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00004
5"""
Guido van Rossumc6360141990-10-13 19:23:40 +00006
Guido van Rossumc96207a1992-03-31 18:55:40 +00007import os
Guido van Rossum83c03e21999-02-23 23:07:51 +00008import sys
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00009import stat
Brett Cannon1c3fa182004-06-19 21:11:35 +000010from os.path import abspath
Georg Brandl2ee470f2008-07-16 12:55:28 +000011import fnmatch
Tarek Ziadé396fad72010-02-23 05:30:31 +000012from warnings import warn
13import collections
Antoine Pitrou910bd512010-03-22 20:11:09 +000014import errno
Tarek Ziadé396fad72010-02-23 05:30:31 +000015
16try:
17 from pwd import getpwnam
18except ImportError:
19 getpwnam = None
20
21try:
22 from grp import getgrnam
23except ImportError:
24 getgrnam = None
Guido van Rossumc6360141990-10-13 19:23:40 +000025
# Names exported by ``from shutil import *``.  ``ignore_patterns`` is listed
# because it is the helper meant to be passed as copytree()'s ``ignore``
# argument and is therefore part of the public interface.
__all__ = ["copyfileobj", "copyfile", "copymode", "copystat", "copy", "copy2",
           "copytree", "move", "rmtree", "Error", "SpecialFileError",
           "ExecError", "make_archive", "get_archive_formats",
           "register_archive_format", "unregister_archive_format",
           "ignore_patterns"]
Martin v. Löwise9ce0b02002-10-07 13:23:24 +000030
class Error(EnvironmentError):
    """Generic failure raised by copyfile(), copytree() and move()."""
Guido van Rossumc6360141990-10-13 19:23:40 +000033
class SpecialFileError(EnvironmentError):
    """Signals that an operation (such as copying) was attempted on a
    special file (such as a named pipe) that does not support it."""
37
class ExecError(EnvironmentError):
    """Signals that an external command could not be executed."""
40
# WindowsError is only a builtin on Windows.  Probe for it and fall back to
# None elsewhere so later code can test ``WindowsError is not None`` before
# using it in an isinstance() check.
try:
    WindowsError
except NameError:
    WindowsError = None
45
def copyfileobj(fsrc, fdst, length=16*1024):
    """Copy the contents of file-like object fsrc to file-like object fdst.

    Data is transferred in chunks of at most `length` units, obtained with
    fsrc.read(length), until a read returns an empty result.
    """
    while True:
        chunk = fsrc.read(length)
        if not chunk:
            return
        fdst.write(chunk)
53
def _samefile(src, dst):
    """Return True if src and dst refer to the same file.

    Uses os.path.samefile() where the platform provides it (an OSError from
    it, e.g. for a missing path, counts as "not the same").  Otherwise the
    normalised absolute pathnames are compared.
    """
    # Macintosh, Unix.
    samefile = getattr(os.path, 'samefile', None)
    if samefile is not None:
        try:
            return samefile(src, dst)
        except OSError:
            return False

    # All other platforms: check for same pathname.
    def _canonical(path):
        return os.path.normcase(os.path.abspath(path))

    return _canonical(src) == _canonical(dst)
Tim Peters495ad3c2001-01-15 01:36:40 +000065
def copyfile(src, dst):
    """Copy data from src to dst.

    src and dst are path names.  dst is opened for binary writing, so an
    existing file is overwritten.

    Raises Error if src and dst are the same file, and SpecialFileError if
    either of them is a named pipe.
    """
    if _samefile(src, dst):
        raise Error("`%s` and `%s` are the same file" % (src, dst))

    for fn in [src, dst]:
        try:
            st = os.stat(fn)
        except OSError:
            # File most likely does not exist
            pass
        else:
            # XXX What about other special files? (sockets, devices...)
            if stat.S_ISFIFO(st.st_mode):
                raise SpecialFileError("`%s` is a named pipe" % fn)

    # Nested context managers guarantee that fsrc is closed even when
    # closing fdst fails (e.g. the final flush hits a full disk).
    with open(src, 'rb') as fsrc:
        with open(dst, 'wb') as fdst:
            copyfileobj(fsrc, fdst)
Guido van Rossumc6360141990-10-13 19:23:40 +000092
def copymode(src, dst):
    """Copy the permission bits of src onto dst.

    Does nothing on platforms where os.chmod is unavailable.
    """
    if not hasattr(os, 'chmod'):
        return
    permissions = stat.S_IMODE(os.stat(src).st_mode)
    os.chmod(dst, permissions)
Guido van Rossumc6360141990-10-13 19:23:40 +000099
def copystat(src, dst):
    """Copy stat information (atime, mtime, mode bits, flags) from src to dst.

    Each piece is copied only when the platform offers the corresponding
    os function.  A failure to set flags is ignored when the error is
    EOPNOTSUPP; any other OSError propagates.
    """
    st = os.stat(src)
    if hasattr(os, 'utime'):
        os.utime(dst, (st.st_atime, st.st_mtime))
    if hasattr(os, 'chmod'):
        os.chmod(dst, stat.S_IMODE(st.st_mode))
    if not (hasattr(os, 'chflags') and hasattr(st, 'st_flags')):
        return
    try:
        os.chflags(dst, st.st_flags)
    except OSError as why:
        # Only "operation not supported" is tolerated.
        tolerated = (hasattr(errno, 'EOPNOTSUPP') and
                     why.errno == errno.EOPNOTSUPP)
        if not tolerated:
            raise
Guido van Rossum9d0a3df1997-04-29 14:45:19 +0000115
def copy(src, dst):
    """Copy file data and permission bits, like "cp src dst".

    When dst is an existing directory the file is copied into it under
    the base name of src.

    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    copyfile(src, target)
    copymode(src, target)
Guido van Rossumc6360141990-10-13 19:23:40 +0000126
def copy2(src, dst):
    """Copy file data and all stat info, like "cp -p src dst".

    When dst is an existing directory the file is copied into it under
    the base name of src.

    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    copyfile(src, target)
    copystat(src, target)
Guido van Rossumc6360141990-10-13 19:23:40 +0000137
def ignore_patterns(*patterns):
    """Build a callable suitable for copytree()'s ignore parameter.

    patterns are glob-style patterns; the returned callable takes
    (path, names) and returns the set of names matching any pattern."""
    def _ignore_patterns(path, names):
        return {name
                for pattern in patterns
                for name in fnmatch.filter(names, pattern)}
    return _ignore_patterns
149
def copytree(src, dst, symlinks=False, ignore=None):
    """Recursively copy a directory tree using copy2().

    The destination directory must not already exist.
    If exception(s) occur, an Error is raised with a list of reasons;
    each reason recorded by this function is a
    (srcname, dstname, message) tuple.

    If the optional symlinks flag is true, symbolic links in the
    source tree result in symbolic links in the destination tree; if
    it is false, the contents of the files pointed to by symbolic
    links are copied.

    The optional ignore argument is a callable. If given, it
    is called with the `src` parameter, which is the directory
    being visited by copytree(), and `names` which is the list of
    `src` contents, as returned by os.listdir():

        callable(src, names) -> ignored_names

    Since copytree() is called recursively, the callable will be
    called once for each directory that is copied. It returns a
    list of names relative to the `src` directory that should
    not be copied.

    XXX Consider this example code rather than the ultimate tool.

    """
    names = os.listdir(src)
    if ignore is not None:
        ignored_names = ignore(src, names)
    else:
        ignored_names = set()

    os.makedirs(dst)
    errors = []
    for name in names:
        if name in ignored_names:
            continue
        srcname = os.path.join(src, name)
        dstname = os.path.join(dst, name)
        try:
            if symlinks and os.path.islink(srcname):
                linkto = os.readlink(srcname)
                os.symlink(linkto, dstname)
            elif os.path.isdir(srcname):
                copytree(srcname, dstname, symlinks, ignore)
            else:
                # Will raise a SpecialFileError for unsupported file types
                copy2(srcname, dstname)
        # catch the Error from the recursive copytree so that we can
        # continue with other files
        except Error as err:
            errors.extend(err.args[0])
        except EnvironmentError as why:
            errors.append((srcname, dstname, str(why)))
    try:
        copystat(src, dst)
    except OSError as why:
        if WindowsError is not None and isinstance(why, WindowsError):
            # Copying file access times may fail on Windows
            pass
        else:
            # append, not extend: the failure must be recorded as ONE
            # (src, dst, message) tuple like every other entry.
            errors.append((src, dst, str(why)))
    if errors:
        raise Error(errors)
Guido van Rossumd7673291998-02-06 21:38:09 +0000214
def rmtree(path, ignore_errors=False, onerror=None):
    """Recursively delete a directory tree.

    With ignore_errors true, failures are silently skipped.  Otherwise, if
    onerror is given, it is called as onerror(func, path, exc_info) where
    func is the function that failed (os.path.islink, os.listdir,
    os.remove or os.rmdir), path is the argument it was called with, and
    exc_info is the tuple returned by sys.exc_info().  With ignore_errors
    false and onerror None, the exception is re-raised.

    """
    if ignore_errors:
        def onerror(*args):
            pass
    elif onerror is None:
        def onerror(*args):
            # Called from inside an except block: re-raise the active error.
            raise
    try:
        if os.path.islink(path):
            # symlinks to directories are forbidden, see bug #1669
            raise OSError("Cannot call rmtree on a symbolic link")
    except OSError:
        onerror(os.path.islink, path, sys.exc_info())
        # can't continue even if onerror hook returns
        return
    try:
        entries = os.listdir(path)
    except os.error:
        entries = []
        onerror(os.listdir, path, sys.exc_info())
    for entry in entries:
        child = os.path.join(path, entry)
        try:
            is_dir = stat.S_ISDIR(os.lstat(child).st_mode)
        except os.error:
            # An entry that cannot be stat'ed is handled like a plain file.
            is_dir = False
        if is_dir:
            rmtree(child, ignore_errors, onerror)
            continue
        try:
            os.remove(child)
        except os.error:
            onerror(os.remove, child, sys.exc_info())
    try:
        os.rmdir(path)
    except os.error:
        onerror(os.rmdir, path, sys.exc_info())
Guido van Rossumd7673291998-02-06 21:38:09 +0000262
Martin v. Löwise9ce0b02002-10-07 13:23:24 +0000263
def _basename(path):
    """Return the last component of path, ignoring trailing separators.

    Unlike os.path.basename(), this yields the final component even when
    the path ends with a separator, as directory paths often do.
    """
    trimmed = path.rstrip(os.path.sep)
    return os.path.basename(trimmed)
268
def move(src, dst):
    """Recursively move a file or directory to another location, in the
    spirit of the Unix "mv" command.

    If dst is an existing directory (or a symlink to one), src is moved
    inside it; Error is raised if an entry with src's base name already
    exists there.

    If dst exists but is not a directory, it may be overwritten depending
    on os.rename() semantics.

    os.rename() is tried first.  If it fails with OSError, src is copied
    to the destination and then removed: directories via copytree() (with
    symlinks preserved) followed by rmtree(), anything else via copy2()
    followed by os.unlink().  Moving a directory into itself raises Error.
    A lot more could be done here... A look at a mv.c shows a lot of
    the issues this implementation glosses over.

    """
    target = dst
    if os.path.isdir(dst):
        target = os.path.join(dst, _basename(src))
        if os.path.exists(target):
            raise Error("Destination path '%s' already exists" % target)
    try:
        os.rename(src, target)
    except OSError:
        if not os.path.isdir(src):
            # Plain file: copy with metadata, then drop the original.
            copy2(src, target)
            os.unlink(src)
            return
        if _destinsrc(src, dst):
            raise Error("Cannot move a directory '%s' into itself '%s'." % (src, dst))
        copytree(src, target, symlinks=True)
        rmtree(src)
Brett Cannon1c3fa182004-06-19 21:11:35 +0000302
def _destinsrc(src, dst):
    """Return True if dst is src itself or lies somewhere below it.

    Both paths are made absolute and given a trailing separator before the
    prefix test, so that "a" is not taken to contain "ab".
    """
    sep = os.path.sep

    def _as_dir(path):
        full = abspath(path)
        return full if full.endswith(sep) else full + sep

    return _as_dir(dst).startswith(_as_dir(src))
Tarek Ziadé396fad72010-02-23 05:30:31 +0000311
def _get_gid(name):
    """Return the gid for group `name`, or None if it cannot be resolved.

    None is returned when getgrnam is unavailable, when name is None, or
    when the group is unknown.
    """
    if getgrnam is None or name is None:
        return None
    try:
        entry = getgrnam(name)
    except KeyError:
        return None
    if entry is None:
        return None
    return entry[2]
323
def _get_uid(name):
    """Return the uid for user `name`, or None if it cannot be resolved.

    None is returned when getpwnam is unavailable, when name is None, or
    when the user is unknown.
    """
    if getpwnam is None or name is None:
        return None
    try:
        entry = getpwnam(name)
    except KeyError:
        return None
    if entry is None:
        return None
    return entry[2]
335
def _make_tarball(base_name, base_dir, compress="gzip", verbose=0, dry_run=0,
                  owner=None, group=None, logger=None):
    """Create a (possibly compressed) tar file from all the files under
    'base_dir'.

    'compress' must be "gzip" (the default), "compress", "bzip2", or None;
    any other value raises ValueError.
    (compress will be deprecated in Python 3.2)

    'owner' and 'group' can be used to define an owner and a group for the
    archive that is being built. If not provided, the current owner and group
    will be used.

    'verbose' is accepted but not used by this function.  If 'dry_run' is
    true, neither the archive nor its parent directory is created.
    'logger', if not None, receives info() messages about progress.

    The output tar file will be named 'base_name' + ".tar", possibly plus
    the appropriate compression extension (".gz", ".bz2" or ".Z").

    Returns the output filename.
    """
    tar_compression = {'gzip': 'gz', 'bzip2': 'bz2', None: '', 'compress': ''}
    compress_ext = {'gzip': '.gz', 'bzip2': '.bz2', 'compress': '.Z'}

    # flags for compression program, each element of list will be an argument
    if compress is not None and compress not in compress_ext:
        raise ValueError("bad value for 'compress': must be None, 'gzip', "
                         "'bzip2' or 'compress'")

    archive_name = base_name + '.tar'
    if compress != 'compress':
        archive_name += compress_ext.get(compress, '')

    archive_dir = os.path.dirname(archive_name)
    # An empty dirname means "current directory": nothing to create, and
    # os.makedirs('') would fail.
    if archive_dir and not os.path.exists(archive_dir):
        if logger is not None:
            logger.info("creating %s", archive_dir)
        if not dry_run:
            os.makedirs(archive_dir)

    # creating the tarball
    import tarfile  # late import so Python build itself doesn't break

    if logger is not None:
        logger.info('Creating tar archive')

    uid = _get_uid(owner)
    gid = _get_gid(group)

    def _set_uid_gid(tarinfo):
        # Override ownership only for the ids that could be resolved.
        if gid is not None:
            tarinfo.gid = gid
            tarinfo.gname = group
        if uid is not None:
            tarinfo.uid = uid
            tarinfo.uname = owner
        return tarinfo

    if not dry_run:
        tar = tarfile.open(archive_name, 'w|%s' % tar_compression[compress])
        try:
            tar.add(base_dir, filter=_set_uid_gid)
        finally:
            tar.close()

    # compression using `compress`
    # XXX this block will be removed in Python 3.2
    if compress == 'compress':
        warn("'compress' will be deprecated.", PendingDeprecationWarning)
        # the option varies depending on the platform
        compressed_name = archive_name + compress_ext[compress]
        if sys.platform == 'win32':
            cmd = [compress, archive_name, compressed_name]
        else:
            cmd = [compress, '-f', archive_name]
        from distutils.spawn import spawn
        spawn(cmd, dry_run=dry_run)
        return compressed_name

    return archive_name
412
def _call_external_zip(directory, verbose=False, zip_filename=None,
                       dry_run=False):
    """Archive 'directory' into 'zip_filename' with the external "zip" tool.

    'verbose' selects between the "-r" and the quiet "-rq" option.
    'dry_run' is forwarded to distutils' spawn().

    Raises ValueError if no 'zip_filename' is given, and ExecError if the
    command fails.
    """
    if zip_filename is None:
        raise ValueError("zip_filename is required")
    # XXX see if we want to keep an external call here
    zipoptions = "-r" if verbose else "-rq"
    from distutils.errors import DistutilsExecError
    from distutils.spawn import spawn
    try:
        spawn(["zip", zipoptions, zip_filename, directory], dry_run=dry_run)
    except DistutilsExecError:
        # XXX really should distinguish between "couldn't find
        # external 'zip' command" and "zip failed".
        # The message is formatted BEFORE building the exception; applying
        # % to the exception object itself would raise TypeError.
        raise ExecError(("unable to create zip file '%s': "
                         "could neither import the 'zipfile' module nor "
                         "find a standalone zip utility") % zip_filename)


def _make_zipfile(base_name, base_dir, verbose=0, dry_run=0, logger=None):
    """Create a zip file from all the files under 'base_dir'.

    The output zip file will be named 'base_name' + ".zip".  Uses either the
    "zipfile" Python module (if available) or the InfoZIP "zip" utility
    (if installed and found on the default search path).  If neither tool is
    available, raises ExecError.  Returns the name of the output zip
    file.

    If 'dry_run' is true nothing is written.  'logger', if not None,
    receives info() messages about progress.
    """
    zip_filename = base_name + ".zip"
    archive_dir = os.path.dirname(base_name)

    # An empty dirname means "current directory": nothing to create, and
    # os.makedirs('') would fail.
    if archive_dir and not os.path.exists(archive_dir):
        if logger is not None:
            logger.info("creating %s", archive_dir)
        if not dry_run:
            os.makedirs(archive_dir)

    # If zipfile module is not available, try spawning an external 'zip'
    # command.
    try:
        import zipfile
    except ImportError:
        zipfile = None

    if zipfile is None:
        _call_external_zip(base_dir, verbose, zip_filename, dry_run)
    else:
        if logger is not None:
            logger.info("creating '%s' and adding '%s' to it",
                        zip_filename, base_dir)

        if not dry_run:
            archive = zipfile.ZipFile(zip_filename, "w",
                                      compression=zipfile.ZIP_DEFLATED)
            # try/finally so the archive is closed even if a write fails
            try:
                for dirpath, dirnames, filenames in os.walk(base_dir):
                    for name in filenames:
                        path = os.path.normpath(os.path.join(dirpath, name))
                        if os.path.isfile(path):
                            archive.write(path, path)
                            if logger is not None:
                                logger.info("adding '%s'", path)
            finally:
                archive.close()

    return zip_filename
476
# Registry of archive formats, keyed by format name.  Each value is a
# (function, extra_args, description) tuple: make_archive() calls the
# function with the (name, value) pairs of extra_args as keyword arguments,
# and get_archive_formats() reports the description.
_ARCHIVE_FORMATS = {
    'gztar': (_make_tarball, [('compress', 'gzip')], "gzip'ed tar-file"),
    'bztar': (_make_tarball, [('compress', 'bzip2')], "bzip2'ed tar-file"),
    'ztar':  (_make_tarball, [('compress', 'compress')],
                "compressed tar file"),
    'tar':   (_make_tarball, [('compress', None)], "uncompressed tar file"),
    'zip':   (_make_zipfile, [],"ZIP file")
    }
485
def get_archive_formats():
    """Return the registered archive formats as a sorted list.

    Each element of the returned list is a tuple (name, description)
    """
    return sorted((name, registry[2])
                  for name, registry in _ARCHIVE_FORMATS.items())
495
def register_archive_format(name, function, extra_args=None, description=''):
    """Registers an archive format.

    name is the name of the format. function is the callable that will be
    used to create archives. If provided, extra_args is a sequence of
    (name, value) tuples that will be passed as arguments to the callable.
    description can be provided to describe the format, and will be returned
    by the get_archive_formats() function.

    Raises TypeError if function is not callable, if extra_args is not a
    tuple or list, or if one of its elements is not a 2-item tuple or list.
    """
    if extra_args is None:
        extra_args = []
    # Use the callable() builtin: the collections.Callable alias is not
    # available on recent Python versions.
    if not callable(function):
        raise TypeError('The %s object is not callable' % function)
    if not isinstance(extra_args, (tuple, list)):
        raise TypeError('extra_args needs to be a sequence')
    for element in extra_args:
        if not isinstance(element, (tuple, list)) or len(element) != 2:
            raise TypeError('extra_args elements are : (arg_name, value)')

    _ARCHIVE_FORMATS[name] = (function, extra_args, description)
516
def unregister_archive_format(name):
    """Remove the archive format `name` from the registry.

    Raises KeyError if no such format is registered.
    """
    _ARCHIVE_FORMATS.pop(name)
519
def make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,
                 dry_run=0, owner=None, group=None, logger=None):
    """Create an archive file (eg. zip or tar) and return its name.

    'base_name' is the name of the file to create, minus any format-specific
    extension; 'format' is the name of a registered archive format, e.g.
    "zip", "tar", "ztar" or "gztar".  An unknown format raises ValueError.

    'root_dir' is a directory that will be the root directory of the
    archive; when given (and 'dry_run' is false) the process changes into
    it while the archive is built and changes back afterwards.  'base_dir'
    is the directory where archiving starts; it defaults to the current
    directory.

    'owner' and 'group' are passed on to the archiver for every format
    except "zip".  'logger', if not None, receives debug() messages about
    directory changes.
    """
    save_cwd = os.getcwd()
    chdir_requested = root_dir is not None
    if chdir_requested:
        if logger is not None:
            logger.debug("changing into '%s'", root_dir)
        # Resolve before changing directory so the output location is stable.
        base_name = os.path.abspath(base_name)
        if not dry_run:
            os.chdir(root_dir)

    if base_dir is None:
        base_dir = os.curdir

    options = {'dry_run': dry_run, 'logger': logger}

    try:
        registry = _ARCHIVE_FORMATS[format]
    except KeyError:
        raise ValueError("unknown archive format '%s'" % format)

    archiver = registry[0]
    for option_name, option_value in registry[1]:
        options[option_name] = option_value

    if format != 'zip':
        options['owner'] = owner
        options['group'] = group

    try:
        filename = archiver(base_name, base_dir, **options)
    finally:
        if chdir_requested:
            if logger is not None:
                logger.debug("changing back to '%s'", save_cwd)
            os.chdir(save_cwd)

    return filename
572 return filename