blob: 3cafd01d239686611c01b1748b31f226c9f4089e [file] [log] [blame]
Tarek Ziadéc3399782010-02-23 05:39:18 +00001"""Utility functions for copying and archiving files and directory trees.
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00002
Guido van Rossum959fa011999-08-18 20:03:17 +00003XXX The functions here don't copy the resource fork or other metadata on Mac.
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00004
5"""
Guido van Rossumc6360141990-10-13 19:23:40 +00006
Guido van Rossumc96207a1992-03-31 18:55:40 +00007import os
Guido van Rossum83c03e21999-02-23 23:07:51 +00008import sys
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00009import stat
Brett Cannon1c3fa182004-06-19 21:11:35 +000010from os.path import abspath
Georg Brandl2ee470f2008-07-16 12:55:28 +000011import fnmatch
Tarek Ziadé396fad72010-02-23 05:30:31 +000012import collections
Antoine Pitrou910bd512010-03-22 20:11:09 +000013import errno
Tarek Ziadé6ac91722010-04-28 17:51:36 +000014import tarfile
Tarek Ziadé396fad72010-02-23 05:30:31 +000015
16try:
Tarek Ziadéffa155a2010-04-29 13:34:35 +000017 import bz2
Florent Xicluna54540ec2011-11-04 08:29:17 +010018 del bz2
Tarek Ziadéffa155a2010-04-29 13:34:35 +000019 _BZ2_SUPPORTED = True
20except ImportError:
21 _BZ2_SUPPORTED = False
22
23try:
Tarek Ziadé396fad72010-02-23 05:30:31 +000024 from pwd import getpwnam
25except ImportError:
26 getpwnam = None
27
28try:
29 from grp import getgrnam
30except ImportError:
31 getgrnam = None
Guido van Rossumc6360141990-10-13 19:23:40 +000032
Tarek Ziadéc3399782010-02-23 05:39:18 +000033__all__ = ["copyfileobj", "copyfile", "copymode", "copystat", "copy", "copy2",
34 "copytree", "move", "rmtree", "Error", "SpecialFileError",
35 "ExecError", "make_archive", "get_archive_formats",
Tarek Ziadé6ac91722010-04-28 17:51:36 +000036 "register_archive_format", "unregister_archive_format",
37 "get_unpack_formats", "register_unpack_format",
Éric Araujoc5efe652011-08-21 14:30:00 +020038 "unregister_unpack_format", "unpack_archive",
Brian Curtinc57a3452012-06-22 16:00:30 -050039 "ignore_patterns", "chown", "which"]
Éric Araujoe4d5b8e2011-08-08 16:51:11 +020040 # disk_usage is added later, if available on the platform
Martin v. Löwise9ce0b02002-10-07 13:23:24 +000041
class Error(EnvironmentError):
    """Raised when a copy or move operation in this module fails."""


class SpecialFileError(EnvironmentError):
    """Raised when trying to do a kind of operation (e.g. copying) which is
    not supported on a special file (e.g. a named pipe)."""


class ExecError(EnvironmentError):
    """Raised when a command could not be executed"""


class ReadError(EnvironmentError):
    """Raised when an archive cannot be read"""


class RegistryError(Exception):
    """Raised when a registry operation with the archiving
    and unpacking registries fails"""


# WindowsError is only a builtin on Windows.  Bind the name to None elsewhere
# so that code in this module can test "WindowsError is not None" before
# using it in an isinstance() check.
try:
    WindowsError
except NameError:
    WindowsError = None
64
def copyfileobj(fsrc, fdst, length=16*1024):
    """Copy data from file-like object fsrc to file-like object fdst.

    Data is moved in chunks of at most `length` (as passed to fsrc.read())
    until fsrc.read() returns an empty (falsy) result.
    """
    chunk = fsrc.read(length)
    while chunk:
        fdst.write(chunk)
        chunk = fsrc.read(length)
72
def _samefile(src, dst):
    """Return True if src and dst refer to the same file.

    Uses os.path.samefile() where the platform provides it (an OSError from
    it, e.g. for a missing file, counts as "not the same"); otherwise falls
    back to comparing the normalized absolute pathnames.
    """
    samefile = getattr(os.path, 'samefile', None)
    if samefile is None:
        # No samefile() on this platform: check for same pathname.
        normalized_src = os.path.normcase(os.path.abspath(src))
        normalized_dst = os.path.normcase(os.path.abspath(dst))
        return normalized_src == normalized_dst

    # Macintosh, Unix.
    try:
        return samefile(src, dst)
    except OSError:
        return False
Tim Peters495ad3c2001-01-15 01:36:40 +000084
def copyfile(src, dst, symlinks=False):
    """Copy data from src to dst and return dst.

    If optional flag `symlinks` is set and `src` is a symbolic link, a new
    symlink will be created instead of copying the file it points to.

    Raises Error if src and dst are the same file, and SpecialFileError if
    either of them is a named pipe.

    """
    if _samefile(src, dst):
        raise Error("`%s` and `%s` are the same file" % (src, dst))

    for fn in (src, dst):
        try:
            st = os.stat(fn)
        except OSError:
            # File most likely does not exist
            continue
        # XXX What about other special files? (sockets, devices...)
        if stat.S_ISFIFO(st.st_mode):
            raise SpecialFileError("`%s` is a named pipe" % fn)

    if symlinks and os.path.islink(src):
        os.symlink(os.readlink(src), dst)
        return dst

    with open(src, 'rb') as fsrc, open(dst, 'wb') as fdst:
        copyfileobj(fsrc, fdst)
    return dst
Guido van Rossumc6360141990-10-13 19:23:40 +0000113
def copymode(src, dst, symlinks=False):
    """Copy mode bits from src to dst.

    If the optional flag `symlinks` is set, symlinks aren't followed if and
    only if both `src` and `dst` are symlinks.  If the required chmod
    function (`lchmod` for symlinks, e.g. missing on Linux; `chmod`
    otherwise) isn't available, this function does nothing.

    """
    links_only = symlinks and os.path.islink(src) and os.path.islink(dst)
    if links_only:
        stat_name, chmod_name = 'lstat', 'lchmod'
    else:
        stat_name, chmod_name = 'stat', 'chmod'

    chmod_func = getattr(os, chmod_name, None)
    if chmod_func is None:
        # The platform cannot change the mode of this kind of path.
        return

    stat_func = getattr(os, stat_name)
    chmod_func(dst, stat.S_IMODE(stat_func(src).st_mode))
134
def copystat(src, dst, symlinks=False):
    """Copy all stat info (mode bits, atime, mtime, flags) from src to dst.

    If the optional flag `symlinks` is set, symlinks aren't followed if and
    only if both `src` and `dst` are symlinks.

    """
    def _nop(*args, ns=None, follow_symlinks=None):
        # Stand-in for an os function that is missing or unusable here.
        pass

    # Operate on the link targets unless the caller asked for link handling
    # *and* both paths really are symlinks.
    follow = not (symlinks and os.path.islink(src) and os.path.islink(dst))

    def lookup(name):
        # Use the real os function if it exists; when we must not follow
        # symlinks, additionally require that it supports follow_symlinks.
        fn = getattr(os, name, _nop)
        if follow or fn in os.supports_follow_symlinks:
            return fn
        return _nop

    st = lookup("stat")(src, follow_symlinks=follow)
    mode = stat.S_IMODE(st.st_mode)
    lookup("utime")(dst, ns=(st.st_atime_ns, st.st_mtime_ns),
                    follow_symlinks=follow)
    try:
        lookup("chmod")(dst, mode, follow_symlinks=follow)
    except NotImplementedError:
        # The mode of dst could not be changed without following the symlink
        # (presumably follow_symlinks=False on a platform that has no way to
        # chmod a link itself).  We are out of options, so give up and
        # suppress the error, which is what shutil always did in this
        # circumstance.
        pass

    if hasattr(st, 'st_flags'):
        try:
            lookup("chflags")(dst, st.st_flags, follow_symlinks=follow)
        except OSError as why:
            # "Operation not supported" is tolerated; anything else is not.
            tolerated = [getattr(errno, err)
                         for err in ('EOPNOTSUPP', 'ENOTSUP')
                         if hasattr(errno, err)]
            if why.errno not in tolerated:
                raise
Guido van Rossum9d0a3df1997-04-29 14:45:19 +0000187
if hasattr(os, 'listxattr'):
    def _copyxattr(src, dst, symlinks=False):
        """Copy extended filesystem attributes from `src` to `dst`.

        Overwrite existing attributes.

        If the optional flag `symlinks` is set, symlinks won't be followed.

        Attributes that cannot be copied because of EPERM, ENOTSUP or
        ENODATA are skipped; any other OSError propagates.

        """
        # `symlinks` means "treat symlinks as symlinks", i.e. the opposite
        # of the os-level follow_symlinks flag.
        follow = not symlinks

        for name in os.listxattr(src, follow_symlinks=follow):
            try:
                value = os.getxattr(src, name, follow_symlinks=follow)
                os.setxattr(dst, name, value, follow_symlinks=follow)
            except OSError as e:
                if e.errno not in (errno.EPERM, errno.ENOTSUP, errno.ENODATA):
                    raise
else:
    def _copyxattr(*args, **kwargs):
        """Do nothing: extended attributes are unavailable on this platform."""
        pass
208
def copy(src, dst, symlinks=False):
    """Copy data and mode bits ("cp src dst"). Return the file's destination.

    The destination may be a directory, in which case the file is copied
    into it under the base name of `src`.

    If the optional flag `symlinks` is set, symlinks won't be followed. This
    resembles GNU's "cp -P src dst".

    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    copyfile(src, target, symlinks=symlinks)
    copymode(src, target, symlinks=symlinks)
    return target
Guido van Rossumc6360141990-10-13 19:23:40 +0000223
def copy2(src, dst, symlinks=False):
    """Copy data and all stat info ("cp -p src dst"). Return the file's
    destination.

    The destination may be a directory, in which case the file is copied
    into it under the base name of `src`.

    If the optional flag `symlinks` is set, symlinks won't be followed. This
    resembles GNU's "cp -P src dst".

    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    # Contents first, then stat info, then extended attributes.
    for step in (copyfile, copystat, _copyxattr):
        step(src, target, symlinks=symlinks)
    return target
Guido van Rossumc6360141990-10-13 19:23:40 +0000240
def ignore_patterns(*patterns):
    """Function that can be used as copytree() ignore parameter.

    Patterns is a sequence of glob-style patterns
    that are used to exclude files.  The returned callable takes
    (path, names) and returns the set of names matching any pattern."""
    def _ignore_patterns(path, names):
        return {name
                for pattern in patterns
                for name in fnmatch.filter(names, pattern)}
    return _ignore_patterns
252
def copytree(src, dst, symlinks=False, ignore=None, copy_function=copy2,
             ignore_dangling_symlinks=False):
    """Recursively copy a directory tree and return the destination.

    The destination directory must not already exist.
    If exception(s) occur, an Error is raised with a list of reasons; each
    reason is a (srcname, dstname, message) tuple.

    If the optional symlinks flag is true, symbolic links in the
    source tree result in symbolic links in the destination tree; if
    it is false, the contents of the files pointed to by symbolic
    links are copied. If the file pointed by the symlink doesn't
    exist, an exception will be added in the list of errors raised in
    an Error exception at the end of the copy process.

    You can set the optional ignore_dangling_symlinks flag to true if you
    want to silence this exception. Notice that this has no effect on
    platforms that don't support os.symlink.

    The optional ignore argument is a callable. If given, it
    is called with the `src` parameter, which is the directory
    being visited by copytree(), and `names` which is the list of
    `src` contents, as returned by os.listdir():

        callable(src, names) -> ignored_names

    Since copytree() is called recursively, the callable will be
    called once for each directory that is copied. It returns a
    list of names relative to the `src` directory that should
    not be copied.

    The optional copy_function argument is a callable that will be used
    to copy each file. It will be called with the source path and the
    destination path as arguments. By default, copy2() is used, but any
    function that supports the same signature (like copy()) can be used.

    """
    names = os.listdir(src)
    if ignore is not None:
        ignored_names = ignore(src, names)
    else:
        ignored_names = set()

    os.makedirs(dst)
    errors = []
    for name in names:
        if name in ignored_names:
            continue
        srcname = os.path.join(src, name)
        dstname = os.path.join(dst, name)
        try:
            if os.path.islink(srcname):
                if symlinks:
                    # We can't just leave it to `copy_function` because legacy
                    # code with a custom `copy_function` may rely on copytree
                    # doing the right thing.
                    os.symlink(os.readlink(srcname), dstname)
                    copystat(srcname, dstname, symlinks=symlinks)
                else:
                    # Ignore dangling symlink if the flag is on.  Test the
                    # link itself: os.path.exists() follows it, so a relative
                    # target is resolved against the link's directory rather
                    # than the current working directory.
                    if ignore_dangling_symlinks and not os.path.exists(srcname):
                        continue
                    # Otherwise let the copy occur; copy2 will raise an error
                    # for a dangling link.
                    copy_function(srcname, dstname)
            elif os.path.isdir(srcname):
                # Pass every option down so subdirectories are treated like
                # the top level (including ignore_dangling_symlinks).
                copytree(srcname, dstname, symlinks, ignore, copy_function,
                         ignore_dangling_symlinks)
            else:
                # Will raise a SpecialFileError for unsupported file types
                copy_function(srcname, dstname)
        # catch the Error from the recursive copytree so that we can
        # continue with other files
        except Error as err:
            errors.extend(err.args[0])
        except EnvironmentError as why:
            errors.append((srcname, dstname, str(why)))
    try:
        copystat(src, dst)
    except OSError as why:
        if WindowsError is not None and isinstance(why, WindowsError):
            # Copying file access times may fail on Windows
            pass
        else:
            # One (src, dst, message) entry, like every other recorded error.
            errors.append((src, dst, str(why)))
    if errors:
        raise Error(errors)
    return dst
Guido van Rossumd7673291998-02-06 21:38:09 +0000339
Hynek Schlawack67be92b2012-06-23 17:58:42 +0200340# version vulnerable to race conditions
def _rmtree_unsafe(path, onerror):
    """Remove the tree rooted at `path` using path-based os calls.

    Every failure is reported as onerror(func, path, sys.exc_info()); if
    onerror returns, removal carries on with the remaining entries.  A
    symlink passed as `path` is reported and never descended into.
    """
    try:
        if os.path.islink(path):
            # symlinks to directories are forbidden, see bug #1669
            raise OSError("Cannot call rmtree on a symbolic link")
    except OSError:
        onerror(os.path.islink, path, sys.exc_info())
        # can't continue even if onerror hook returns
        return

    try:
        names = os.listdir(path)
    except os.error:
        names = []
        onerror(os.listdir, path, sys.exc_info())

    for name in names:
        fullname = os.path.join(path, name)
        try:
            is_dir = stat.S_ISDIR(os.lstat(fullname).st_mode)
        except os.error:
            # Cannot stat it: fall through to unlink, which reports errors.
            is_dir = False
        if is_dir:
            _rmtree_unsafe(fullname, onerror)
            continue
        try:
            os.unlink(fullname)
        except os.error:
            onerror(os.unlink, fullname, sys.exc_info())

    try:
        os.rmdir(path)
    except os.error:
        onerror(os.rmdir, path, sys.exc_info())
Guido van Rossumd7673291998-02-06 21:38:09 +0000372
Hynek Schlawack67be92b2012-06-23 17:58:42 +0200373# Version using fd-based APIs to protect against races
def _rmtree_safe_fd(topfd, path, onerror):
    """Remove the directory open as `topfd`, using fd-relative os calls.

    `path` is the pathname corresponding to `topfd`; it is used for error
    reporting and for the final os.rmdir() of the directory itself.  Every
    failure is reported as onerror(func, path, sys.exc_info()).

    Entries are examined without following symlinks, so a symlink inside
    the tree is unlinked rather than descended into.
    """
    names = []
    try:
        names = os.listdir(topfd)
    except os.error:
        onerror(os.listdir, path, sys.exc_info())
    for name in names:
        fullname = os.path.join(path, name)
        try:
            # lstat semantics: a symlink to a directory must be classified
            # as a link (and unlinked), never as a directory to recurse into.
            orig_st = os.stat(name, dir_fd=topfd, follow_symlinks=False)
            mode = orig_st.st_mode
        except os.error:
            mode = 0
        if stat.S_ISDIR(mode):
            try:
                dirfd = os.open(name, os.O_RDONLY, dir_fd=topfd)
            except os.error:
                onerror(os.open, fullname, sys.exc_info())
            else:
                try:
                    # Only descend if what we opened is the directory we
                    # stat'ed, i.e. it was not swapped in between.
                    if os.path.samestat(orig_st, os.fstat(dirfd)):
                        _rmtree_safe_fd(dirfd, fullname, onerror)
                finally:
                    os.close(dirfd)
        else:
            try:
                os.unlink(name, dir_fd=topfd)
            except os.error:
                onerror(os.unlink, fullname, sys.exc_info())
    try:
        os.rmdir(path)
    except os.error:
        onerror(os.rmdir, path, sys.exc_info())
407
# The fd-based rmtree needs os.open(), os.stat() and os.unlink() to accept
# dir_fd, and os.listdir() to accept a file descriptor; use it only when the
# platform provides all of them.
_use_fd_functions = ({os.open, os.stat, os.unlink} <= os.supports_dir_fd and
                     os.listdir in os.supports_fd)
410
def rmtree(path, ignore_errors=False, onerror=None):
    """Recursively delete a directory tree.

    If ignore_errors is set, errors are ignored; otherwise, if onerror
    is set, it is called to handle the error with arguments (func,
    path, exc_info) where func is platform and implementation dependent;
    path is the argument to that function that caused it to fail; and
    exc_info is a tuple returned by sys.exc_info().  If ignore_errors
    is false and onerror is None, an exception is raised.

    `path` must be a real directory: a symbolic link or any other
    non-directory is reported through the error handling described above.

    """
    if ignore_errors:
        def onerror(*args):
            pass
    elif onerror is None:
        def onerror(*args):
            # Always called from inside an "except" block, so a bare raise
            # re-raises the error being reported.
            raise

    if not _use_fd_functions:
        return _rmtree_unsafe(path, onerror)

    # While the unsafe rmtree works fine on bytes, the fd based does not.
    if isinstance(path, bytes):
        path = os.fsdecode(path)
    # Note: To guard against symlink races, we use the standard
    # lstat()/open()/fstat() trick.
    try:
        orig_st = os.lstat(path)
    except Exception:
        onerror(os.lstat, path, sys.exc_info())
        return
    try:
        fd = os.open(path, os.O_RDONLY)
    except Exception:
        # Report the call that actually failed.
        onerror(os.open, path, sys.exc_info())
        return
    try:
        is_dir = stat.S_ISDIR(orig_st.st_mode)
        if is_dir and os.path.samestat(orig_st, os.fstat(fd)):
            _rmtree_safe_fd(fd, path, onerror)
        elif is_dir or stat.S_ISLNK(orig_st.st_mode):
            # Either `path` is a symlink, or the directory we lstat'ed was
            # replaced before we opened it.  Mirror _rmtree_unsafe().
            try:
                # symlinks to directories are forbidden, see bug #1669
                raise OSError("Cannot call rmtree on a symbolic link")
            except OSError:
                onerror(os.path.islink, path, sys.exc_info())
        else:
            # Not a directory at all.  Route the error through onerror so
            # that ignore_errors and custom handlers are honoured.
            try:
                raise NotADirectoryError(20,
                                         "Not a directory: '{}'".format(path))
            except OSError:
                onerror(os.listdir, path, sys.exc_info())
    finally:
        os.close(fd)

# Allow introspection of whether or not the hardening against symlink
# attacks is supported on the current platform
rmtree.avoids_symlink_attacks = _use_fd_functions
Martin v. Löwise9ce0b02002-10-07 13:23:24 +0000459
def _basename(path):
    """Return the last component of `path`, ignoring trailing separators.

    Unlike os.path.basename(), this also gives the directory name for a
    path such as "a/b/".  Both os.path.sep and, where the platform defines
    one, os.path.altsep are stripped.
    """
    separators = os.path.sep + (os.path.altsep or '')
    return os.path.basename(path.rstrip(separators))
464
def move(src, dst):
    """Recursively move a file or directory to another location. This is
    similar to the Unix "mv" command. Return the file or directory's
    destination.

    If the destination is a directory or a symlink to a directory, the source
    is moved inside the directory. The destination path must not already
    exist.

    If the destination already exists but is not a directory, it may be
    overwritten depending on os.rename() semantics.

    If the destination is on our current filesystem, then rename() is used.
    Otherwise, src is copied to the destination and then removed. Symlinks are
    recreated under the new name if os.rename() fails because of cross
    filesystem renames.

    Raises Error if the final destination already exists inside `dst`, or
    if a directory would be moved into itself.

    A lot more could be done here...  A look at a mv.c shows a lot of
    the issues this implementation glosses over.

    """
    real_dst = dst
    if os.path.isdir(dst):
        if _samefile(src, dst):
            # We might be on a case insensitive filesystem,
            # perform the rename anyway.
            os.rename(src, dst)
            # Honour the documented contract on this path too.
            return real_dst

        real_dst = os.path.join(dst, _basename(src))
        if os.path.exists(real_dst):
            raise Error("Destination path '%s' already exists" % real_dst)
    try:
        os.rename(src, real_dst)
    except OSError:
        # rename() failed (e.g. across filesystems): copy, then remove.
        if os.path.islink(src):
            linkto = os.readlink(src)
            os.symlink(linkto, real_dst)
            os.unlink(src)
        elif os.path.isdir(src):
            if _destinsrc(src, dst):
                raise Error("Cannot move a directory '%s' into itself '%s'." % (src, dst))
            copytree(src, real_dst, symlinks=True)
            rmtree(src)
        else:
            copy2(src, real_dst)
            os.unlink(src)
    return real_dst
Brett Cannon1c3fa182004-06-19 21:11:35 +0000513
def _destinsrc(src, dst):
    """Return True if `dst` is `src` itself or lies inside `src`.

    Both paths are made absolute and given a trailing separator before the
    prefix test, so "/a/bc" is not mistaken for a child of "/a/b".
    """
    sep = os.path.sep

    def _as_dir_prefix(path):
        path = abspath(path)
        return path if path.endswith(sep) else path + sep

    src_prefix = _as_dir_prefix(src)
    dst_prefix = _as_dir_prefix(dst)
    return dst_prefix.startswith(src_prefix)
Tarek Ziadé396fad72010-02-23 05:30:31 +0000522
def _get_gid(name):
    """Returns a gid, given a group name.

    Returns None when `name` is None, when group lookups are unavailable
    (getgrnam is None) or when the group is unknown.
    """
    if getgrnam is None or name is None:
        return None
    try:
        entry = getgrnam(name)
    except KeyError:
        return None
    # Index 2 of the group entry holds the numeric gid.
    return entry[2] if entry is not None else None
534
def _get_uid(name):
    """Returns an uid, given a user name.

    Returns None when `name` is None, when user lookups are unavailable
    (getpwnam is None) or when the user is unknown.
    """
    if getpwnam is None or name is None:
        return None
    try:
        entry = getpwnam(name)
    except KeyError:
        return None
    # Index 2 of the password entry holds the numeric uid.
    return entry[2] if entry is not None else None
546
def _make_tarball(base_name, base_dir, compress="gzip", verbose=0, dry_run=0,
                  owner=None, group=None, logger=None):
    """Create a (possibly compressed) tar file from all the files under
    'base_dir'.

    'compress' must be "gzip" (the default), "bzip2", or None.  "bzip2" is
    only accepted when the bz2 module is available; any other value raises
    ValueError.

    'owner' and 'group' can be used to define an owner and a group for the
    archive that is being built. If not provided, the current owner and group
    will be used.

    If 'dry_run' is true, nothing is written; 'logger', if given, receives
    progress messages.  'verbose' is accepted but not used here.

    The output tar file will be named 'base_name' +  ".tar", possibly plus
    the appropriate compression extension (".gz", or ".bz2").

    Returns the output filename.
    """
    tar_compression = {'gzip': 'gz', None: ''}
    compress_ext = {'gzip': '.gz'}

    if _BZ2_SUPPORTED:
        tar_compression['bzip2'] = 'bz2'
        compress_ext['bzip2'] = '.bz2'

    # Reject unknown (or unsupported) compression names up front.
    if compress is not None and compress not in compress_ext:
        raise ValueError("bad value for 'compress', or compression format not "
                         "supported : {0}".format(compress))

    archive_name = base_name + '.tar' + compress_ext.get(compress, '')
    archive_dir = os.path.dirname(archive_name)

    # An empty dirname means "current directory": nothing to create, and
    # os.makedirs('') would fail.
    if archive_dir and not os.path.exists(archive_dir):
        if logger is not None:
            logger.info("creating %s", archive_dir)
        if not dry_run:
            os.makedirs(archive_dir)

    # creating the tarball
    if logger is not None:
        logger.info('Creating tar archive')

    uid = _get_uid(owner)
    gid = _get_gid(group)

    def _set_uid_gid(tarinfo):
        # tarfile filter: override ownership where an id could be resolved.
        if gid is not None:
            tarinfo.gid = gid
            tarinfo.gname = group
        if uid is not None:
            tarinfo.uid = uid
            tarinfo.uname = owner
        return tarinfo

    if not dry_run:
        tar = tarfile.open(archive_name, 'w|%s' % tar_compression[compress])
        try:
            tar.add(base_dir, filter=_set_uid_gid)
        finally:
            tar.close()

    return archive_name
608
def _call_external_zip(base_dir, zip_filename, verbose=False, dry_run=False):
    """Create `zip_filename` from `base_dir` with the external "zip" command.

    The command is run recursively, quietly unless `verbose` is true, and
    `dry_run` is passed on to distutils' spawn().  Raises ExecError if the
    command could not be run successfully.
    """
    # XXX see if we want to keep an external call here
    if verbose:
        zipoptions = "-r"
    else:
        zipoptions = "-rq"
    from distutils.errors import DistutilsExecError
    from distutils.spawn import spawn
    try:
        spawn(["zip", zipoptions, zip_filename, base_dir], dry_run=dry_run)
    except DistutilsExecError:
        # XXX really should distinguish between "couldn't find
        # external 'zip' command" and "zip failed".
        # The filename must be interpolated into the message *before* the
        # exception is built; "%" cannot be applied to the exception object.
        raise ExecError(("unable to create zip file '%s': "
                         "could neither import the 'zipfile' module nor "
                         "find a standalone zip utility") % zip_filename)
625
def _make_zipfile(base_name, base_dir, verbose=0, dry_run=0, logger=None):
    """Create a zip file from all the files under 'base_dir'.

    The output zip file will be named 'base_name' + ".zip".  Uses either the
    "zipfile" Python module (if available) or the InfoZIP "zip" utility
    (if installed and found on the default search path).  If neither tool is
    available, raises ExecError.  Returns the name of the output zip
    file.

    If 'dry_run' is true, nothing is written; 'logger', if given, receives
    progress messages.  'verbose' only affects the external "zip" fallback.
    """
    zip_filename = base_name + ".zip"
    archive_dir = os.path.dirname(base_name)

    # An empty dirname means "current directory": nothing to create, and
    # os.makedirs('') would fail.
    if archive_dir and not os.path.exists(archive_dir):
        if logger is not None:
            logger.info("creating %s", archive_dir)
        if not dry_run:
            os.makedirs(archive_dir)

    # If zipfile module is not available, try spawning an external 'zip'
    # command.
    try:
        import zipfile
    except ImportError:
        zipfile = None

    if zipfile is None:
        _call_external_zip(base_dir, zip_filename, verbose, dry_run)
    else:
        if logger is not None:
            logger.info("creating '%s' and adding '%s' to it",
                        zip_filename, base_dir)

        if not dry_run:
            # The context manager closes the archive even if adding a
            # member fails.
            with zipfile.ZipFile(zip_filename, "w",
                                 compression=zipfile.ZIP_DEFLATED) as zf:
                for dirpath, dirnames, filenames in os.walk(base_dir):
                    for name in filenames:
                        path = os.path.normpath(os.path.join(dirpath, name))
                        if os.path.isfile(path):
                            zf.write(path, path)
                            if logger is not None:
                                logger.info("adding '%s'", path)

    return zip_filename
672
# Registry of archive writers, keyed by format name.  Each value is a
# (function, extra_args, description) triple, where extra_args is a list of
# (name, value) pairs.
_ARCHIVE_FORMATS = {
    'gztar': (_make_tarball, [('compress', 'gzip')], "gzip'ed tar-file"),
    'tar': (_make_tarball, [('compress', None)], "uncompressed tar file"),
    'zip': (_make_zipfile, [], "ZIP file"),
}

# bzip2-compressed tarballs are only offered when the bz2 module imported.
if _BZ2_SUPPORTED:
    _ARCHIVE_FORMATS.update(
        bztar=(_make_tarball, [('compress', 'bzip2')], "bzip2'ed tar-file"))
682
def get_archive_formats():
    """Returns a sorted list of the registered archive formats.

    Each element of the returned sequence is a tuple (name, description)
    """
    return sorted((name, registry[2])
                  for name, registry in _ARCHIVE_FORMATS.items())
692
def register_archive_format(name, function, extra_args=None, description=''):
    """Registers an archive format.

    name is the name of the format. function is the callable that will be
    used to create archives. If provided, extra_args is a sequence of
    (name, value) tuples that will be passed as arguments to the callable.
    description can be provided to describe the format, and will be returned
    by the get_archive_formats() function.

    Raises TypeError if function is not callable, if extra_args is not a
    tuple or list, or if one of its elements is not a 2-item tuple or list.
    """
    if extra_args is None:
        extra_args = []
    if not callable(function):
        # Wrap the object in a 1-tuple: a bare tuple on the right-hand side
        # of % would be unpacked as the format arguments and produce an
        # unrelated formatting error instead of this message.
        raise TypeError('The %s object is not callable' % (function,))
    if not isinstance(extra_args, (tuple, list)):
        raise TypeError('extra_args needs to be a sequence')
    for element in extra_args:
        if not isinstance(element, (tuple, list)) or len(element) != 2:
            raise TypeError('extra_args elements are : (arg_name, value)')

    _ARCHIVE_FORMATS[name] = (function, extra_args, description)
713
def unregister_archive_format(name):
    """Remove the archive format `name` from the registry.

    Raises KeyError if no format is registered under that name.
    """
    _ARCHIVE_FORMATS.pop(name)
716
def make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,
                 dry_run=0, owner=None, group=None, logger=None):
    """Create an archive file (eg. zip or tar).

    'base_name' is the name of the file to create, minus any format-specific
    extension; 'format' is the archive format: one of "zip", "tar", "bztar"
    or "gztar".

    'root_dir' is a directory that will be the root directory of the
    archive; ie. we typically chdir into 'root_dir' before creating the
    archive.  'base_dir' is the directory where we start archiving from;
    ie. 'base_dir' will be the common prefix of all files and
    directories in the archive.  'root_dir' and 'base_dir' both default
    to the current directory.  Returns the name of the archive file.

    'owner' and 'group' are used when creating a tar archive. By default,
    uses the current owner and group.

    'verbose' is accepted but not used by this function.  If 'logger' is
    given, directory changes are reported through its debug() method.

    Raises ValueError if 'format' is not a registered archive format; the
    current working directory is left untouched in that case.
    """
    # Look the format up before touching the working directory, so that an
    # unknown format cannot leave the process chdir'ed into root_dir.
    try:
        format_info = _ARCHIVE_FORMATS[format]
    except KeyError:
        raise ValueError("unknown archive format '%s'" % format)

    save_cwd = os.getcwd()
    if root_dir is not None:
        if logger is not None:
            logger.debug("changing into '%s'", root_dir)
        # Resolve base_name while the original cwd is still in effect.
        base_name = os.path.abspath(base_name)
        if not dry_run:
            os.chdir(root_dir)

    # Everything after the chdir runs under try/finally so the original
    # working directory is restored on any failure.
    try:
        if base_dir is None:
            base_dir = os.curdir

        kwargs = {'dry_run': dry_run, 'logger': logger}

        func = format_info[0]
        for arg, val in format_info[1]:
            kwargs[arg] = val

        # Every format except 'zip' receives the ownership arguments.
        if format != 'zip':
            kwargs['owner'] = owner
            kwargs['group'] = group

        filename = func(base_name, base_dir, **kwargs)
    finally:
        if root_dir is not None:
            if logger is not None:
                logger.debug("changing back to '%s'", save_cwd)
            os.chdir(save_cwd)

    return filename
Tarek Ziadé6ac91722010-04-28 17:51:36 +0000770
771
def get_unpack_formats():
    """Return the registered unpack formats as a sorted list.

    Each element of the returned list is a tuple
    (name, extensions, description).
    """
    return sorted((fmt, entry[0], entry[3])
                  for fmt, entry in _UNPACK_FORMATS.items())
782
def _check_unpack_options(extensions, function, extra_args):
    """Validate the arguments of an unpacker about to be registered.

    Raises RegistryError if one of `extensions` already belongs to a
    registered unpack format, and TypeError if `function` is not callable.
    `extra_args` is accepted but not inspected.
    """
    # map every extension that is already taken to the format owning it
    owner_of = {ext: fmt
                for fmt, entry in _UNPACK_FORMATS.items()
                for ext in entry[0]}

    for ext in extensions:
        if ext in owner_of:
            raise RegistryError('%s is already registered for "%s"'
                                % (ext, owner_of[ext]))

    if not callable(function):
        raise TypeError('The registered function must be a callable')
799
800
def register_unpack_format(name, extensions, function, extra_args=None,
                           description=''):
    """Register an unpack format.

    `name` is the name of the format. `extensions` is a list of extensions
    corresponding to the format.

    `function` is the callable that will be used to unpack archives. The
    callable will receive archives to unpack. If it's unable to handle an
    archive, it needs to raise a ReadError exception.

    If provided, `extra_args` is a sequence of (name, value) tuples that
    will be passed as arguments to the callable. `description` can be
    provided to describe the format, and will be returned by the
    get_unpack_formats() function.
    """
    args = [] if extra_args is None else extra_args
    # validation raises before anything is stored in the registry
    _check_unpack_options(extensions, function, args)
    _UNPACK_FORMATS[name] = (extensions, function, args, description)
822
def unregister_unpack_format(name):
    """Remove the unpack format `name` from the registry.

    Raises KeyError if no format is registered under that name.
    """
    _UNPACK_FORMATS.pop(name)
826
827def _ensure_directory(path):
828 """Ensure that the parent directory of `path` exists"""
829 dirname = os.path.dirname(path)
830 if not os.path.isdir(dirname):
831 os.makedirs(dirname)
832
def _unpack_zipfile(filename, extract_dir):
    """Unpack zip `filename` to `extract_dir`.

    Raises ReadError if the zipfile module cannot be imported or if
    `filename` is not a zip file.  Members whose name starts with '/' or
    contains '..' are skipped.
    """
    try:
        import zipfile
    except ImportError:
        raise ReadError('zlib not supported, cannot unpack this archive.')

    if not zipfile.is_zipfile(filename):
        raise ReadError("%s is not a zip file" % filename)

    with zipfile.ZipFile(filename) as archive:
        for member in archive.infolist():
            member_name = member.filename

            # don't extract absolute paths or ones with .. in them
            if member_name.startswith('/') or '..' in member_name:
                continue

            target = os.path.join(extract_dir, *member_name.split('/'))
            if not target:
                continue

            _ensure_directory(target)
            if member_name.endswith('/'):
                # directory entry: creating it above was all there is to do
                continue

            # regular file: the whole member is read into memory, then written
            payload = archive.read(member.filename)
            with open(target, 'wb') as out:
                out.write(payload)
            del payload
869
870def _unpack_tarfile(filename, extract_dir):
871 """Unpack tar/tar.gz/tar.bz2 `filename` to `extract_dir`
872 """
873 try:
874 tarobj = tarfile.open(filename)
875 except tarfile.TarError:
876 raise ReadError(
877 "%s is not a compressed or uncompressed tar file" % filename)
878 try:
879 tarobj.extractall(extract_dir)
880 finally:
881 tarobj.close()
882
# Registry of unpackers, keyed by format name.  Each value is an
# (extensions, function, extra_args, description) tuple.
_UNPACK_FORMATS = {
    'gztar': (['.tar.gz', '.tgz'], _unpack_tarfile, [], "gzip'ed tar-file"),
    'tar':   (['.tar'], _unpack_tarfile, [], "uncompressed tar file"),
    'zip':   (['.zip'], _unpack_zipfile, [], "ZIP file"),
}

# The bzip2 flavour is only registered when the bz2 module could be imported.
if _BZ2_SUPPORTED:
    _UNPACK_FORMATS['bztar'] = (
        ['.bz2'], _unpack_tarfile, [], "bzip2'ed tar-file")
892
Tarek Ziadé6ac91722010-04-28 17:51:36 +0000893def _find_unpack_format(filename):
894 for name, info in _UNPACK_FORMATS.items():
895 for extension in info[0]:
896 if filename.endswith(extension):
897 return name
898 return None
899
def unpack_archive(filename, extract_dir=None, format=None):
    """Unpack an archive.

    `filename` is the name of the archive.

    `extract_dir` is the name of the target directory, where the archive
    is unpacked. If not provided, the current working directory is used.

    `format` is the name of a registered unpack format. If not provided,
    unpack_archive will use the filename extension and see if an unpacker
    was registered for that extension.

    A ValueError is raised if `format` is given but not registered; a
    ReadError is raised if `format` is not given and no registered
    unpacker matches the filename extension.
    """
    if extract_dir is None:
        extract_dir = os.getcwd()

    if format is None:
        # we need to look at the registered unpackers supported extensions
        format = _find_unpack_format(filename)
        if format is None:
            raise ReadError("Unknown archive format '{0}'".format(filename))
        format_info = _UNPACK_FORMATS[format]
    else:
        try:
            format_info = _UNPACK_FORMATS[format]
        except KeyError:
            raise ValueError("Unknown unpack format '{0}'".format(format))

    # registry entries are (extensions, function, extra_args, description)
    unpacker = format_info[1]
    unpacker(filename, extract_dir, **dict(format_info[2]))
Giampaolo Rodola'210e7ca2011-07-01 13:55:36 +0200935
Éric Araujoe4d5b8e2011-08-08 16:51:11 +0200936
if hasattr(os, 'statvfs'):

    __all__.append('disk_usage')
    _ntuple_diskusage = collections.namedtuple('usage', 'total used free')

    def disk_usage(path):
        """Return disk usage statistics about the given path.

        The returned value is a named tuple with attributes 'total', 'used'
        and 'free', which are the amount of total, used and free space, in
        bytes.
        """
        vfs = os.statvfs(path)
        # all block counts are scaled by the fragment size; 'free' is based
        # on f_bavail while 'used' is based on f_bfree
        unit = vfs.f_frsize
        return _ntuple_diskusage(
            total=vfs.f_blocks * unit,
            used=(vfs.f_blocks - vfs.f_bfree) * unit,
            free=vfs.f_bavail * unit)

elif os.name == 'nt':

    import nt
    __all__.append('disk_usage')
    _ntuple_diskusage = collections.namedtuple('usage', 'total used free')

    def disk_usage(path):
        """Return disk usage statistics about the given path.

        The returned value is a named tuple with attributes 'total', 'used'
        and 'free', which are the amount of total, used and free space, in
        bytes.
        """
        capacity, available = nt._getdiskusage(path)
        return _ntuple_diskusage(total=capacity,
                                 used=capacity - available,
                                 free=available)
Sandro Tosid902a142011-08-22 23:28:27 +0200969
Éric Araujo0ac4a5d2011-09-01 08:31:51 +0200970
def chown(path, user=None, group=None):
    """Change owner user and group of the given path.

    user and group can be the uid/gid or the user/group names, and in that
    case, they are converted to their respective uid/gid.

    Raises ValueError if neither user nor group is given, and LookupError
    if a given name cannot be resolved.
    """
    if user is None and group is None:
        raise ValueError("user and/or group must be set")

    # -1 means don't change it
    uid = -1 if user is None else user
    gid = -1 if group is None else group

    # user can either be an int (the uid) or a string (the system username)
    if isinstance(user, str):
        uid = _get_uid(user)
        if uid is None:
            raise LookupError("no such user: {!r}".format(user))

    # any group that is given and is not an int is looked up by name
    if group is not None and not isinstance(group, int):
        gid = _get_gid(group)
        if gid is None:
            raise LookupError("no such group: {!r}".format(group))

    os.chown(path, uid, gid)
Antoine Pitroubcf2b592012-02-08 23:28:36 +01001001
def get_terminal_size(fallback=(80, 24)):
    """Get the size of the terminal window.

    For each of the two dimensions, the environment variable, COLUMNS
    and LINES respectively, is checked. If the variable is defined and
    the value is a positive integer, it is used.

    When COLUMNS or LINES is not defined, which is the common case,
    the terminal connected to sys.__stdout__ is queried
    by invoking os.get_terminal_size.

    If the terminal size cannot be successfully queried, either because
    the system doesn't support querying, because sys.__stdout__ is
    missing or closed, or because we are not connected to a terminal,
    the value given in fallback parameter is used. Fallback defaults to
    (80, 24) which is the default size used by many terminal emulators.

    The value returned is a named tuple of type os.terminal_size.
    """
    # columns, lines are the working values
    try:
        columns = int(os.environ['COLUMNS'])
    except (KeyError, ValueError):
        columns = 0

    try:
        lines = int(os.environ['LINES'])
    except (KeyError, ValueError):
        lines = 0

    # only query if necessary
    if columns <= 0 or lines <= 0:
        try:
            size = os.get_terminal_size(sys.__stdout__.fileno())
        except (AttributeError, NameError, OSError, ValueError):
            # AttributeError: sys.__stdout__ is None or has no fileno(), or
            # os.get_terminal_size is unavailable; ValueError: the stream is
            # closed; OSError: the query itself failed.
            size = os.terminal_size(fallback)
        if columns <= 0:
            columns = size.columns
        if lines <= 0:
            lines = size.lines

    return os.terminal_size((columns, lines))
Brian Curtinc57a3452012-06-22 16:00:30 -05001044
def which(cmd, mode=os.F_OK | os.X_OK, path=None):
    """Given a command, mode, and a PATH string, return the path which
    conforms to the given mode on the PATH, or None if there is no such
    file.

    `mode` defaults to os.F_OK | os.X_OK. `path` defaults to the result
    of os.environ.get("PATH"), or can be overridden with a custom search
    path.

    If `cmd` contains a directory component it is checked directly and
    the search path is not consulted.

    """
    # Check that a given file can be accessed with the correct mode.
    # Additionally check that `file` is not a directory, as on Windows
    # directories pass the os.access check.
    def _access_check(fn, mode):
        return (os.path.exists(fn) and os.access(fn, mode)
                and not os.path.isdir(fn))

    # A command that carries a directory part is looked up as given.  A
    # bare name must go through the search path below: matching it against
    # the current directory here would find files that are not on PATH.
    if os.path.dirname(cmd):
        if _access_check(cmd, mode):
            return cmd
        return None

    path = (path or os.environ.get("PATH", os.defpath)).split(os.pathsep)

    if sys.platform == "win32":
        # The current directory takes precedence on Windows.
        if os.curdir not in path:
            path.insert(0, os.curdir)

        # PATHEXT is necessary to check on Windows.
        pathext = os.environ.get("PATHEXT", "").split(os.pathsep)
        # See if the given file matches any of the expected path extensions.
        # This will allow us to short circuit when given "python.exe".
        # If it does match, only test that one, otherwise we have to try
        # others.
        lowered = cmd.lower()
        if any(lowered.endswith(ext.lower()) for ext in pathext):
            files = [cmd]
        else:
            files = [cmd + ext.lower() for ext in pathext]
    else:
        # On other platforms you don't have things like PATHEXT to tell you
        # what file suffixes are executable, so just pass on cmd as-is.
        files = [cmd]

    seen = set()
    for directory in path:
        # The case-normalized form is only used to skip duplicate entries;
        # the returned path is built from the directory as it was given.
        normdir = os.path.normcase(directory)
        if normdir in seen:
            continue
        seen.add(normdir)
        for thefile in files:
            name = os.path.join(directory, thefile)
            if _access_check(name, mode):
                return name
    return None