blob: f97de788d9d406d8cfa27dc70ac084ad2c4735f8 [file] [log] [blame]
Tarek Ziadéc3399782010-02-23 05:39:18 +00001"""Utility functions for copying and archiving files and directory trees.
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00002
Guido van Rossum959fa011999-08-18 20:03:17 +00003XXX The functions here don't copy the resource fork or other metadata on Mac.
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00004
5"""
Guido van Rossumc6360141990-10-13 19:23:40 +00006
Guido van Rossumc96207a1992-03-31 18:55:40 +00007import os
Guido van Rossum83c03e21999-02-23 23:07:51 +00008import sys
Guido van Rossum9d0a3df1997-04-29 14:45:19 +00009import stat
Georg Brandl2ee470f2008-07-16 12:55:28 +000010import fnmatch
Tarek Ziadé396fad72010-02-23 05:30:31 +000011import collections
Antoine Pitrou910bd512010-03-22 20:11:09 +000012import errno
Serhiy Storchaka20cdffd2016-12-16 18:58:33 +020013
14try:
15 import zlib
16 del zlib
17 _ZLIB_SUPPORTED = True
18except ImportError:
19 _ZLIB_SUPPORTED = False
Tarek Ziadé396fad72010-02-23 05:30:31 +000020
21try:
Tarek Ziadéffa155a2010-04-29 13:34:35 +000022 import bz2
Florent Xicluna54540ec2011-11-04 08:29:17 +010023 del bz2
Tarek Ziadéffa155a2010-04-29 13:34:35 +000024 _BZ2_SUPPORTED = True
Brett Cannoncd171c82013-07-04 17:43:24 -040025except ImportError:
Tarek Ziadéffa155a2010-04-29 13:34:35 +000026 _BZ2_SUPPORTED = False
27
28try:
Serhiy Storchaka11213772014-08-06 18:50:19 +030029 import lzma
30 del lzma
31 _LZMA_SUPPORTED = True
32except ImportError:
33 _LZMA_SUPPORTED = False
34
35try:
Tarek Ziadé396fad72010-02-23 05:30:31 +000036 from pwd import getpwnam
Brett Cannoncd171c82013-07-04 17:43:24 -040037except ImportError:
Tarek Ziadé396fad72010-02-23 05:30:31 +000038 getpwnam = None
39
40try:
41 from grp import getgrnam
Brett Cannoncd171c82013-07-04 17:43:24 -040042except ImportError:
Tarek Ziadé396fad72010-02-23 05:30:31 +000043 getgrnam = None
Guido van Rossumc6360141990-10-13 19:23:40 +000044
# Platform probes, evaluated once at import time.
_WINDOWS = (os.name == 'nt')

# Bind the platform-specific low-level module; whichever one does not
# apply stays None.
posix = None
nt = None
if os.name == 'posix':
    import posix
elif _WINDOWS:
    import nt

# Default chunk size for the read()/write() based copy loops:
# 1 MiB on Windows, 64 KiB everywhere else.
if _WINDOWS:
    COPY_BUFSIZE = 1024 * 1024
else:
    COPY_BUFSIZE = 64 * 1024
# The sendfile() fast path is only attempted on Linux.
_USE_CP_SENDFILE = sys.platform.startswith("linux") and hasattr(os, "sendfile")
_HAS_FCOPYFILE = posix and hasattr(posix, "_fcopyfile")  # macOS
Giampaolo Rodola4a172cc2018-06-12 23:04:50 +020055
Tarek Ziadéc3399782010-02-23 05:39:18 +000056__all__ = ["copyfileobj", "copyfile", "copymode", "copystat", "copy", "copy2",
57 "copytree", "move", "rmtree", "Error", "SpecialFileError",
58 "ExecError", "make_archive", "get_archive_formats",
Tarek Ziadé6ac91722010-04-28 17:51:36 +000059 "register_archive_format", "unregister_archive_format",
60 "get_unpack_formats", "register_unpack_format",
Éric Araujoc5efe652011-08-21 14:30:00 +020061 "unregister_unpack_format", "unpack_archive",
Berker Peksag8083cd62014-11-01 11:04:06 +020062 "ignore_patterns", "chown", "which", "get_terminal_size",
63 "SameFileError"]
Éric Araujoe4d5b8e2011-08-08 16:51:11 +020064 # disk_usage is added later, if available on the platform
Martin v. Löwise9ce0b02002-10-07 13:23:24 +000065
class Error(OSError):
    """Generic error raised by the functions in this module."""
Guido van Rossumc6360141990-10-13 19:23:40 +000068
class SameFileError(Error):
    """Signals that the source and the destination refer to the same file."""
71
class SpecialFileError(OSError):
    """Signals that an operation (e.g. copying) was attempted on a special
    file (e.g. a named pipe) that does not support it."""
75
class ExecError(OSError):
    """Signals that a command could not be executed."""
78
class ReadError(OSError):
    """Signals that an archive cannot be read."""
81
class RegistryError(Exception):
    """Signals that an operation on the archiving or unpacking
    registries failed."""
Tarek Ziadé6ac91722010-04-28 17:51:36 +000085
class _GiveupOnFastCopy(Exception):
    """Internal signal: a fast-copy function could not do the job, so the
    caller should fall back on a plain read()/write() file copy.
    """
Tarek Ziadé6ac91722010-04-28 17:51:36 +000090
def _fastcopy_fcopyfile(fsrc, fdst, flags):
    """Copy a regular file's content or metadata via posix._fcopyfile()
    (the fcopyfile(3) syscall on macOS).

    *fsrc* and *fdst* are open file objects; *flags* is handed to
    posix._fcopyfile() unchanged.

    Raises _GiveupOnFastCopy when either object has no usable file
    descriptor, or when the call fails with EINVAL or ENOTSUP.  Any other
    OSError is re-raised with filename/filename2 set to the two file names.
    """
    try:
        src_fd, dst_fd = fsrc.fileno(), fdst.fileno()
    except Exception as exc:
        raise _GiveupOnFastCopy(exc)  # not a regular file

    try:
        posix._fcopyfile(src_fd, dst_fd, flags)
    except OSError as exc:
        # Attach both names so the error is more informative.
        exc.filename = fsrc.name
        exc.filename2 = fdst.name
        if exc.errno not in {errno.EINVAL, errno.ENOTSUP}:
            raise exc from None
        raise _GiveupOnFastCopy(exc)
110
def _fastcopy_sendfile(fsrc, fdst):
    """Copy data from one regular mmap-like fd to another using the
    sendfile(2) syscall through os.sendfile().

    This should work on Linux >= 2.6.33 only.

    Raises _GiveupOnFastCopy when the file objects expose no descriptor,
    when sendfile() reports ENOTSOCK (which also disables this fast path
    for the rest of the process), or when the very first call fails before
    any data was written.  Other OSErrors are re-raised with
    filename/filename2 set.
    """
    # Note: copyfileobj() is deliberately left alone so as not to introduce
    # unexpected breakage.  Risks of using zero-copy calls there include:
    # - fdst cannot be open in "a"(ppend) mode
    # - fsrc and fdst may be open in "t"(ext) mode
    # - fsrc may be a BufferedReader (which hides unread data in a buffer),
    #   GzipFile (which decompresses data), HTTPResponse (which decodes
    #   chunks).
    # - possibly others (e.g. encrypted fs/partition?)
    global _USE_CP_SENDFILE
    try:
        src_fd = fsrc.fileno()
        dst_fd = fdst.fileno()
    except Exception as exc:
        raise _GiveupOnFastCopy(exc)  # not a regular file

    # Ideally the whole file goes through in one call.  sendfile() is
    # invoked in a loop until it reports EOF (returns 0), so a block size
    # smaller or larger than the real file size makes no difference, even
    # if the file content changes while being copied.
    try:
        chunk = max(os.fstat(src_fd).st_size, 2 ** 23)  # min 8MiB
    except OSError:
        chunk = 2 ** 27  # 128MiB
    # On 32-bit architectures truncate to 1GiB to avoid OverflowError,
    # see bpo-38319.
    if sys.maxsize < 2 ** 32:
        chunk = min(chunk, 2 ** 30)

    position = 0
    while True:
        try:
            written = os.sendfile(dst_fd, src_fd, position, chunk)
        except OSError as exc:
            # ...in order to have a more informative exception.
            exc.filename = fsrc.name
            exc.filename2 = fdst.name

            if exc.errno == errno.ENOTSOCK:
                # sendfile() on this platform (probably Linux < 2.6.33)
                # does not support copies between regular files (only
                # sockets).
                _USE_CP_SENDFILE = False
                raise _GiveupOnFastCopy(exc)

            if exc.errno == errno.ENOSPC:  # filesystem is full
                raise exc from None

            # Give up on first call and if no data was copied.
            if position == 0 and os.lseek(dst_fd, 0, os.SEEK_CUR) == 0:
                raise _GiveupOnFastCopy(exc)

            raise exc
        if written == 0:
            break  # EOF
        position += written
174
def _copyfileobj_readinto(fsrc, fdst, length=COPY_BUFSIZE):
    """Variant of copyfileobj() built on readinto() and a reusable
    memoryview buffer.

    *fsrc* must provide a readinto() method and both files must be open
    in binary mode.  *length* is the size of the buffer in bytes.
    """
    # Bind the bound methods once to keep per-iteration overhead low.
    read_into = fsrc.readinto
    write_full = fdst.write
    with memoryview(bytearray(length)) as buf:
        while True:
            count = read_into(buf)
            if not count:
                return
            if count < length:
                # Short read: write only the part of the buffer that
                # was actually filled.
                with buf[:count] as filled:
                    fdst.write(filled)
            else:
                write_full(buf)
193
def copyfileobj(fsrc, fdst, length=0):
    """Copy data from file-like object fsrc to file-like object fdst.

    Data is moved in chunks of *length*; a falsy *length* (the default)
    selects COPY_BUFSIZE.  Copying stops at the first empty read.
    """
    chunk_size = length if length else COPY_BUFSIZE
    # Localize variable access to minimize overhead.
    read = fsrc.read
    write = fdst.write
    data = read(chunk_size)
    while data:
        write(data)
        data = read(chunk_size)
Greg Stein42bb8b32000-07-12 09:55:30 +0000206
def _samefile(src, dst):
    """Return whether *src* and *dst* refer to the same file.

    An OSError raised while comparing is reported as "not the same"
    (False) rather than propagated.
    """
    path_mod = os.path
    try:
        # Macintosh, Unix.
        if isinstance(src, os.DirEntry) and hasattr(path_mod, 'samestat'):
            return path_mod.samestat(src.stat(), os.stat(dst))
        if hasattr(path_mod, 'samefile'):
            return path_mod.samefile(src, dst)
    except OSError:
        return False

    # All other platforms: check for same pathname.
    def canonical(name):
        return path_mod.normcase(path_mod.abspath(name))

    return canonical(src) == canonical(dst)
Tim Peters495ad3c2001-01-15 01:36:40 +0000224
def _stat(fn):
    """Return stat information for *fn*, using the entry's own stat()
    when *fn* is an os.DirEntry and os.stat() otherwise."""
    if isinstance(fn, os.DirEntry):
        return fn.stat()
    return os.stat(fn)
227
def _islink(fn):
    """Return whether *fn* is a symbolic link, using is_symlink() when
    *fn* is an os.DirEntry and os.path.islink() otherwise."""
    if isinstance(fn, os.DirEntry):
        return fn.is_symlink()
    return os.path.islink(fn)
230
def copyfile(src, dst, *, follow_symlinks=True):
    """Copy the data of src to dst as efficiently as possible and return dst.

    When follow_symlinks is false and src is a symbolic link, a new
    symlink is created at dst instead of copying the file it points to.

    Raises SameFileError if src and dst are the same file, and
    SpecialFileError if either one is a named pipe.

    """
    if _samefile(src, dst):
        raise SameFileError("{!r} and {!r} are the same file".format(src, dst))

    src_size = 0
    for index, candidate in enumerate((src, dst)):
        try:
            info = _stat(candidate)
        except OSError:
            # File most likely does not exist
            continue
        # XXX What about other special files? (sockets, devices...)
        if stat.S_ISFIFO(info.st_mode):
            shown = candidate.path if isinstance(candidate, os.DirEntry) else candidate
            raise SpecialFileError("`%s` is a named pipe" % shown)
        if index == 0 and _WINDOWS:
            # Only the source size matters; it sizes the Windows buffer.
            src_size = info.st_size

    if not follow_symlinks and _islink(src):
        os.symlink(os.readlink(src), dst)
        return dst

    with open(src, 'rb') as fsrc, open(dst, 'wb') as fdst:
        if _HAS_FCOPYFILE or _USE_CP_SENDFILE:
            try:
                if _HAS_FCOPYFILE:
                    # macOS
                    _fastcopy_fcopyfile(fsrc, fdst, posix._COPYFILE_DATA)
                else:
                    # Linux
                    _fastcopy_sendfile(fsrc, fdst)
            except _GiveupOnFastCopy:
                # Fall through to the generic read()/write() loop below.
                pass
            else:
                return dst
        # Windows, see:
        # https://github.com/python/cpython/pull/7160#discussion_r195405230
        elif _WINDOWS and src_size > 0:
            _copyfileobj_readinto(fsrc, fdst, min(src_size, COPY_BUFSIZE))
            return dst

        copyfileobj(fsrc, fdst)

    return dst
Guido van Rossumc6360141990-10-13 19:23:40 +0000283
def copymode(src, dst, *, follow_symlinks=True):
    """Copy the permission mode bits from src to dst.

    Symlinks are left unfollowed only when follow_symlinks is false and
    both `src` and `dst` are symlinks.  In that case, if `os.lchmod` does
    not exist (e.g. Linux), this function does nothing.

    """
    both_links = (not follow_symlinks and _islink(src)
                  and os.path.islink(dst))
    if not both_links:
        read_stat, apply_mode = _stat, os.chmod
    elif hasattr(os, 'lchmod'):
        read_stat, apply_mode = os.lstat, os.lchmod
    else:
        # No way to chmod the link itself on this platform.
        return

    apply_mode(dst, stat.S_IMODE(read_stat(src).st_mode))
302
if not hasattr(os, 'listxattr'):
    def _copyxattr(*args, **kwargs):
        """No-op stand-in used where os.listxattr is unavailable."""
        pass
else:
    def _copyxattr(src, dst, *, follow_symlinks=True):
        """Copy extended filesystem attributes from `src` to `dst`.

        Attributes already present on `dst` are overwritten.

        When `follow_symlinks` is false, symlinks are not followed.

        Listing failures with ENOTSUP, ENODATA or EINVAL end the copy
        silently; per-attribute failures with EPERM, ENOTSUP, ENODATA or
        EINVAL skip that attribute.  Other OSErrors propagate.

        """
        try:
            attr_names = os.listxattr(src, follow_symlinks=follow_symlinks)
        except OSError as exc:
            if exc.errno in (errno.ENOTSUP, errno.ENODATA, errno.EINVAL):
                return
            raise
        for attr in attr_names:
            try:
                payload = os.getxattr(src, attr,
                                      follow_symlinks=follow_symlinks)
                os.setxattr(dst, attr, payload,
                            follow_symlinks=follow_symlinks)
            except OSError as exc:
                if exc.errno in (errno.EPERM, errno.ENOTSUP, errno.ENODATA,
                                 errno.EINVAL):
                    continue
                raise
330
def copystat(src, dst, *, follow_symlinks=True):
    """Copy file metadata from `src` to `dst`.

    The permission bits, last access time, last modification time and
    flags are copied.  On Linux the "extended attributes" are copied too
    where possible.  File contents, owner and group are left untouched.
    `src` and `dst` are path-like objects or path names given as strings.

    Symlinks are left unfollowed only when the optional `follow_symlinks`
    flag is false and both `src` and `dst` are symlinks.
    """
    def _nop(*args, ns=None, follow_symlinks=None):
        pass

    # follow symlinks (aka don't not follow symlinks)
    follow = follow_symlinks or (not _islink(src) or not os.path.islink(dst))

    def lookup(name):
        # When following symlinks any existing os function will do.  When
        # not following, it must also support follow_symlinks; otherwise
        # the no-op is substituted.
        func = getattr(os, name, _nop)
        if follow or func in os.supports_follow_symlinks:
            return func
        return _nop

    if isinstance(src, os.DirEntry):
        st = src.stat(follow_symlinks=follow)
    else:
        st = lookup("stat")(src, follow_symlinks=follow)
    mode = stat.S_IMODE(st.st_mode)
    lookup("utime")(dst, ns=(st.st_atime_ns, st.st_mtime_ns),
                    follow_symlinks=follow)
    # Extended attributes must be copied before the file is (potentially)
    # chmod()'ed read-only, otherwise setxattr() will error with -EACCES.
    _copyxattr(src, dst, follow_symlinks=follow)
    try:
        lookup("chmod")(dst, mode, follow_symlinks=follow)
    except NotImplementedError:
        # NOTE(review): presumably raised when follow_symlinks=False and
        # the platform has no way to change the mode of the symlink
        # itself.  There is nothing else to try, so the error is
        # suppressed (which is what shutil always did here).
        pass
    if hasattr(st, 'st_flags'):
        try:
            lookup("chflags")(dst, st.st_flags, follow_symlinks=follow)
        except OSError as exc:
            # Tolerate "operation not supported"; re-raise anything else.
            tolerated = {getattr(errno, code)
                         for code in ('EOPNOTSUPP', 'ENOTSUP')
                         if hasattr(errno, code)}
            if exc.errno not in tolerated:
                raise
Antoine Pitrou424246f2012-05-12 19:02:01 +0200394
def copy(src, dst, *, follow_symlinks=True):
    """Copy data and mode bits ("cp src dst") and return the destination.

    If dst is a directory, the file is placed inside it under the base
    name of src.

    With follow_symlinks false, symlinks are not followed, which
    resembles GNU's "cp -P src dst".

    A SameFileError is raised when source and destination are the same
    file.

    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    copyfile(src, target, follow_symlinks=follow_symlinks)
    copymode(src, target, follow_symlinks=follow_symlinks)
    return target
Guido van Rossumc6360141990-10-13 19:23:40 +0000412
def copy2(src, dst, *, follow_symlinks=True):
    """Copy data and metadata and return the destination.

    The metadata is transferred with copystat(); see that function for
    details.

    If dst is a directory, the file is placed inside it under the base
    name of src.

    With follow_symlinks false, symlinks are not followed, which
    resembles GNU's "cp -P src dst".
    """
    target = dst
    if os.path.isdir(target):
        target = os.path.join(target, os.path.basename(src))
    copyfile(src, target, follow_symlinks=follow_symlinks)
    copystat(src, target, follow_symlinks=follow_symlinks)
    return target
Guido van Rossumc6360141990-10-13 19:23:40 +0000429
def ignore_patterns(*patterns):
    """Build a callable suitable for the copytree() ignore parameter.

    *patterns* are glob-style patterns; the returned callable yields the
    set of names matching any of them, i.e. the files to exclude."""
    def _ignore_patterns(path, names):
        matched = set()
        for pattern in patterns:
            matched.update(fnmatch.filter(names, pattern))
        return matched
    return _ignore_patterns
441
def _copytree(entries, src, dst, symlinks, ignore, copy_function,
              ignore_dangling_symlinks, dirs_exist_ok=False):
    """Copy the directory entries of *src* into *dst*; helper for copytree().

    *entries* is an iterable of os.DirEntry objects for *src*.  The other
    parameters have the same meaning as in copytree() and are forwarded
    unchanged to the recursive copytree() calls made for sub-directories.

    Per-entry failures are collected rather than aborting the copy; if any
    were collected, an Error carrying the list of
    (srcname, dstname, message) tuples is raised at the end.  Returns *dst*
    on success.
    """
    if ignore is not None:
        ignored_names = ignore(src, set(os.listdir(src)))
    else:
        ignored_names = set()

    os.makedirs(dst, exist_ok=dirs_exist_ok)
    errors = []
    # The built-in copy functions accept DirEntry objects, which saves
    # stat calls; custom copy functions get plain path names.
    use_srcentry = copy_function is copy2 or copy_function is copy

    for srcentry in entries:
        if srcentry.name in ignored_names:
            continue
        srcname = os.path.join(src, srcentry.name)
        dstname = os.path.join(dst, srcentry.name)
        srcobj = srcentry if use_srcentry else srcname
        try:
            is_symlink = srcentry.is_symlink()
            if is_symlink and os.name == 'nt':
                # Special check for directory junctions, which appear as
                # symlinks but we want to recurse.
                lstat = srcentry.stat(follow_symlinks=False)
                if lstat.st_reparse_tag == stat.IO_REPARSE_TAG_MOUNT_POINT:
                    is_symlink = False
            if is_symlink:
                linkto = os.readlink(srcname)
                if symlinks:
                    # We can't just leave it to `copy_function` because legacy
                    # code with a custom `copy_function` may rely on copytree
                    # doing the right thing.
                    os.symlink(linkto, dstname)
                    copystat(srcobj, dstname, follow_symlinks=not symlinks)
                else:
                    # Ignore dangling symlink if the flag is on.  The check
                    # goes through the link itself (os.path.exists follows
                    # symlinks) so that a relative target is resolved
                    # against the link's directory, not the current
                    # working directory.
                    if ignore_dangling_symlinks and not os.path.exists(srcname):
                        continue
                    # otherwise let the copy occur. copy2 will raise an error
                    if srcentry.is_dir():
                        copytree(srcobj, dstname, symlinks, ignore,
                                 copy_function,
                                 ignore_dangling_symlinks=ignore_dangling_symlinks,
                                 dirs_exist_ok=dirs_exist_ok)
                    else:
                        copy_function(srcobj, dstname)
            elif srcentry.is_dir():
                # Forward ignore_dangling_symlinks so the flag also applies
                # to nested directories.
                copytree(srcobj, dstname, symlinks, ignore, copy_function,
                         ignore_dangling_symlinks=ignore_dangling_symlinks,
                         dirs_exist_ok=dirs_exist_ok)
            else:
                # Will raise a SpecialFileError for unsupported file types
                copy_function(srcobj, dstname)
        # catch the Error from the recursive copytree so that we can
        # continue with other files
        except Error as err:
            errors.extend(err.args[0])
        except OSError as why:
            errors.append((srcname, dstname, str(why)))
    try:
        copystat(src, dst)
    except OSError as why:
        # Copying file access times may fail on Windows
        if getattr(why, 'winerror', None) is None:
            errors.append((src, dst, str(why)))
    if errors:
        raise Error(errors)
    return dst
506
def copytree(src, dst, symlinks=False, ignore=None, copy_function=copy2,
             ignore_dangling_symlinks=False, dirs_exist_ok=False):
    """Recursively copy the directory tree at src to dst and return dst.

    dirs_exist_ok controls whether an exception is raised when dst (or a
    directory that has to be created on the way) already exists.

    Failures are collected during the copy; if there were any, an Error
    holding the list of reasons is raised.

    When the optional symlinks flag is true, symbolic links in the source
    tree are reproduced as symbolic links in the destination tree.  When
    it is false, the contents of the files the links point to are copied.
    If a link's target does not exist, an exception is added to the list
    of errors raised in the Error at the end of the copy process.

    Set the optional ignore_dangling_symlinks flag to true to silence
    that exception.  Note that this has no effect on platforms that do
    not support os.symlink.

    The optional ignore argument is a callable.  If given, it is called
    with the `src` parameter, which is the directory currently being
    visited by copytree(), and `names`, which is the list of `src`
    contents as returned by os.listdir():

        callable(src, names) -> ignored_names

    Because copytree() recurses, the callable is invoked once for every
    directory that is copied.  It returns a list of names, relative to
    the `src` directory, that must not be copied.

    The optional copy_function argument is a callable used to copy each
    file.  It is called with the source path and the destination path as
    arguments.  copy2() is the default, but any function with the same
    signature (such as copy()) can be used.

    """
    sys.audit("shutil.copytree", src, dst)
    with os.scandir(src) as scan:
        return _copytree(scan, src, dst, symlinks, ignore, copy_function,
                         ignore_dangling_symlinks, dirs_exist_ok)
Guido van Rossumd7673291998-02-06 21:38:09 +0000551
if hasattr(os.stat_result, 'st_file_attributes'):
    # Special handling for directory junctions to make them behave like
    # symlinks for shutil.rmtree, since in general they do not appear as
    # regular links.
    def _rmtree_is_junction(st):
        # Truthy when the stat result describes a reparse point whose tag
        # is IO_REPARSE_TAG_MOUNT_POINT.
        return (st.st_file_attributes & stat.FILE_ATTRIBUTE_REPARSE_POINT
                and st.st_reparse_tag == stat.IO_REPARSE_TAG_MOUNT_POINT)

    def _rmtree_isdir(entry):
        """Report whether *entry* is a real directory, i.e. a directory
        that is not a junction.  An OSError counts as "no"."""
        try:
            info = entry.stat(follow_symlinks=False)
            return stat.S_ISDIR(info.st_mode) and not _rmtree_is_junction(info)
        except OSError:
            return False

    def _rmtree_islink(path):
        """Report whether *path* is a symlink or a junction.  An OSError
        counts as "no"."""
        try:
            info = os.lstat(path)
            return stat.S_ISLNK(info.st_mode) or _rmtree_is_junction(info)
        except OSError:
            return False
else:
    def _rmtree_isdir(entry):
        """Report whether *entry* is a directory, without following
        symlinks.  An OSError counts as "no"."""
        try:
            return entry.is_dir(follow_symlinks=False)
        except OSError:
            return False

    def _rmtree_islink(path):
        """Report whether *path* is a symbolic link."""
        return os.path.islink(path)
582
# version vulnerable to race conditions
def _rmtree_unsafe(path, onerror):
    """Remove the directory tree rooted at *path* using path-based calls.

    Every OSError is reported through onerror(function, path, exc_info)
    instead of being raised here; processing then continues with the next
    entry.
    """
    try:
        with os.scandir(path) as scan:
            children = list(scan)
    except OSError:
        onerror(os.scandir, path, sys.exc_info())
        children = []

    for child in children:
        child_path = child.path
        if not _rmtree_isdir(child):
            try:
                os.unlink(child_path)
            except OSError:
                onerror(os.unlink, child_path, sys.exc_info())
            continue

        try:
            if child.is_symlink():
                # This can only happen if someone replaces
                # a directory with a symlink after the call to
                # os.scandir or entry.is_dir above.
                raise OSError("Cannot call rmtree on a symbolic link")
        except OSError:
            onerror(os.path.islink, child_path, sys.exc_info())
            continue
        _rmtree_unsafe(child_path, onerror)

    try:
        os.rmdir(path)
    except OSError:
        onerror(os.rmdir, path, sys.exc_info())
Guido van Rossumd7673291998-02-06 21:38:09 +0000613
# Version using fd-based APIs to protect against races
def _rmtree_safe_fd(topfd, path, onerror):
    """Remove everything inside the directory open as *topfd*.

    *path* is the name of that directory and is only used to build the
    paths reported to *onerror*.  Every OSError is reported through
    onerror(function, path, exc_info) instead of being raised here.  The
    directory behind *topfd* itself is not removed.
    """
    try:
        with os.scandir(topfd) as scan:
            children = list(scan)
    except OSError as err:
        err.filename = path
        onerror(os.scandir, path, sys.exc_info())
        return

    for child in children:
        child_path = os.path.join(path, child.name)
        try:
            is_dir = child.is_dir(follow_symlinks=False)
        except OSError:
            is_dir = False
        if is_dir:
            # Remember the stat result so it can be compared against the
            # descriptor opened below.
            try:
                orig_st = child.stat(follow_symlinks=False)
                is_dir = stat.S_ISDIR(orig_st.st_mode)
            except OSError:
                onerror(os.lstat, child_path, sys.exc_info())
                continue

        if not is_dir:
            try:
                os.unlink(child.name, dir_fd=topfd)
            except OSError:
                onerror(os.unlink, child_path, sys.exc_info())
            continue

        try:
            dirfd = os.open(child.name, os.O_RDONLY, dir_fd=topfd)
        except OSError:
            onerror(os.open, child_path, sys.exc_info())
            continue

        try:
            if os.path.samestat(orig_st, os.fstat(dirfd)):
                _rmtree_safe_fd(dirfd, child_path, onerror)
                try:
                    os.rmdir(child.name, dir_fd=topfd)
                except OSError:
                    onerror(os.rmdir, child_path, sys.exc_info())
            else:
                try:
                    # This can only happen if someone replaces
                    # a directory with a symlink after the call to
                    # os.scandir or stat.S_ISDIR above.
                    raise OSError("Cannot call rmtree on a symbolic "
                                  "link")
                except OSError:
                    onerror(os.path.islink, child_path, sys.exc_info())
        finally:
            os.close(dirfd)
Hynek Schlawack67be92b2012-06-23 17:58:42 +0200666
# True only when the platform provides everything the fd-based rmtree needs:
# dir_fd support in os.open/os.stat/os.unlink/os.rmdir, os.scandir() on a
# file descriptor, and follow_symlinks support in os.stat.
_use_fd_functions = ({os.open, os.stat, os.unlink, os.rmdir} <=
                     os.supports_dir_fd and
                     os.scandir in os.supports_fd and
                     os.stat in os.supports_follow_symlinks)
Nick Coghlan5b0eca12012-06-24 16:43:06 +1000671
def rmtree(path, ignore_errors=False, onerror=None):
    """Recursively delete a directory tree.

    If ignore_errors is set, errors are ignored; otherwise, if onerror
    is set, it is called to handle the error with arguments (func,
    path, exc_info) where func is platform and implementation dependent;
    path is the argument to that function that caused it to fail; and
    exc_info is a tuple returned by sys.exc_info().  If ignore_errors
    is false and onerror is None, an exception is raised.

    Calling rmtree on a symbolic link is refused: the failure is reported
    through onerror and nothing is deleted.
    """
    sys.audit("shutil.rmtree", path)
    if ignore_errors:
        def onerror(*args):
            pass
    elif onerror is None:
        def onerror(*args):
            # Called from inside an "except" block, so a bare raise
            # re-raises the exception currently being handled.
            raise
    if _use_fd_functions:
        # While the unsafe rmtree works fine on bytes, the fd based does not.
        if isinstance(path, bytes):
            path = os.fsdecode(path)
        # Note: To guard against symlink races, we use the standard
        # lstat()/open()/fstat() trick.
        try:
            orig_st = os.lstat(path)
        except Exception:
            onerror(os.lstat, path, sys.exc_info())
            return
        try:
            fd = os.open(path, os.O_RDONLY)
        except Exception:
            # Report the function that actually failed (os.open, not
            # os.lstat) so onerror handlers can tell the two apart.
            onerror(os.open, path, sys.exc_info())
            return
        try:
            if os.path.samestat(orig_st, os.fstat(fd)):
                _rmtree_safe_fd(fd, path, onerror)
                try:
                    os.rmdir(path)
                except OSError:
                    onerror(os.rmdir, path, sys.exc_info())
            else:
                try:
                    # symlinks to directories are forbidden, see bug #1669
                    raise OSError("Cannot call rmtree on a symbolic link")
                except OSError:
                    onerror(os.path.islink, path, sys.exc_info())
        finally:
            os.close(fd)
    else:
        try:
            if _rmtree_islink(path):
                # symlinks to directories are forbidden, see bug #1669
                raise OSError("Cannot call rmtree on a symbolic link")
        except OSError:
            onerror(os.path.islink, path, sys.exc_info())
            # can't continue even if onerror hook returns
            return
        return _rmtree_unsafe(path, onerror)
731
# Allow introspection of whether or not the hardening against symlink
# attacks is supported on the current platform: the attribute is true
# exactly when rmtree() takes its fd-based code path.
rmtree.avoids_symlink_attacks = _use_fd_functions
Martin v. Löwise9ce0b02002-10-07 13:23:24 +0000735
Christian Heimesada8c3b2008-03-18 18:26:33 +0000736def _basename(path):
Maxwell A McKinnoncf57cab2019-09-30 19:41:16 -0700737 """A basename() variant which first strips the trailing slash, if present.
738 Thus we always get the last component of the path, even for directories.
739
740 path: Union[PathLike, str]
741
742 e.g.
743 >>> os.path.basename('/bar/foo')
744 'foo'
745 >>> os.path.basename('/bar/foo/')
746 ''
747 >>> _basename('/bar/foo/')
748 'foo'
749 """
750 path = os.fspath(path)
Serhiy Storchaka3a308b92014-02-11 10:30:59 +0200751 sep = os.path.sep + (os.path.altsep or '')
752 return os.path.basename(path.rstrip(sep))
Christian Heimesada8c3b2008-03-18 18:26:33 +0000753
def move(src, dst, copy_function=copy2):
    """Recursively move a file or directory to another location. This is
    similar to the Unix "mv" command. Return the file or directory's
    destination.

    If the destination is a directory or a symlink to a directory, the source
    is moved inside the directory. The destination path must not already
    exist.

    If the destination already exists but is not a directory, it may be
    overwritten depending on os.rename() semantics.

    If the destination is on our current filesystem, then rename() is used.
    Otherwise, src is copied to the destination and then removed. Symlinks are
    recreated under the new name if os.rename() fails because of cross
    filesystem renames.

    The optional `copy_function` argument is a callable that will be used
    to copy the source or it will be delegated to `copytree`.
    By default, copy2() is used, but any function that supports the same
    signature (like copy()) can be used.

    Raises Error if the computed destination inside an existing directory
    already exists, or if a directory would be moved into itself.

    A lot more could be done here...  A look at a mv.c shows a lot of
    the issues this implementation glosses over.

    """
    real_dst = dst
    if os.path.isdir(dst):
        if _samefile(src, dst):
            # We might be on a case insensitive filesystem,
            # perform the rename anyway.
            os.rename(src, dst)
            # Honour the documented contract: always return the destination
            # (this branch used to fall through to a bare "return").
            return real_dst

        # Using _basename instead of os.path.basename is important, as we must
        # ignore any trailing slash to avoid the basename returning ''
        real_dst = os.path.join(dst, _basename(src))

        if os.path.exists(real_dst):
            raise Error("Destination path '%s' already exists" % real_dst)
    try:
        os.rename(src, real_dst)
    except OSError:
        # rename() failed (e.g. across filesystems): copy, then delete.
        if os.path.islink(src):
            linkto = os.readlink(src)
            os.symlink(linkto, real_dst)
            os.unlink(src)
        elif os.path.isdir(src):
            if _destinsrc(src, dst):
                raise Error("Cannot move a directory '%s' into itself"
                            " '%s'." % (src, dst))
            copytree(src, real_dst, copy_function=copy_function,
                     symlinks=True)
            rmtree(src)
        else:
            copy_function(src, real_dst)
            os.unlink(src)
    return real_dst
Brett Cannon1c3fa182004-06-19 21:11:35 +0000812
Benjamin Peterson247a9b82009-02-20 04:09:19 +0000813def _destinsrc(src, dst):
Berker Peksag3715da52014-09-18 05:11:15 +0300814 src = os.path.abspath(src)
815 dst = os.path.abspath(dst)
Antoine Pitrou0dcc3cd2009-01-29 20:26:59 +0000816 if not src.endswith(os.path.sep):
817 src += os.path.sep
818 if not dst.endswith(os.path.sep):
819 dst += os.path.sep
820 return dst.startswith(src)
Tarek Ziadé396fad72010-02-23 05:30:31 +0000821
822def _get_gid(name):
823 """Returns a gid, given a group name."""
824 if getgrnam is None or name is None:
825 return None
826 try:
827 result = getgrnam(name)
828 except KeyError:
829 result = None
830 if result is not None:
831 return result[2]
832 return None
833
834def _get_uid(name):
835 """Returns an uid, given a user name."""
836 if getpwnam is None or name is None:
837 return None
838 try:
839 result = getpwnam(name)
840 except KeyError:
841 result = None
842 if result is not None:
843 return result[2]
844 return None
845
def _make_tarball(base_name, base_dir, compress="gzip", verbose=0, dry_run=0,
                  owner=None, group=None, logger=None):
    """Build a tar archive (optionally compressed) of everything in 'base_dir'.

    'compress' selects the compression: "gzip" (the default), "bzip2", "xz",
    or None for a plain tar file.  A ValueError is raised for any other
    value, or when the required compression module is not available.

    'owner' and 'group' name the user and group recorded for the archive
    members.  Names that cannot be resolved to an id are ignored and the
    members keep the ownership tarfile recorded for them.

    The archive is written to 'base_name' + ".tar" plus the compression
    extension (".gz", ".bz2" or ".xz"), and that file name is returned.
    With 'dry_run' set nothing is written to disk.
    """
    if compress is None:
        tar_compression = ''
    else:
        # (value accepted for 'compress', module available?, tarfile suffix)
        candidates = (
            ('gzip', _ZLIB_SUPPORTED, 'gz'),
            ('bzip2', _BZ2_SUPPORTED, 'bz2'),
            ('xz', _LZMA_SUPPORTED, 'xz'),
        )
        for method, available, suffix in candidates:
            if available and compress == method:
                tar_compression = suffix
                break
        else:
            raise ValueError("bad value for 'compress', or compression format not "
                             "supported : {0}".format(compress))

    import tarfile  # late import for breaking circular dependency

    archive_name = base_name + '.tar'
    if compress:
        archive_name = archive_name + '.' + tar_compression

    target_dir = os.path.dirname(archive_name)
    if target_dir and not os.path.exists(target_dir):
        if logger is not None:
            logger.info("creating %s", target_dir)
        if not dry_run:
            os.makedirs(target_dir)

    # creating the tarball
    if logger is not None:
        logger.info('Creating tar archive')

    uid = _get_uid(owner)
    gid = _get_gid(group)

    def _apply_ownership(member):
        # tarfile filter: override ownership only for ids that resolved.
        if gid is not None:
            member.gid = gid
            member.gname = group
        if uid is not None:
            member.uid = uid
            member.uname = owner
        return member

    if dry_run:
        return archive_name

    tar = tarfile.open(archive_name, 'w|%s' % tar_compression)
    try:
        tar.add(base_dir, filter=_apply_ownership)
    finally:
        tar.close()
    return archive_name
910
Tarek Ziadé396fad72010-02-23 05:30:31 +0000911def _make_zipfile(base_name, base_dir, verbose=0, dry_run=0, logger=None):
912 """Create a zip file from all the files under 'base_dir'.
913
Serhiy Storchaka20cdffd2016-12-16 18:58:33 +0200914 The output zip file will be named 'base_name' + ".zip". Returns the
915 name of the output zip file.
Tarek Ziadé396fad72010-02-23 05:30:31 +0000916 """
Serhiy Storchaka20cdffd2016-12-16 18:58:33 +0200917 import zipfile # late import for breaking circular dependency
Andrew Kuchlinga0934b22014-03-20 16:11:16 -0400918
Tarek Ziadé396fad72010-02-23 05:30:31 +0000919 zip_filename = base_name + ".zip"
920 archive_dir = os.path.dirname(base_name)
921
Serhiy Storchaka9a4fc192014-11-28 00:48:46 +0200922 if archive_dir and not os.path.exists(archive_dir):
Tarek Ziadé396fad72010-02-23 05:30:31 +0000923 if logger is not None:
924 logger.info("creating %s", archive_dir)
925 if not dry_run:
926 os.makedirs(archive_dir)
927
Andrew Kuchlinga0934b22014-03-20 16:11:16 -0400928 if logger is not None:
929 logger.info("creating '%s' and adding '%s' to it",
930 zip_filename, base_dir)
Tarek Ziadé396fad72010-02-23 05:30:31 +0000931
Andrew Kuchlinga0934b22014-03-20 16:11:16 -0400932 if not dry_run:
933 with zipfile.ZipFile(zip_filename, "w",
934 compression=zipfile.ZIP_DEFLATED) as zf:
Serhiy Storchakad941d7a2015-09-08 05:51:00 +0300935 path = os.path.normpath(base_dir)
Serhiy Storchaka666de772016-10-23 15:55:09 +0300936 if path != os.curdir:
937 zf.write(path, path)
938 if logger is not None:
939 logger.info("adding '%s'", path)
Andrew Kuchlinga0934b22014-03-20 16:11:16 -0400940 for dirpath, dirnames, filenames in os.walk(base_dir):
Serhiy Storchakad941d7a2015-09-08 05:51:00 +0300941 for name in sorted(dirnames):
942 path = os.path.normpath(os.path.join(dirpath, name))
943 zf.write(path, path)
944 if logger is not None:
945 logger.info("adding '%s'", path)
Andrew Kuchlinga0934b22014-03-20 16:11:16 -0400946 for name in filenames:
947 path = os.path.normpath(os.path.join(dirpath, name))
948 if os.path.isfile(path):
949 zf.write(path, path)
950 if logger is not None:
951 logger.info("adding '%s'", path)
Tarek Ziadé396fad72010-02-23 05:30:31 +0000952
953 return zip_filename
954
# Registry of archive creators, keyed by format name.  Each value is a
# (function, extra_args, description) tuple, where extra_args is a list of
# (keyword, value) pairs passed to the function by make_archive().
_ARCHIVE_FORMATS = {
    'tar':   (_make_tarball, [('compress', None)], "uncompressed tar file"),
}

# The remaining formats are registered only when the compression module
# they need could be imported.
if _ZLIB_SUPPORTED:
    _ARCHIVE_FORMATS['gztar'] = (_make_tarball, [('compress', 'gzip')],
                                "gzip'ed tar-file")
    _ARCHIVE_FORMATS['zip'] = (_make_zipfile, [], "ZIP file")

if _BZ2_SUPPORTED:
    _ARCHIVE_FORMATS['bztar'] = (_make_tarball, [('compress', 'bzip2')],
                                "bzip2'ed tar-file")

if _LZMA_SUPPORTED:
    _ARCHIVE_FORMATS['xztar'] = (_make_tarball, [('compress', 'xz')],
                                "xz'ed tar-file")
971
def get_archive_formats():
    """Return the formats that make_archive() can currently create.

    The result is a sorted list of (name, description) tuples, one per
    registered archive format.
    """
    return sorted((name, entry[2])
                  for name, entry in _ARCHIVE_FORMATS.items())
981
def register_archive_format(name, function, extra_args=None, description=''):
    """Registers an archive format.

    name is the name of the format. function is the callable that will be
    used to create archives. If provided, extra_args is a sequence of
    (name, value) tuples that will be passed as arguments to the callable.
    description can be provided to describe the format, and will be returned
    by the get_archive_formats() function.

    Raises TypeError if function is not callable, if extra_args is not a
    tuple or list, or if one of its elements is not a 2-item tuple or list.
    An existing registration under the same name is replaced.
    """
    if extra_args is None:
        extra_args = []
    if not callable(function):
        # Wrap the value in a 1-tuple: a bare tuple on the right-hand side of
        # % would be unpacked as the format arguments and produce a
        # misleading "not all arguments converted" message instead.
        raise TypeError('The %s object is not callable' % (function,))
    if not isinstance(extra_args, (tuple, list)):
        raise TypeError('extra_args needs to be a sequence')
    for element in extra_args:
        if not isinstance(element, (tuple, list)) or len(element) != 2:
            raise TypeError('extra_args elements are : (arg_name, value)')

    _ARCHIVE_FORMATS[name] = (function, extra_args, description)
1002
def unregister_archive_format(name):
    """Remove the archive format `name` from the registry.

    Raises KeyError if no format is registered under that name.
    """
    _ARCHIVE_FORMATS.pop(name)
1005
def make_archive(base_name, format, root_dir=None, base_dir=None, verbose=0,
                 dry_run=0, owner=None, group=None, logger=None):
    """Create an archive file (eg. zip or tar).

    'base_name' is the name of the file to create, minus any format-specific
    extension; 'format' is the archive format: one of "zip", "tar", "gztar",
    "bztar", or "xztar".  Or any other registered format.

    'root_dir' is a directory that will be the root directory of the
    archive; ie. we typically chdir into 'root_dir' before creating the
    archive.  'base_dir' is the directory where we start archiving from;
    ie. 'base_dir' will be the common prefix of all files and
    directories in the archive.  'root_dir' and 'base_dir' both default
    to the current directory.  Returns the name of the archive file.

    'owner' and 'group' are used when creating a tar archive. By default,
    uses the current owner and group.

    Raises ValueError if 'format' is not a registered archive format.
    """
    sys.audit("shutil.make_archive", base_name, format, root_dir, base_dir)

    # Resolve the format before changing directory: an unknown format must
    # not leave the process stranded in 'root_dir'.
    try:
        format_info = _ARCHIVE_FORMATS[format]
    except KeyError:
        raise ValueError("unknown archive format '%s'" % format) from None

    save_cwd = os.getcwd()
    if root_dir is not None:
        if logger is not None:
            logger.debug("changing into '%s'", root_dir)
        # Make base_name absolute first so it still refers to the same
        # location after the chdir below.
        base_name = os.path.abspath(base_name)
        if not dry_run:
            os.chdir(root_dir)

    if base_dir is None:
        base_dir = os.curdir

    kwargs = {'dry_run': dry_run, 'logger': logger}

    func = format_info[0]
    for arg, val in format_info[1]:
        kwargs[arg] = val

    # Ownership is passed to every creator except the built-in zip one.
    if format != 'zip':
        kwargs['owner'] = owner
        kwargs['group'] = group

    try:
        filename = func(base_name, base_dir, **kwargs)
    finally:
        if root_dir is not None:
            if logger is not None:
                logger.debug("changing back to '%s'", save_cwd)
            os.chdir(save_cwd)

    return filename
Tarek Ziadé6ac91722010-04-28 17:51:36 +00001060
1061
def get_unpack_formats():
    """Return the formats that unpack_archive() can currently handle.

    The result is a sorted list of (name, extensions, description) tuples,
    one per registered unpack format.
    """
    return sorted((name, entry[0], entry[3])
                  for name, entry in _UNPACK_FORMATS.items())
1072
def _check_unpack_options(extensions, function, extra_args):
    """Validate the arguments of a new unpacker registration.

    Raises RegistryError if one of `extensions` already belongs to a
    registered format, and TypeError if `function` is not callable.
    `extra_args` is accepted but not inspected.
    """
    # first make sure no other unpacker is registered for this extension
    owner_by_extension = {
        ext: format_name
        for format_name, info in _UNPACK_FORMATS.items()
        for ext in info[0]
    }

    for extension in extensions:
        if extension in owner_by_extension:
            raise RegistryError('%s is already registered for "%s"'
                                % (extension, owner_by_extension[extension]))

    if not callable(function):
        raise TypeError('The registered function must be a callable')
1089
1090
def register_unpack_format(name, extensions, function, extra_args=None,
                           description=''):
    """Register an unpack format under `name`.

    `extensions` is the list of file name extensions that identify the
    format.

    `function` is the callable used to unpack archives of this format.  It
    receives the archive to unpack and must raise ReadError when it cannot
    handle it.

    `extra_args`, when given, is a sequence of (name, value) tuples passed
    to the callable as keyword arguments.  `description` is a free-form
    text reported by get_unpack_formats().
    """
    args = [] if extra_args is None else extra_args
    _check_unpack_options(extensions, function, args)
    _UNPACK_FORMATS[name] = (extensions, function, args, description)
1112
def unregister_unpack_format(name):
    """Remove the unpack format `name` from the registry.

    Raises KeyError if no format is registered under that name.
    """
    _UNPACK_FORMATS.pop(name)
1116
1117def _ensure_directory(path):
1118 """Ensure that the parent directory of `path` exists"""
1119 dirname = os.path.dirname(path)
1120 if not os.path.isdir(dirname):
1121 os.makedirs(dirname)
1122
def _unpack_zipfile(filename, extract_dir):
    """Extract the zip archive `filename` into `extract_dir`.

    Raises ReadError if `filename` is not a zip file.  Members whose name is
    absolute or contains '..' are skipped.
    """
    import zipfile  # late import for breaking circular dependency

    if not zipfile.is_zipfile(filename):
        raise ReadError("%s is not a zip file" % filename)

    with zipfile.ZipFile(filename) as archive:
        for member in archive.infolist():
            name = member.filename

            # don't extract absolute paths or ones with .. in them
            if name.startswith('/') or '..' in name:
                continue

            target = os.path.join(extract_dir, *name.split('/'))
            if not target:
                continue

            _ensure_directory(target)
            if name.endswith('/'):
                # directory entry: creating it above was all that is needed
                continue

            # file
            payload = archive.read(member.filename)
            with open(target, 'wb') as out:
                out.write(payload)
1156
1157def _unpack_tarfile(filename, extract_dir):
Serhiy Storchaka11213772014-08-06 18:50:19 +03001158 """Unpack tar/tar.gz/tar.bz2/tar.xz `filename` to `extract_dir`
Tarek Ziadé6ac91722010-04-28 17:51:36 +00001159 """
Serhiy Storchaka20cdffd2016-12-16 18:58:33 +02001160 import tarfile # late import for breaking circular dependency
Tarek Ziadé6ac91722010-04-28 17:51:36 +00001161 try:
1162 tarobj = tarfile.open(filename)
1163 except tarfile.TarError:
1164 raise ReadError(
1165 "%s is not a compressed or uncompressed tar file" % filename)
1166 try:
1167 tarobj.extractall(extract_dir)
1168 finally:
1169 tarobj.close()
1170
# Registry of unpackers, keyed by format name.  Each value is an
# (extensions, function, extra_args, description) tuple; the extensions are
# what _find_unpack_format() matches file names against.
_UNPACK_FORMATS = {
    'tar':   (['.tar'], _unpack_tarfile, [], "uncompressed tar file"),
    'zip':   (['.zip'], _unpack_zipfile, [], "ZIP file"),
}

# The compressed tar formats are registered only when the compression
# module they need could be imported.
if _ZLIB_SUPPORTED:
    _UNPACK_FORMATS['gztar'] = (['.tar.gz', '.tgz'], _unpack_tarfile, [],
                                "gzip'ed tar-file")

if _BZ2_SUPPORTED:
    _UNPACK_FORMATS['bztar'] = (['.tar.bz2', '.tbz2'], _unpack_tarfile, [],
                                "bzip2'ed tar-file")

if _LZMA_SUPPORTED:
    _UNPACK_FORMATS['xztar'] = (['.tar.xz', '.txz'], _unpack_tarfile, [],
                                "xz'ed tar-file")
1187
def _find_unpack_format(filename):
    """Return the name of the first registered unpack format that has an
    extension `filename` ends with, or None if there is none."""
    for format_name, info in _UNPACK_FORMATS.items():
        if any(filename.endswith(extension) for extension in info[0]):
            return format_name
    return None
1194
def unpack_archive(filename, extract_dir=None, format=None):
    """Unpack an archive.

    `filename` is the name of the archive.

    `extract_dir` is the name of the target directory, where the archive
    is unpacked. If not provided, the current working directory is used.

    `format` is the archive format: one of "zip", "tar", "gztar", "bztar",
    or "xztar".  Or any other registered format.  If not provided,
    unpack_archive will use the filename extension and see if an unpacker
    was registered for that extension.

    A ValueError is raised when an explicitly given `format` is not
    registered; a ReadError is raised when no registered unpacker matches
    the extension of `filename`.
    """
    if extract_dir is None:
        extract_dir = os.getcwd()

    extract_dir = os.fspath(extract_dir)
    filename = os.fspath(filename)

    if format is None:
        # we need to look at the registered unpackers supported extensions
        format = _find_unpack_format(filename)
        if format is None:
            raise ReadError("Unknown archive format '{0}'".format(filename))
        format_info = _UNPACK_FORMATS[format]
    else:
        try:
            format_info = _UNPACK_FORMATS[format]
        except KeyError:
            raise ValueError("Unknown unpack format '{0}'".format(format)) from None

    unpacker = format_info[1]
    extra_kwargs = dict(format_info[2])
    unpacker(filename, extract_dir, **extra_kwargs)
Giampaolo Rodola'210e7ca2011-07-01 13:55:36 +02001233
Éric Araujoe4d5b8e2011-08-08 16:51:11 +02001234
# disk_usage() is only defined (and exported through __all__) when one of
# the two implementations below is available on this platform.
if hasattr(os, 'statvfs'):

    __all__.append('disk_usage')
    _ntuple_diskusage = collections.namedtuple('usage', 'total used free')
    _ntuple_diskusage.total.__doc__ = 'Total space in bytes'
    _ntuple_diskusage.used.__doc__ = 'Used space in bytes'
    _ntuple_diskusage.free.__doc__ = 'Free space in bytes'

    def disk_usage(path):
        """Return disk usage statistics about the given path.

        Returned value is a named tuple with attributes 'total', 'used' and
        'free', which are the amount of total, used and free space, in bytes.
        """
        st = os.statvfs(path)
        # 'free' is derived from f_bavail while 'used' is derived from
        # f_bfree, so used + free need not add up to total.
        free = st.f_bavail * st.f_frsize
        total = st.f_blocks * st.f_frsize
        used = (st.f_blocks - st.f_bfree) * st.f_frsize
        return _ntuple_diskusage(total, used, free)

elif _WINDOWS:

    __all__.append('disk_usage')
    _ntuple_diskusage = collections.namedtuple('usage', 'total used free')

    def disk_usage(path):
        """Return disk usage statistics about the given path.

        Returned value is a named tuple with attributes 'total', 'used' and
        'free', which are the amount of total, used and free space, in bytes.
        """
        # NOTE(review): 'nt' is not imported in this part of the file;
        # presumably it is imported near the top on Windows - confirm.
        total, free = nt._getdiskusage(path)
        used = total - free
        return _ntuple_diskusage(total, used, free)
Sandro Tosid902a142011-08-22 23:28:27 +02001269
Éric Araujo0ac4a5d2011-09-01 08:31:51 +02001270
def chown(path, user=None, group=None):
    """Change the owning user and/or group of `path`.

    `user` and `group` may each be a numeric id or a name; names are
    resolved to the corresponding uid/gid.  An argument left as None keeps
    that part of the ownership unchanged.

    Raises ValueError if neither `user` nor `group` is given, and
    LookupError if a name cannot be resolved.
    """
    if user is None and group is None:
        raise ValueError("user and/or group must be set")

    # -1 means don't change it
    if user is None:
        uid = -1
    elif isinstance(user, str):
        # user can either be an int (the uid) or a string (the system
        # username)
        uid = _get_uid(user)
        if uid is None:
            raise LookupError("no such user: {!r}".format(user))
    else:
        uid = user

    if group is None:
        gid = -1
    elif isinstance(group, int):
        gid = group
    else:
        gid = _get_gid(group)
        if gid is None:
            raise LookupError("no such group: {!r}".format(group))

    os.chown(path, uid, gid)
Antoine Pitroubcf2b592012-02-08 23:28:36 +01001301
def get_terminal_size(fallback=(80, 24)):
    """Get the size of the terminal window.

    Each dimension is first taken from its environment variable (COLUMNS
    for the width, LINES for the height); the value is used when the
    variable is defined and holds a positive integer.

    If either variable is missing or unusable, which is the common case,
    the terminal connected to sys.__stdout__ is queried with
    os.get_terminal_size.

    If that query fails, either because the system doesn't support it or
    because we are not connected to a terminal, the value of the `fallback`
    parameter is used instead.  It defaults to (80, 24), the default size
    used by many terminal emulators.

    The value returned is a named tuple of type os.terminal_size.
    """
    def _from_environment(variable):
        # 0 stands for "not usable" and triggers the terminal query below.
        try:
            return int(os.environ[variable])
        except (KeyError, ValueError):
            return 0

    columns = _from_environment('COLUMNS')
    lines = _from_environment('LINES')

    # only query if necessary
    if columns <= 0 or lines <= 0:
        try:
            size = os.get_terminal_size(sys.__stdout__.fileno())
        except (AttributeError, ValueError, OSError):
            # stdout is None, closed, detached, or not a terminal, or
            # os.get_terminal_size() is unsupported
            size = os.terminal_size(fallback)
        if columns <= 0:
            columns = size.columns
        if lines <= 0:
            lines = size.lines

    return os.terminal_size((columns, lines))
Brian Curtinc57a3452012-06-22 16:00:30 -05001346
Cheryl Sabella5680f652019-02-13 06:25:10 -05001347
def _access_check(fn, mode):
    """Return True if `fn` exists, is accessible with `mode`, and is a file.

    Directories are rejected explicitly because on Windows they pass the
    os.access() check.
    """
    if not os.path.exists(fn):
        return False
    if not os.access(fn, mode):
        return False
    return not os.path.isdir(fn)
1354
1355
def which(cmd, mode=os.F_OK | os.X_OK, path=None):
    """Given a command, mode, and a PATH string, return the path which
    conforms to the given mode on the PATH, or None if there is no such
    file.

    `cmd` may be str or bytes; the search path is converted to the same
    type, so a match found on the search path has the type of `cmd`.  If
    `cmd` contains a directory part it is checked directly (and returned
    unchanged on success) without consulting the search path.

    `mode` defaults to os.F_OK | os.X_OK. `path` defaults to the result
    of os.environ.get("PATH"), or can be overridden with a custom search
    path.  If PATH is not set at all, os.confstr("CS_PATH") is used, or
    os.defpath when that is unavailable.  An empty search path never
    matches.

    On Windows the current directory is searched first, and the
    extensions listed in PATHEXT are appended to `cmd` unless it already
    ends with one of them.  Empty PATHEXT entries are ignored.

    """
    # If we're given a path with a directory part, look it up directly rather
    # than referring to PATH directories. This includes checking relative to
    # the current directory, e.g. ./script
    if os.path.dirname(cmd):
        if _access_check(cmd, mode):
            return cmd
        return None

    use_bytes = isinstance(cmd, bytes)

    if path is None:
        path = os.environ.get("PATH", None)
        if path is None:
            try:
                path = os.confstr("CS_PATH")
            except (AttributeError, ValueError):
                # os.confstr() or CS_PATH is not available
                path = os.defpath
        # bpo-35755: Don't use os.defpath if the PATH environment variable is
        # set to an empty string

    # PATH='' doesn't match, whereas PATH=':' looks in the current directory
    if not path:
        return None

    # Work entirely in the type of `cmd` so os.path.join() never mixes
    # str and bytes.
    if use_bytes:
        path = os.fsencode(path)
        path = path.split(os.fsencode(os.pathsep))
    else:
        path = os.fsdecode(path)
        path = path.split(os.pathsep)

    if sys.platform == "win32":
        # The current directory takes precedence on Windows.
        curdir = os.curdir
        if use_bytes:
            curdir = os.fsencode(curdir)
        if curdir not in path:
            path.insert(0, curdir)

        # PATHEXT is necessary to check on Windows.  Drop empty entries
        # (unset PATHEXT, doubled or trailing separators): every command
        # "ends with" the empty string, so an empty entry would make the
        # check below always succeed and the real extensions would never
        # be tried.
        pathext = [ext
                   for ext in os.environ.get("PATHEXT", "").split(os.pathsep)
                   if ext]
        if use_bytes:
            pathext = [os.fsencode(ext) for ext in pathext]
        # See if the given file matches any of the expected path extensions.
        # This will allow us to short circuit when given "python.exe".
        # If it does match, only test that one, otherwise we have to try
        # others.  With no usable extensions at all, test cmd as-is.
        cmd_lower = cmd.lower()
        if not pathext or any(cmd_lower.endswith(ext.lower())
                              for ext in pathext):
            files = [cmd]
        else:
            files = [cmd + ext for ext in pathext]
    else:
        # On other platforms you don't have things like PATHEXT to tell you
        # what file suffixes are executable, so just pass on cmd as-is.
        files = [cmd]

    # Skip directories that appear more than once on the search path
    # (compared after os.path.normcase()).
    seen = set()
    for directory in path:
        normdir = os.path.normcase(directory)
        if normdir in seen:
            continue
        seen.add(normdir)
        for thefile in files:
            name = os.path.join(directory, thefile)
            if _access_check(name, mode):
                return name
    return None