blob: 499e6285618f212801d3690311badc739b824070 [file] [log] [blame]
Ned Deily5c867012014-06-26 23:40:06 -07001r"""OS routines for NT or Posix depending on what system we're on.
Guido van Rossum31104f41992-01-14 18:28:36 +00002
Guido van Rossum54f22ed2000-02-04 15:10:34 +00003This exports:
Larry Hastings10108a72016-09-05 15:11:23 -07004 - all functions from posix or nt, e.g. unlink, stat, etc.
Alexandre Vassalottieca20b62008-05-16 02:54:33 +00005 - os.path is either posixpath or ntpath
Larry Hastings10108a72016-09-05 15:11:23 -07006 - os.name is either 'posix' or 'nt'
Ned Deilybf090e32016-10-01 21:12:35 -04007 - os.curdir is a string representing the current directory (always '.')
8 - os.pardir is a string representing the parent directory (always '..')
9 - os.sep is the (or a most common) pathname separator ('/' or '\\')
Georg Brandled5b9b32008-12-05 07:45:54 +000010 - os.extsep is the extension separator (always '.')
Guido van Rossum4b8c6ea2000-02-04 15:39:30 +000011 - os.altsep is the alternate pathname separator (None or '/')
Guido van Rossum54f22ed2000-02-04 15:10:34 +000012 - os.pathsep is the component separator used in $PATH etc
Guido van Rossum4b8c6ea2000-02-04 15:39:30 +000013 - os.linesep is the line separator in text files ('\r' or '\n' or '\r\n')
Guido van Rossum54f22ed2000-02-04 15:10:34 +000014 - os.defpath is the default search path for executables
Martin v. Löwisbdec50f2004-06-08 08:29:33 +000015 - os.devnull is the file path of the null device ('/dev/null', etc.)
Guido van Rossum31104f41992-01-14 18:28:36 +000016
Guido van Rossum54f22ed2000-02-04 15:10:34 +000017Programs that import and use 'os' stand a better chance of being
18portable between different platforms. Of course, they must then
19only use functions that are defined by all platforms (e.g., unlink
20and opendir), and leave all pathname manipulation to os.path
21(e.g., split and join).
22"""
Guido van Rossum31104f41992-01-14 18:28:36 +000023
Skip Montanaro269b83b2001-02-06 01:07:02 +000024#'
Ethan Furman958b3e42016-06-04 12:49:35 -070025import abc
Serhiy Storchaka81108372017-09-26 00:55:55 +030026import sys
Charles-François Natali7372b062012-02-05 15:15:38 +010027import stat as st
Guido van Rossuma28dab51997-08-29 22:36:47 +000028
# Names of the modules compiled into the interpreter; consulted below to
# decide which platform backend ('posix' or 'nt') gets loaded.
_names = sys.builtin_module_names

# Note: more names are added to __all__ later.
__all__ = [
    "altsep", "curdir", "pardir", "sep", "pathsep", "linesep", "defpath",
    "name", "path", "devnull", "SEEK_SET", "SEEK_CUR", "SEEK_END",
    "fsencode", "fsdecode", "get_exec_path", "fdopen", "popen", "extsep",
]
Skip Montanaro269b83b2001-02-06 01:07:02 +000036
def _exists(name):
    """Return True if *name* is bound in this module's global namespace."""
    module_namespace = globals()
    return name in module_namespace
39
def _get_exports_list(module):
    """Return the list of names that *module* exports.

    A copy of module.__all__ is returned when the module defines it;
    otherwise every name reported by dir(module) that does not start with
    an underscore is returned.
    """
    try:
        exported = list(module.__all__)
    except AttributeError:
        # No explicit export list: fall back to the public-looking names.
        exported = []
        for attr in dir(module):
            if attr[0] != '_':
                exported.append(attr)
    return exported
45
# Any new dependencies of the os module and/or changes in path separator
# requires updating importlib as well.
if 'posix' in _names:
    name, linesep = 'posix', '\n'
    from posix import *
    import posixpath as path

    # _exit is fetched by name (presumably because its leading underscore
    # keeps it out of the star-import) and exported when it is available.
    try:
        from posix import _exit
    except ImportError:
        pass
    else:
        __all__.append('_exit')

    # _have_functions is optional; the supports_* sets further down are
    # only computed when this import succeeded.
    try:
        from posix import _have_functions
    except ImportError:
        pass

    # Re-export everything the platform module exports.
    import posix
    __all__.extend(_get_exports_list(posix))
    del posix

elif 'nt' in _names:
    name, linesep = 'nt', '\r\n'
    from nt import *
    import ntpath as path

    # Same treatment of _exit as in the posix branch.
    try:
        from nt import _exit
    except ImportError:
        pass
    else:
        __all__.append('_exit')

    # Re-export everything the platform module exports.
    import nt
    __all__.extend(_get_exports_list(nt))
    del nt

    try:
        from nt import _have_functions
    except ImportError:
        pass

else:
    # Neither backend is built into this interpreter.
    raise ImportError('no os specific module found')
Guido van Rossume65cce51993-11-08 15:05:21 +000090
# Register the selected platform path module under the name 'os.path' so
# that the import on the next line resolves to it.
sys.modules['os.path'] = path
from os.path import (
    curdir, pardir, sep, pathsep, defpath, extsep, altsep, devnull,
)

# _names was only needed to select the platform backend.
del _names
96
Larry Hastings9cf065c2012-06-22 16:30:09 -070097
if _exists("_have_functions"):
    _globals = globals()

    def _supported(*candidates):
        # Each candidate is a (HAVE_* flag, function name) pair.  The result
        # is the set of function objects whose name is defined in this
        # module and whose flag is listed in _have_functions.
        return {_globals[fn] for flag, fn in candidates
                if (fn in _globals) and (flag in _have_functions)}

    # Functions accepting the dir_fd argument.
    supports_dir_fd = _supported(
        ("HAVE_FACCESSAT", "access"),
        ("HAVE_FCHMODAT", "chmod"),
        ("HAVE_FCHOWNAT", "chown"),
        ("HAVE_FSTATAT", "stat"),
        ("HAVE_FUTIMESAT", "utime"),
        ("HAVE_LINKAT", "link"),
        ("HAVE_MKDIRAT", "mkdir"),
        ("HAVE_MKFIFOAT", "mkfifo"),
        ("HAVE_MKNODAT", "mknod"),
        ("HAVE_OPENAT", "open"),
        ("HAVE_READLINKAT", "readlink"),
        ("HAVE_RENAMEAT", "rename"),
        ("HAVE_SYMLINKAT", "symlink"),
        ("HAVE_UNLINKAT", "unlink"),
        ("HAVE_UNLINKAT", "rmdir"),
        ("HAVE_UTIMENSAT", "utime"),
    )

    supports_effective_ids = _supported(
        ("HAVE_FACCESSAT", "access"),
    )

    # Functions accepting an open file descriptor in place of a path.
    supports_fd = _supported(
        ("HAVE_FCHDIR", "chdir"),
        ("HAVE_FCHMOD", "chmod"),
        ("HAVE_FCHOWN", "chown"),
        ("HAVE_FDOPENDIR", "listdir"),
        ("HAVE_FDOPENDIR", "scandir"),
        ("HAVE_FEXECVE", "execve"),
        ("HAVE_FTRUNCATE", "truncate"),
        ("HAVE_FUTIMENS", "utime"),
        ("HAVE_FUTIMES", "utime"),
        ("HAVE_FPATHCONF", "pathconf"),
    )
    supports_fd.add(stat)  # fstat always works
    if _exists("statvfs") and _exists("fstatvfs"):  # mac os x10.3
        supports_fd.update(_supported(("HAVE_FSTATVFS", "statvfs")))

    # Some platforms don't support lchmod().  Often the function exists
    # anyway, as a stub that always returns ENOSUP or perhaps EOPNOTSUPP.
    # (No, I don't know why that's a good design.)  ./configure will detect
    # this and reject it--so HAVE_LCHMOD still won't be defined on such
    # platforms.  This is Very Helpful.
    #
    # However, sometimes platforms without a working lchmod() *do* have
    # fchmodat().  (Examples: Linux kernel 3.2 with glibc 2.15,
    # OpenIndiana 3.x.)  And fchmodat() has a flag that theoretically makes
    # it behave like lchmod().  So in theory it would be a suitable
    # replacement for lchmod().  But when lchmod() doesn't work, fchmodat()'s
    # flag doesn't work *either*.  Sadly ./configure isn't sophisticated
    # enough to detect this condition--it only determines whether or not
    # fchmodat() minimally works.
    #
    # Therefore we simply ignore fchmodat() when deciding whether or not
    # os.chmod supports follow_symlinks.  Just checking lchmod() is
    # sufficient.  After all--if you have a working fchmodat(), your
    # lchmod() almost certainly works too.
    #
    # That is why there is deliberately no ("HAVE_FCHMODAT", "chmod") entry
    # in the list below.
    supports_follow_symlinks = _supported(
        ("HAVE_FACCESSAT", "access"),
        ("HAVE_FCHOWNAT", "chown"),
        ("HAVE_FSTATAT", "stat"),
        ("HAVE_LCHFLAGS", "chflags"),
        ("HAVE_LCHMOD", "chmod"),
        ("HAVE_LINKAT", "link"),
        ("HAVE_LUTIMES", "utime"),
        ("HAVE_LSTAT", "stat"),
        ("HAVE_UTIMENSAT", "utime"),
        ("MS_WINDOWS", "stat"),
    )
    if _exists("lchown"):  # mac os x10.3
        supports_follow_symlinks.update(_supported(("HAVE_LCHOWN", "chown")))

    # Remove the scaffolding so it does not linger in the module namespace.
    del _supported
    del _have_functions
    del _globals
184
185
# Python uses fixed values for the SEEK_ constants; they are mapped
# to native constants if necessary in posixmodule.c
# Other possible SEEK values are directly imported from posixmodule.c
SEEK_SET, SEEK_CUR, SEEK_END = 0, 1, 2
192
Guido van Rossum4def7de1998-07-24 20:48:03 +0000193# Super directory utilities.
194# (Inspired by Eric Raymond; the doc strings are mostly his)
195
def makedirs(name, mode=0o777, exist_ok=False):
    """makedirs(name [, mode=0o777][, exist_ok=False])

    Super-mkdir: create the leaf directory *name* together with every
    missing intermediate directory.  It works like mkdir, except that any
    path segment (not just the rightmost) is created when it does not
    exist yet.  If the target directory already exists, OSError is raised
    unless exist_ok is true, in which case no exception is raised.  This
    function is recursive; *mode* is applied to the leaf only, the parents
    are created with the default mode.

    """
    parent, leaf = path.split(name)
    if not leaf:
        # name ended with a separator: split once more to find the leaf.
        parent, leaf = path.split(parent)
    if parent and leaf and not path.exists(parent):
        try:
            makedirs(parent, exist_ok=exist_ok)
        except FileExistsError:
            # Defeats race condition when another thread created the path
            pass
        here = bytes(curdir, 'ASCII') if isinstance(leaf, bytes) else curdir
        if leaf == here:
            # xxx/newdir/. exists if xxx/newdir exists
            return
    try:
        mkdir(name, mode)
    except OSError:
        # Cannot rely on checking for EEXIST, since the operating system
        # could give priority to other errors like EACCES or EROFS
        if exist_ok and path.isdir(name):
            return
        raise
Guido van Rossum4def7de1998-07-24 20:48:03 +0000227
def removedirs(name):
    """removedirs(name)

    Super-rmdir: remove the leaf directory *name*, then prune its parents.
    It works like rmdir except that, once the leaf has been removed
    successfully, the directories corresponding to the rightmost path
    segments are removed one by one until either the whole path is
    consumed or an error occurs.  Errors during this pruning phase are
    ignored -- they generally mean that a directory was not empty.

    """
    rmdir(name)
    parent, leaf = path.split(name)
    if not leaf:
        # name ended with a separator: split once more to find the leaf.
        parent, leaf = path.split(parent)
    while parent and leaf:
        try:
            rmdir(parent)
        except OSError:
            # Typically a non-empty directory: pruning stops here.
            return
        parent, leaf = path.split(parent)
249
def renames(old, new):
    """renames(old, new)

    Super-rename: create directories as necessary and delete any left
    empty.  It works like rename, except that the intermediate directories
    needed to make the new pathname valid are created first.  After the
    rename, the directories corresponding to the rightmost path segments
    of the old name are pruned until either the whole path is consumed or
    a nonempty directory is found.

    Note: this function can fail with the new directory structure made
    if you lack permissions needed to unlink the leaf directory or
    file.

    """
    new_parent, new_leaf = path.split(new)
    if new_parent and new_leaf and not path.exists(new_parent):
        makedirs(new_parent)
    rename(old, new)
    old_parent, old_leaf = path.split(old)
    if not (old_parent and old_leaf):
        return
    try:
        removedirs(old_parent)
    except OSError:
        # Pruning the old location is best effort only.
        pass
275
# Export the directory helpers defined above.
__all__ += ["makedirs", "removedirs", "renames"]
277
def walk(top, topdown=True, onerror=None, followlinks=False):
    """Directory tree generator.

    For each directory in the directory tree rooted at top (including top
    itself, but excluding '.' and '..'), yields a 3-tuple

        dirpath, dirnames, filenames

    dirpath is a string, the path to the directory.  dirnames is a list of
    the names of the subdirectories in dirpath (excluding '.' and '..').
    filenames is a list of the names of the non-directory files in dirpath.
    The names in the lists are bare names without any path components; to
    get a full path (which begins with top) to a file or directory in
    dirpath, use os.path.join(dirpath, name).

    If optional arg 'topdown' is true or not specified, the triple for a
    directory is generated before the triples for any of its subdirectories
    (directories are generated top down).  If topdown is false, the triple
    for a directory is generated after the triples for all of its
    subdirectories (directories are generated bottom up).

    When topdown is true, the caller can modify the dirnames list in-place
    (e.g., via del or slice assignment), and walk will only recurse into the
    subdirectories whose names remain in dirnames; this can be used to prune
    the search, or to impose a specific order of visiting.  Modifying
    dirnames when topdown is false is ineffective, since the directories in
    dirnames have already been generated by the time dirnames itself is
    generated.  No matter the value of topdown, the list of subdirectories
    is retrieved before the tuples for the directory and its subdirectories
    are generated.

    By default errors from the os.scandir() call are ignored.  If optional
    arg 'onerror' is specified, it should be a function; it will be called
    with one argument, an OSError instance.  It can report the error to
    continue with the walk, or raise the exception to abort the walk.  Note
    that the filename is available as the filename attribute of the
    exception object.

    By default, os.walk does not follow symbolic links to subdirectories on
    systems that support them.  In order to get this functionality, set the
    optional argument 'followlinks' to true.

    Caution:  if you pass a relative pathname for top, don't change the
    current working directory between resumptions of walk.  walk never
    changes the current directory, and assumes that the client doesn't
    either.

    Example:

    import os
    from os.path import join, getsize
    for root, dirs, files in os.walk('python/Lib/email'):
        print(root, "consumes", end="")
        print(sum([getsize(join(root, name)) for name in files]), end="")
        print("bytes in", len(files), "non-directory files")
        if 'CVS' in dirs:
            dirs.remove('CVS')  # don't visit CVS directories

    """
    top = fspath(top)
    dirs, nondirs = [], []
    # Full paths of the sub-directories to descend into (bottom-up only).
    subdir_paths = []

    # We may not have read permission for top, in which case we can't
    # get a list of the files the directory contains.  os.walk
    # always suppressed the exception then, rather than blow up for a
    # minor reason when (say) a thousand readable directories are still
    # left to visit.  That logic is copied here.
    try:
        # Note that scandir is global in this module due
        # to earlier import-*.
        scandir_it = scandir(top)
    except OSError as error:
        if onerror is not None:
            onerror(error)
        return

    with scandir_it:
        while True:
            try:
                entry = next(scandir_it)
            except StopIteration:
                break
            except OSError as error:
                if onerror is not None:
                    onerror(error)
                return

            try:
                is_dir = entry.is_dir()
            except OSError:
                # If is_dir() raises an OSError, consider that the entry is
                # not a directory, same behaviour than os.path.isdir().
                is_dir = False

            (dirs if is_dir else nondirs).append(entry.name)

            if is_dir and not topdown:
                # Bottom-up: recurse into sub-directory, but exclude
                # symlinks to directories if followlinks is False
                skip = False
                if not followlinks:
                    try:
                        skip = entry.is_symlink()
                    except OSError:
                        # If is_symlink() raises an OSError, consider that
                        # the entry is not a symbolic link, same behaviour
                        # than os.path.islink().
                        skip = False
                if not skip:
                    subdir_paths.append(entry.path)

    if not topdown:
        # Bottom-up: recurse first, yield this directory afterwards.
        for sub_path in subdir_paths:
            yield from walk(sub_path, topdown, onerror, followlinks)
        yield top, dirs, nondirs
        return

    # Top-down: yield before recursing so the caller can edit dirs.
    yield top, dirs, nondirs

    islink, join = path.islink, path.join
    for dirname in dirs:
        child = join(top, dirname)
        # Issue #23605: os.path.islink() is used instead of caching
        # entry.is_symlink() result during the loop on os.scandir() because
        # the caller can replace the directory entry during the "yield"
        # above.
        if not followlinks and islink(child):
            continue
        yield from walk(child, topdown, onerror, followlinks)
417
# Export the directory tree generator defined above.
__all__ += ["walk"]
419
if {open, stat} <= supports_dir_fd and {scandir, stat} <= supports_fd:

    def fwalk(top=".", topdown=True, onerror=None, *, follow_symlinks=False, dir_fd=None):
        """Directory tree generator.

        This behaves exactly like walk(), except that it yields a 4-tuple

            dirpath, dirnames, filenames, dirfd

        `dirpath`, `dirnames` and `filenames` are identical to walk() output,
        and `dirfd` is a file descriptor referring to the directory `dirpath`.

        The advantage of fwalk() over walk() is that it's safe against symlink
        races (when follow_symlinks is False).

        If dir_fd is not None, it should be a file descriptor open to a directory,
          and top should be relative; top will then be relative to that directory.
          (dir_fd is always supported for fwalk.)

        Caution:
        Since fwalk() yields file descriptors, those are only valid until the
        next iteration step, so you should dup() them if you want to keep them
        for a longer period.

        Example:

        import os
        for root, dirs, files, rootfd in os.fwalk('python/Lib/email'):
            print(root, "consumes", end="")
            print(sum([os.stat(name, dir_fd=rootfd).st_size for name in files]),
                  end="")
            print("bytes in", len(files), "non-directory files")
            if 'CVS' in dirs:
                dirs.remove('CVS')  # don't visit CVS directories
        """
        # Everything except int instances is normalised with fspath().  Every
        # int has __index__, so no separate attribute test is needed.
        if not isinstance(top, int):
            top = fspath(top)
        # Note: To guard against symlink races, we use the standard
        # lstat()/open()/fstat() trick.
        if not follow_symlinks:
            orig_st = stat(top, follow_symlinks=False, dir_fd=dir_fd)
        topfd = open(top, O_RDONLY, dir_fd=dir_fd)
        try:
            # orig_st is only bound (and only consulted) when symlinks are
            # not followed; the short-circuit keeps the other case safe.
            if (follow_symlinks or (st.S_ISDIR(orig_st.st_mode) and
                                    path.samestat(orig_st, stat(topfd)))):
                yield from _fwalk(topfd, top, isinstance(top, bytes),
                                  topdown, onerror, follow_symlinks)
        finally:
            close(topfd)

    def _fwalk(topfd, toppath, isbytes, topdown, onerror, follow_symlinks):
        # Recursive worker for fwalk(): yields the 4-tuples for the directory
        # open on topfd (whose path is toppath) and for its sub-directories.
        #
        # Note: This uses O(depth of the directory tree) file descriptors: if
        # necessary, it can be adapted to only require O(1) FDs, see issue
        # #13734.

        dirs = []
        nondirs = []
        # The DirEntry objects are only kept when they are needed later for
        # the symlink-race check of a bottom-up walk.
        entries = None if topdown or follow_symlinks else []
        # The context manager closes the scandir iterator even when the
        # listing is interrupted part-way through.
        with scandir(topfd) as scandir_it:
            for entry in scandir_it:
                name = entry.name
                if isbytes:
                    name = fsencode(name)
                try:
                    if entry.is_dir():
                        dirs.append(name)
                        if entries is not None:
                            entries.append(entry)
                    else:
                        nondirs.append(name)
                except OSError:
                    try:
                        # Add dangling symlinks, ignore disappeared files
                        if entry.is_symlink():
                            nondirs.append(name)
                    except OSError:
                        pass

        if topdown:
            yield toppath, dirs, nondirs, topfd

        for name in dirs if entries is None else zip(dirs, entries):
            try:
                if not follow_symlinks:
                    if topdown:
                        orig_st = stat(name, dir_fd=topfd, follow_symlinks=False)
                    else:
                        # Bottom-up: items are (name, entry) pairs.
                        assert entries is not None
                        name, entry = name
                        orig_st = entry.stat(follow_symlinks=False)
                dirfd = open(name, O_RDONLY, dir_fd=topfd)
            except OSError as err:
                if onerror is not None:
                    onerror(err)
                continue
            try:
                # Only descend when the opened descriptor is still the
                # directory that was examined before the open().
                if follow_symlinks or path.samestat(orig_st, stat(dirfd)):
                    dirpath = path.join(toppath, name)
                    yield from _fwalk(dirfd, dirpath, isbytes,
                                      topdown, onerror, follow_symlinks)
            finally:
                close(dirfd)

        if not topdown:
            yield toppath, dirs, nondirs, topfd

    __all__.append("fwalk")
527
# Make sure os.environ exists, at least
if 'environ' not in globals():
    environ = {}
Guido van Rossuma28dab51997-08-29 22:36:47 +0000533
def execl(file, *args):
    """execl(file, *args)

    Replace the current process by executing the executable *file*,
    passing the positional arguments *args* as its argument list. """
    # Thin convenience wrapper: forward the collected arguments to execv().
    execv(file, args)
Guido van Rossume65cce51993-11-08 15:05:21 +0000540
def execle(file, *args):
    """execle(file, *args, env)

    Replace the current process by executing the executable *file* with
    argument list args and environment env.  The environment is the last
    positional argument; everything before it is the argument list. """
    execve(file, args[:-1], args[-1])
Guido van Rossume65cce51993-11-08 15:05:21 +0000548
def execlp(file, *args):
    """execlp(file, *args)

    Replace the current process by executing the executable *file* (which
    is searched for along $PATH) with argument list args. """
    # Thin convenience wrapper: forward the collected arguments to execvp().
    execvp(file, args)
Guido van Rossume65cce51993-11-08 15:05:21 +0000555
def execlpe(file, *args):
    """execlpe(file, *args, env)

    Replace the current process by executing the executable *file* (which
    is searched for along $PATH) with argument list args and environment
    env.  The environment is the last positional argument; everything
    before it is the argument list. """
    execvpe(file, args[:-1], args[-1])
Guido van Rossum030afb11995-03-14 17:27:18 +0000564
def execvp(file, args):
    """execvp(file, args)

    Replace the current process by executing the executable *file* (which
    is searched for along $PATH) with argument list args.
    args may be a list or tuple of strings. """
    # No environment is passed, so _execvpe() uses its default (env=None).
    _execvpe(file, args)
Guido van Rossum030afb11995-03-14 17:27:18 +0000572
def execvpe(file, args, env):
    """execvpe(file, args, env)

    Replace the current process by executing the executable *file* (which
    is searched for along $PATH) with argument list args and environment
    env.
    args may be a list or tuple of strings. """
    # The PATH search itself is implemented by _execvpe().
    _execvpe(file, args, env)
Guido van Rossum030afb11995-03-14 17:27:18 +0000581
# Export the exec* convenience wrappers defined above.
__all__ += ["execl", "execle", "execlp", "execlpe", "execvp", "execvpe"]
583
def _execvpe(file, args, env=None):
    # Shared implementation of execvp() and execvpe(): execute *file*,
    # searching the directories returned by get_exec_path() when *file* has
    # no directory component.  With env=None the program is run through
    # execv() and the search path is taken from environ; otherwise execve()
    # is used with the given environment.
    if env is None:
        exec_func, argrest = execv, (args,)
        env = environ
    else:
        exec_func, argrest = execve, (args, env)

    if path.dirname(file):
        # An explicit directory was given: no search.
        exec_func(file, *argrest)
        return

    saved_exc = None
    search_dirs = get_exec_path(env)
    if name != 'nt':
        file = fsencode(file)
        search_dirs = map(fsencode, search_dirs)
    for directory in search_dirs:
        candidate = path.join(directory, file)
        try:
            exec_func(candidate, *argrest)
        except (FileNotFoundError, NotADirectoryError) as exc:
            # "Not here" errors are only remembered as a last resort.
            last_exc = exc
        except OSError as exc:
            last_exc = exc
            # Keep the first error of any other kind; it takes precedence
            # when reporting the failure.
            if saved_exc is None:
                saved_exc = exc
    if saved_exc is not None:
        raise saved_exc
    raise last_exc
Guido van Rossumd74fb6b2001-03-02 06:43:49 +0000614
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000615
def get_exec_path(env=None):
    """Return the list of directories searched for a named executable.

    *env* is an environment mapping, or None to use os.environ.  The value
    is taken from its 'PATH' entry (or b'PATH' where bytes environments are
    supported), falls back to os.defpath when neither is present, and is
    split on os.pathsep.

    Raises ValueError if *env* holds both a 'PATH' and a b'PATH' key.
    """
    # Imported here rather than at module level: os is loaded at every
    # interpreter startup, so this keeps the startup module set small and
    # may also avoid a bootstrap issue.
    import warnings

    mapping = environ if env is None else env

    # Mixing str and bytes keys in a lookup emits BytesWarning under
    # python -b / -bb; silence it for the duration of the probes.
    with warnings.catch_warnings():
        warnings.simplefilter("ignore", BytesWarning)

        try:
            search_path = mapping.get('PATH')
        except TypeError:
            search_path = None

        if supports_bytes_environ:
            try:
                bytes_path = mapping[b'PATH']
            except (KeyError, TypeError):
                pass
            else:
                if search_path is not None:
                    raise ValueError(
                        "env cannot contain 'PATH' and b'PATH' keys")
                search_path = bytes_path

            if isinstance(search_path, bytes):
                search_path = fsdecode(search_path)

    if search_path is None:
        search_path = defpath
    return search_path.split(pathsep)
Gregory P. Smithb6e8c7e2010-02-27 07:22:22 +0000658
659
Skip Montanaro289bc052007-08-17 02:30:27 +0000660# Change environ to automatically call putenv(), unsetenv if they exist.
Christian Heimesf1dc3ee2013-10-13 02:04:20 +0200661from _collections_abc import MutableMapping
Skip Montanaro289bc052007-08-17 02:30:27 +0000662
663class _Environ(MutableMapping):
Victor Stinner84ae1182010-05-06 22:05:07 +0000664 def __init__(self, data, encodekey, decodekey, encodevalue, decodevalue, putenv, unsetenv):
665 self.encodekey = encodekey
666 self.decodekey = decodekey
667 self.encodevalue = encodevalue
668 self.decodevalue = decodevalue
Skip Montanaro289bc052007-08-17 02:30:27 +0000669 self.putenv = putenv
670 self.unsetenv = unsetenv
Victor Stinner3d75d0c2010-09-10 22:18:16 +0000671 self._data = data
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000672
Skip Montanaro289bc052007-08-17 02:30:27 +0000673 def __getitem__(self, key):
Victor Stinner6d101392013-04-14 16:35:04 +0200674 try:
675 value = self._data[self.encodekey(key)]
676 except KeyError:
677 # raise KeyError with the original key value
Victor Stinner0c2dd0c2013-08-23 19:19:15 +0200678 raise KeyError(key) from None
Victor Stinner84ae1182010-05-06 22:05:07 +0000679 return self.decodevalue(value)
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000680
Skip Montanaro289bc052007-08-17 02:30:27 +0000681 def __setitem__(self, key, value):
Victor Stinner84ae1182010-05-06 22:05:07 +0000682 key = self.encodekey(key)
683 value = self.encodevalue(value)
Skip Montanaro289bc052007-08-17 02:30:27 +0000684 self.putenv(key, value)
Victor Stinner3d75d0c2010-09-10 22:18:16 +0000685 self._data[key] = value
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000686
Skip Montanaro289bc052007-08-17 02:30:27 +0000687 def __delitem__(self, key):
Victor Stinner6d101392013-04-14 16:35:04 +0200688 encodedkey = self.encodekey(key)
689 self.unsetenv(encodedkey)
690 try:
691 del self._data[encodedkey]
692 except KeyError:
693 # raise KeyError with the original key value
Victor Stinner0c2dd0c2013-08-23 19:19:15 +0200694 raise KeyError(key) from None
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000695
Skip Montanaro289bc052007-08-17 02:30:27 +0000696 def __iter__(self):
Osvaldo Santana Neto8a8d2852017-07-01 14:34:45 -0300697 # list() from dict object is an atomic operation
698 keys = list(self._data)
699 for key in keys:
Victor Stinner84ae1182010-05-06 22:05:07 +0000700 yield self.decodekey(key)
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000701
Skip Montanaro289bc052007-08-17 02:30:27 +0000702 def __len__(self):
Victor Stinner3d75d0c2010-09-10 22:18:16 +0000703 return len(self._data)
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000704
705 def __repr__(self):
Victor Stinnerbed71172010-07-28 21:25:42 +0000706 return 'environ({{{}}})'.format(', '.join(
Victor Stinnerd73c1a32010-07-28 21:23:23 +0000707 ('{!r}: {!r}'.format(self.decodekey(key), self.decodevalue(value))
Victor Stinner3d75d0c2010-09-10 22:18:16 +0000708 for key, value in self._data.items())))
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000709
Skip Montanaro289bc052007-08-17 02:30:27 +0000710 def copy(self):
711 return dict(self)
Ezio Melotti19e4acf2010-02-22 15:59:01 +0000712
Skip Montanaro289bc052007-08-17 02:30:27 +0000713 def setdefault(self, key, value):
714 if key not in self:
715 self[key] = value
716 return self[key]
717
# Bind _putenv to the platform putenv() when there is one; otherwise fall
# back to a no-op so _Environ can call it unconditionally.
try:
    _putenv = putenv
except NameError:
    def _putenv(key, value):
        return None
else:
    if "putenv" not in __all__:
        __all__.append("putenv")

# Same for unsetenv(); without it, emulate removal by storing "".
try:
    _unsetenv = unsetenv
except NameError:
    def _unsetenv(key):
        return _putenv(key, "")
else:
    if "unsetenv" not in __all__:
        __all__.append("unsetenv")
Guido van Rossumc524d952001-10-19 01:31:59 +0000733
def _createenviron():
    """Build the str-based os.environ wrapper around the platform environ.

    On 'nt' the data is copied into a new dict with upper-cased keys and
    values are kept as str.  Elsewhere the platform mapping is wrapped
    directly and str is converted to and from the filesystem encoding with
    the 'surrogateescape' error handler.
    """
    if name != 'nt':
        # Where Env Var Names Can Be Mixed Case
        fs_encoding = sys.getfilesystemencoding()

        def to_stored(text):
            if isinstance(text, str):
                return text.encode(fs_encoding, 'surrogateescape')
            raise TypeError("str expected, not %s" % type(text).__name__)

        def from_stored(raw):
            return raw.decode(fs_encoding, 'surrogateescape')

        return _Environ(environ,
            to_stored, from_stored,
            to_stored, from_stored,
            _putenv, _unsetenv)

    # Where Env Var Names Must Be UPPERCASE
    def require_str(text):
        if isinstance(text, str):
            return text
        raise TypeError("str expected, not %s" % type(text).__name__)

    def upper_key(key):
        return require_str(key).upper()

    upper_data = {upper_key(key): value for key, value in environ.items()}
    return _Environ(upper_data,
        upper_key, str,
        require_str, str,
        _putenv, _unsetenv)

# unicode environ
environ = _createenviron()
del _createenviron
Guido van Rossum61de0ac1997-12-05 21:24:30 +0000767
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000768
def getenv(key, default=None):
    """Look up environment variable *key* in os.environ.

    Returns *default* (None unless given) when the variable is not set.
    key, default and the result are str."""
    value = environ.get(key, default)
    return value
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000774
# A bytes view of the environment is offered everywhere except on 'nt'.
supports_bytes_environ = (name != 'nt')
__all__.extend(("getenv", "supports_bytes_environ"))

if supports_bytes_environ:
    def _check_bytes(value):
        # Identity conversion that only accepts bytes.
        if isinstance(value, bytes):
            return value
        raise TypeError("bytes expected, not %s" % type(value).__name__)

    # bytes environ: shares the underlying data dict with os.environ, so a
    # change made through either mapping is visible through the other.
    environb = _Environ(environ._data,
        _check_bytes, bytes,
        _check_bytes, bytes,
        _putenv, _unsetenv)
    del _check_bytes

    def getenvb(key, default=None):
        """Look up environment variable *key* in os.environb.

        Returns *default* (None unless given) when the variable is not set.
        key, default and the result are bytes."""
        value = environb.get(key, default)
        return value

    __all__.extend(("environb", "getenvb"))
Victor Stinner84ae1182010-05-06 22:05:07 +0000798
def _fscodec():
    """Create fsencode() and fsdecode() bound to the filesystem codec.

    The encoding and error handler are read from sys once, when this
    factory runs, and captured by the two returned functions.
    """
    encoding = sys.getfilesystemencoding()
    errors = sys.getfilesystemencodeerrors()

    def fsencode(filename):
        """Encode filename (an os.PathLike, bytes, or str) to bytes.

        str is encoded with the filesystem encoding and its error handler;
        bytes is returned unchanged.
        """
        as_path = fspath(filename)  # Does type-checking of `filename`.
        if not isinstance(as_path, str):
            return as_path
        return as_path.encode(encoding, errors)

    def fsdecode(filename):
        """Decode filename (an os.PathLike, bytes, or str) to str.

        bytes is decoded with the filesystem encoding and its error
        handler; str is returned unchanged.
        """
        as_path = fspath(filename)  # Does type-checking of `filename`.
        if not isinstance(as_path, bytes):
            return as_path
        return as_path.decode(encoding, errors)

    return fsencode, fsdecode

fsencode, fsdecode = _fscodec()
del _fscodec
Victor Stinner449c4662010-05-08 11:10:09 +0000831
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000832# Supply spawn*() (probably only for Unix)
if _exists("fork") and not _exists("spawnv") and _exists("execv"):

    P_WAIT = 0
    P_NOWAIT = 1
    P_NOWAITO = 1

    __all__.extend(["P_WAIT", "P_NOWAIT", "P_NOWAITO"])

    # XXX Should we support P_DETACH?  I suppose it could fork()**2
    # and close the std I/O streams.  Also, P_OVERLAY is the same
    # as execv*()?

    def _spawnvef(mode, file, args, env, func):
        # Internal helper shared by the spawn*() functions; func is the
        # exec*() function the child uses to start the program.
        if not isinstance(args, (tuple, list)):
            raise TypeError('argv must be a tuple or a list')
        if not args or not args[0]:
            raise ValueError('argv first element cannot be empty')
        child_pid = fork()
        if child_pid:
            # Parent
            if mode == P_NOWAIT:
                return child_pid  # Caller is responsible for waiting!
            while True:
                _, status = waitpid(child_pid, 0)
                if WIFSTOPPED(status):
                    continue
                if WIFSIGNALED(status):
                    return -WTERMSIG(status)
                if WIFEXITED(status):
                    return WEXITSTATUS(status)
                raise OSError("Not stopped, signaled or exited???")
        # Child: any failure to exec ends the child with status 127, so it
        # never continues running the caller's code.
        try:
            if env is None:
                func(file, args)
            else:
                func(file, args, env)
        except:
            _exit(127)

    def spawnv(mode, file, args):
        """spawnv(mode, file, args) -> integer

        Run file in a subprocess, passing it the arguments in args.
        With mode == P_NOWAIT the result is the pid of the new process.
        With mode == P_WAIT the result is the exit code when the process
        exits normally, or -SIG when it was killed by signal SIG."""
        return _spawnvef(mode, file, args, None, execv)

    def spawnve(mode, file, args, env):
        """spawnve(mode, file, args, env) -> integer

        Run file in a subprocess, passing it the arguments in args and
        the environment env.
        With mode == P_NOWAIT the result is the pid of the new process.
        With mode == P_WAIT the result is the exit code when the process
        exits normally, or -SIG when it was killed by signal SIG."""
        return _spawnvef(mode, file, args, env, execve)

    # Note: spawnvp[e] isn't currently supported on Windows

    def spawnvp(mode, file, args):
        """spawnvp(mode, file, args) -> integer

        Run file (searched for along $PATH) in a subprocess, passing it
        the arguments in args.
        With mode == P_NOWAIT the result is the pid of the new process.
        With mode == P_WAIT the result is the exit code when the process
        exits normally, or -SIG when it was killed by signal SIG."""
        return _spawnvef(mode, file, args, None, execvp)

    def spawnvpe(mode, file, args, env):
        """spawnvpe(mode, file, args, env) -> integer

        Run file (searched for along $PATH) in a subprocess, passing it
        the arguments in args and the environment env.
        With mode == P_NOWAIT the result is the pid of the new process.
        With mode == P_WAIT the result is the exit code when the process
        exits normally, or -SIG when it was killed by signal SIG."""
        return _spawnvef(mode, file, args, env, execvpe)


    __all__.extend(["spawnv", "spawnve", "spawnvp", "spawnvpe"])
918
919
if _exists("spawnv"):
    # These aren't supplied by the basic Windows code
    # but can be easily implemented in Python

    def spawnl(mode, file, *args):
        """spawnl(mode, file, *args) -> integer

        Run file in a subprocess, passing it the positional args.
        With mode == P_NOWAIT the result is the pid of the new process.
        With mode == P_WAIT the result is the exit code when the process
        exits normally, or -SIG when it was killed by signal SIG."""
        return spawnv(mode, file, args)

    def spawnle(mode, file, *args):
        """spawnle(mode, file, *args, env) -> integer

        Run file in a subprocess, passing it the positional args; the
        last positional argument is the environment for the new process.
        With mode == P_NOWAIT the result is the pid of the new process.
        With mode == P_WAIT the result is the exit code when the process
        exits normally, or -SIG when it was killed by signal SIG."""
        # The trailing positional argument is the environment mapping.
        return spawnve(mode, file, args[:-1], args[-1])


    __all__.extend(["spawnl", "spawnle"])
Andrew MacIntyre69e18c92004-04-04 07:11:43 +0000946
947
if _exists("spawnvp"):
    # At the moment, Windows doesn't implement spawnvp[e],
    # so it won't have spawnlp[e] either.
    def spawnlp(mode, file, *args):
        """spawnlp(mode, file, *args) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess.  The new process is started through
        spawnvp(), so no separate environment is passed.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits normally;
        otherwise return -SIG, where SIG is the signal that killed it. """
        return spawnvp(mode, file, args)

    def spawnlpe(mode, file, *args):
        """spawnlpe(mode, file, *args, env) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess with the supplied environment.  The
        environment is the last positional argument.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits normally;
        otherwise return -SIG, where SIG is the signal that killed it. """
        # Split off the trailing environment before forwarding the rest.
        env = args[-1]
        return spawnvpe(mode, file, args[:-1], env)


    __all__.extend(["spawnlp", "spawnlpe"])
974
Skip Montanaro269b83b2001-02-06 01:07:02 +0000975
Guido van Rossumc2f93dc2007-05-24 00:50:02 +0000976# Supply os.popen()
def popen(cmd, mode="r", buffering=-1):
    """Run *cmd* through the shell and return a text stream tied to it.

    With mode "r" the stream reads the command's standard output; with
    mode "w" it writes to the command's standard input.  The returned
    object proxies the stream, and its close() waits for the command.

    Raises TypeError if *cmd* is not a str, and ValueError for any other
    mode or for an unbuffered request (buffering of 0 or None).
    """
    if not isinstance(cmd, str):
        raise TypeError("invalid cmd type (%s, expected string)" % type(cmd))
    if mode not in ("r", "w"):
        raise ValueError("invalid mode %r" % mode)
    if buffering == 0 or buffering is None:
        raise ValueError("popen() does not support unbuffered streams")
    import subprocess
    import io
    # Only one end of the child is piped; which one depends on the mode.
    pipe_end = "stdout" if mode == "r" else "stdin"
    proc = subprocess.Popen(cmd,
                            shell=True,
                            bufsize=buffering,
                            **{pipe_end: subprocess.PIPE})
    return _wrap_close(io.TextIOWrapper(getattr(proc, pipe_end)), proc)
997
998# Helper for popen() -- a proxy for a file whose close waits for the process
999class _wrap_close:
1000 def __init__(self, stream, proc):
1001 self._stream = stream
1002 self._proc = proc
1003 def close(self):
1004 self._stream.close()
Amaury Forgeot d'Arc97e5f282009-07-11 09:35:13 +00001005 returncode = self._proc.wait()
1006 if returncode == 0:
1007 return None
1008 if name == 'nt':
1009 return returncode
1010 else:
1011 return returncode << 8 # Shift left to match old behavior
Antoine Pitrouac625352009-12-09 00:01:27 +00001012 def __enter__(self):
1013 return self
1014 def __exit__(self, *args):
1015 self.close()
Guido van Rossumc2f93dc2007-05-24 00:50:02 +00001016 def __getattr__(self, name):
1017 return getattr(self._stream, name)
Thomas Heller476157b2007-09-04 11:27:47 +00001018 def __iter__(self):
1019 return iter(self._stream)
Guido van Rossumc2f93dc2007-05-24 00:50:02 +00001020
Amaury Forgeot d'Arcbdbddf82008-08-01 00:06:49 +00001021# Supply os.fdopen()
def fdopen(fd, *args, **kwargs):
    """Open the integer file descriptor *fd* and return a file object.

    All further arguments are handed to io.open() unchanged.  Raises
    TypeError if *fd* is not an int.
    """
    if isinstance(fd, int):
        import io
        return io.open(fd, *args, **kwargs)
    raise TypeError("invalid fd type (%s, expected integer)" % type(fd))
Ethan Furmancdc08792016-06-02 15:06:09 -07001027
Brett Cannonc78ca1e2016-06-24 12:03:43 -07001028
1029# For testing purposes, make sure the function is available when the C
1030# implementation exists.
1031def _fspath(path):
1032 """Return the path representation of a path-like object.
1033
1034 If str or bytes is passed in, it is returned unchanged. Otherwise the
1035 os.PathLike interface is used to get the path representation. If the
1036 path representation is not str or bytes, TypeError is raised. If the
1037 provided path is not str, bytes, or os.PathLike, TypeError is raised.
1038 """
1039 if isinstance(path, (str, bytes)):
1040 return path
1041
1042 # Work from the object's type to match method resolution of other magic
1043 # methods.
1044 path_type = type(path)
1045 try:
1046 path_repr = path_type.__fspath__(path)
1047 except AttributeError:
1048 if hasattr(path_type, '__fspath__'):
1049 raise
1050 else:
1051 raise TypeError("expected str, bytes or os.PathLike object, "
1052 "not " + path_type.__name__)
1053 if isinstance(path_repr, (str, bytes)):
1054 return path_repr
1055 else:
1056 raise TypeError("expected {}.__fspath__() to return str or bytes, "
1057 "not {}".format(path_type.__name__,
1058 type(path_repr).__name__))
1059
# When no C implementation of fspath() is present, publish the pure Python
# one under the public name, and give it the public __name__ so the
# substitution is as transparent as possible.
if not _exists('fspath'):
    fspath = _fspath
    fspath.__name__ = "fspath"
Ethan Furmancdc08792016-06-02 15:06:09 -07001065
Ethan Furman958b3e42016-06-04 12:49:35 -07001066
class PathLike(abc.ABC):

    """Abstract base class for implementing the file system path protocol."""

    @abc.abstractmethod
    def __fspath__(self):
        """Return the file system path representation of the object."""
        raise NotImplementedError

    @classmethod
    def __subclasshook__(cls, subclass):
        """Treat any class that defines __fspath__ as a PathLike subclass.

        The structural check applies to PathLike itself only.  Classes
        derived from PathLike inherit this hook, and without the guard
        every class with an __fspath__ attribute would be reported as a
        subclass of each of them; returning NotImplemented hands those
        checks back to the regular ABC machinery.
        """
        if cls is PathLike:
            return hasattr(subclass, '__fspath__')
        return NotImplemented