blob: e293ecae7fd3a4ed40d5c4846ba147c22203be2f [file] [log] [blame]
r"""OS routines for NT or Posix depending on what system we're on.

This exports:
  - all functions from posix or nt, e.g. unlink, stat, etc.
  - os.path is either posixpath or ntpath
  - os.name is either 'posix' or 'nt'
  - os.curdir is a string representing the current directory (always '.')
  - os.pardir is a string representing the parent directory (always '..')
  - os.sep is the (or a most common) pathname separator ('/' or '\\')
  - os.extsep is the extension separator (always '.')
  - os.altsep is the alternate pathname separator (None or '/')
  - os.pathsep is the component separator used in $PATH etc
  - os.linesep is the line separator in text files ('\r' or '\n' or '\r\n')
  - os.defpath is the default search path for executables
  - os.devnull is the file path of the null device ('/dev/null', etc.)

Programs that import and use 'os' stand a better chance of being
portable between different platforms.  Of course, they must then
only use functions that are defined by all platforms (e.g., unlink
and opendir), and leave all pathname manipulation to os.path
(e.g., split and join).
"""
Guido van Rossum31104f41992-01-14 18:28:36 +000023
Skip Montanaro269b83b2001-02-06 01:07:02 +000024#'
Ethan Furman958b3e42016-06-04 12:49:35 -070025import abc
Christian Heimes45f9af32007-11-27 21:50:00 +000026import sys, errno
Charles-François Natali7372b062012-02-05 15:15:38 +010027import stat as st
Guido van Rossuma28dab51997-08-29 22:36:47 +000028
# Names of the modules compiled into this interpreter; consulted below to
# decide which platform implementation module ('posix' or 'nt') to wrap.
_names = sys.builtin_module_names

# Note: more names are added to __all__ later (platform exports, the
# directory helpers, the exec* family, ...).
__all__ = ["altsep", "curdir", "pardir", "sep", "pathsep", "linesep",
           "defpath", "name", "path", "devnull", "SEEK_SET", "SEEK_CUR",
           "SEEK_END", "fsencode", "fsdecode", "get_exec_path", "fdopen",
           "popen", "extsep"]
Skip Montanaro269b83b2001-02-06 01:07:02 +000036
def _exists(name):
    """Return True if *name* is currently bound in this module's globals."""
    module_namespace = globals()
    return name in module_namespace
39
def _get_exports_list(module):
    """Return the public names of *module* as a new list.

    The module's ``__all__`` is used when it has one; otherwise every name
    reported by dir() that does not start with an underscore is returned.
    """
    try:
        exports = list(module.__all__)
    except AttributeError:
        # No explicit export list: fall back to the non-underscore names.
        exports = [attr for attr in dir(module) if attr[0] != '_']
    return exports
45
# Any new dependencies of the os module and/or changes in path separator
# require updating importlib as well.
# Select the platform implementation module.  Exactly one branch runs; each
# binds `name`, `linesep` and `path`, re-exports the implementation module's
# functions, and records its public names in __all__.
if 'posix' in _names:
    name = 'posix'
    linesep = '\n'
    from posix import *
    # A star-import does not bind underscore-prefixed names (unless the
    # module lists them in __all__), so _exit is imported explicitly and
    # exported by hand when available.
    try:
        from posix import _exit
        __all__.append('_exit')
    except ImportError:
        pass
    import posixpath as path

    # _have_functions is optional; the capability sets further down are only
    # built when it could be imported.
    try:
        from posix import _have_functions
    except ImportError:
        pass

    # Bind the module only long enough to copy its export list.
    import posix
    __all__.extend(_get_exports_list(posix))
    del posix

elif 'nt' in _names:
    name = 'nt'
    linesep = '\r\n'
    from nt import *
    # Same explicit handling of the underscore-prefixed _exit as above.
    try:
        from nt import _exit
        __all__.append('_exit')
    except ImportError:
        pass
    import ntpath as path

    # Bind the module only long enough to copy its export list.
    import nt
    __all__.extend(_get_exports_list(nt))
    del nt

    # _have_functions is optional here as well.
    try:
        from nt import _have_functions
    except ImportError:
        pass

else:
    # Neither implementation module is built into this interpreter.
    raise ImportError('no os specific module found')
Guido van Rossume65cce51993-11-08 15:05:21 +000090
# Register the selected path module under the name 'os.path' so that the
# `from os.path import ...` statement just below (and `import os.path`
# elsewhere) resolves to it.
sys.modules['os.path'] = path
from os.path import (curdir, pardir, sep, pathsep, defpath, extsep, altsep,
    devnull)

# _names was only needed for the platform selection above.
del _names
96
Larry Hastings9cf065c2012-06-22 16:30:09 -070097
# Build the supports_* capability sets.  Each set contains the function
# objects from this module's globals whose corresponding feature flag is
# present in _have_functions.  The block only runs when the platform
# module provided _have_functions.
if _exists("_have_functions"):
    _globals = globals()
    def _add(str, fn):
        # Add the global function named `fn` to the set currently bound to
        # the module-level name `_set`, provided that the function exists
        # and the feature flag `str` is listed in _have_functions.
        if (fn in _globals) and (str in _have_functions):
            _set.add(_globals[fn])

    # Functions that are given a dir_fd-capable feature flag.
    _set = set()
    _add("HAVE_FACCESSAT",  "access")
    _add("HAVE_FCHMODAT",   "chmod")
    _add("HAVE_FCHOWNAT",   "chown")
    _add("HAVE_FSTATAT",    "stat")
    _add("HAVE_FUTIMESAT",  "utime")
    _add("HAVE_LINKAT",     "link")
    _add("HAVE_MKDIRAT",    "mkdir")
    _add("HAVE_MKFIFOAT",   "mkfifo")
    _add("HAVE_MKNODAT",    "mknod")
    _add("HAVE_OPENAT",     "open")
    _add("HAVE_READLINKAT", "readlink")
    _add("HAVE_RENAMEAT",   "rename")
    _add("HAVE_SYMLINKAT",  "symlink")
    _add("HAVE_UNLINKAT",   "unlink")
    _add("HAVE_UNLINKAT",   "rmdir")
    _add("HAVE_UTIMENSAT",  "utime")
    supports_dir_fd = _set

    _set = set()
    _add("HAVE_FACCESSAT",  "access")
    supports_effective_ids = _set

    # Functions that are given an fd-capable feature flag.
    _set = set()
    _add("HAVE_FCHDIR",     "chdir")
    _add("HAVE_FCHMOD",     "chmod")
    _add("HAVE_FCHOWN",     "chown")
    _add("HAVE_FDOPENDIR",  "listdir")
    _add("HAVE_FDOPENDIR",  "scandir")
    _add("HAVE_FEXECVE",    "execve")
    _set.add(stat) # fstat always works
    _add("HAVE_FTRUNCATE",  "truncate")
    _add("HAVE_FUTIMENS",   "utime")
    _add("HAVE_FUTIMES",    "utime")
    _add("HAVE_FPATHCONF",  "pathconf")
    if _exists("statvfs") and _exists("fstatvfs"): # mac os x10.3
        _add("HAVE_FSTATVFS", "statvfs")
    supports_fd = _set

    _set = set()
    _add("HAVE_FACCESSAT",  "access")
    # Some platforms don't support lchmod().  Often the function exists
    # anyway, as a stub that always returns ENOSUP or perhaps EOPNOTSUPP.
    # (No, I don't know why that's a good design.)  ./configure will detect
    # this and reject it--so HAVE_LCHMOD still won't be defined on such
    # platforms.  This is Very Helpful.
    #
    # However, sometimes platforms without a working lchmod() *do* have
    # fchmodat().  (Examples: Linux kernel 3.2 with glibc 2.15,
    # OpenIndiana 3.x.)  And fchmodat() has a flag that theoretically makes
    # it behave like lchmod().  So in theory it would be a suitable
    # replacement for lchmod().  But when lchmod() doesn't work, fchmodat()'s
    # flag doesn't work *either*.  Sadly ./configure isn't sophisticated
    # enough to detect this condition--it only determines whether or not
    # fchmodat() minimally works.
    #
    # Therefore we simply ignore fchmodat() when deciding whether or not
    # os.chmod supports follow_symlinks.  Just checking lchmod() is
    # sufficient.  After all--if you have a working fchmodat(), your
    # lchmod() almost certainly works too.
    #
    # _add("HAVE_FCHMODAT",   "chmod")
    _add("HAVE_FCHOWNAT",   "chown")
    _add("HAVE_FSTATAT",    "stat")
    _add("HAVE_LCHFLAGS",   "chflags")
    _add("HAVE_LCHMOD",     "chmod")
    if _exists("lchown"): # mac os x10.3
        _add("HAVE_LCHOWN", "chown")
    _add("HAVE_LINKAT",     "link")
    _add("HAVE_LUTIMES",    "utime")
    _add("HAVE_LSTAT",      "stat")
    # Repeats the HAVE_FSTATAT entry above; harmless because _set is a set.
    _add("HAVE_FSTATAT",    "stat")
    _add("HAVE_UTIMENSAT",  "utime")
    _add("MS_WINDOWS",      "stat")
    supports_follow_symlinks = _set

    # Remove the scaffolding so that only the supports_* sets remain.
    del _set
    del _have_functions
    del _globals
    del _add
184
185
# Python uses fixed values for the SEEK_ constants; they are mapped
# to native constants if necessary in posixmodule.c.
# Other possible SEEK values are directly imported from posixmodule.c.
SEEK_SET = 0
SEEK_CUR = 1
SEEK_END = 2
192
Guido van Rossum4def7de1998-07-24 20:48:03 +0000193# Super directory utilities.
194# (Inspired by Eric Raymond; the doc strings are mostly his)
195
def makedirs(name, mode=0o777, exist_ok=False):
    """makedirs(name [, mode=0o777][, exist_ok=False])

    Recursive mkdir: create the leaf directory *name* together with every
    missing intermediate directory.  *mode* is passed to mkdir for the leaf
    only; missing parents are created by recursive calls that use the
    default mode.  If the leaf already exists as a directory, OSError is
    raised unless *exist_ok* is true.

    """
    parent, leaf = path.split(name)
    if not leaf:
        # Trailing separator: split once more to find the last component.
        parent, leaf = path.split(parent)
    if parent and leaf and not path.exists(parent):
        try:
            makedirs(parent, exist_ok=exist_ok)
        except FileExistsError:
            # Another thread or process created the parent in the meantime.
            pass
        # Compare against curdir in the same type (str or bytes) as the path.
        this_dir = bytes(curdir, 'ASCII') if isinstance(leaf, bytes) else curdir
        if leaf == this_dir:
            # xxx/newdir/. exists if xxx/newdir exists
            return
    try:
        mkdir(name, mode)
    except OSError:
        # EEXIST cannot be relied upon: the operating system may report a
        # different error (EACCES, EROFS, ...) first.  So check directly
        # whether the directory is there.
        if exist_ok and path.isdir(name):
            return
        raise
Guido van Rossum4def7de1998-07-24 20:48:03 +0000227
def removedirs(name):
    """removedirs(name)

    Recursive rmdir: remove the leaf directory *name*, then walk up the
    path removing each parent in turn.  Removal of the leaf must succeed
    (its error propagates); the upward pruning stops silently at the first
    parent that cannot be removed, which usually means it is not empty.

    """
    rmdir(name)
    parent, leaf = path.split(name)
    if not leaf:
        # Trailing separator: split once more to find the real parent.
        parent, leaf = path.split(parent)
    while parent and leaf:
        try:
            rmdir(parent)
        except OSError:
            return
        parent, leaf = path.split(parent)
249
def renames(old, new):
    """renames(old, new)

    Recursive rename: first create any missing directories needed for
    *new*, then rename *old* to *new*, and finally prune the directories
    of the old path from the right for as long as they can be removed.

    Note: this function can fail with the new directory structure made
    if you lack permissions needed to unlink the leaf directory or
    file.

    """
    new_parent, new_leaf = path.split(new)
    if new_parent and new_leaf and not path.exists(new_parent):
        makedirs(new_parent)
    rename(old, new)
    old_parent, old_leaf = path.split(old)
    if not (old_parent and old_leaf):
        return
    try:
        removedirs(old_parent)
    except OSError:
        # Best effort: the old directories are simply left in place.
        pass
275
# Export the recursive directory helpers.
__all__.extend(["makedirs", "removedirs", "renames"])
277
def walk(top, topdown=True, onerror=None, followlinks=False):
    """Directory tree generator.

    For each directory in the directory tree rooted at top (including top
    itself, but excluding '.' and '..'), yields a 3-tuple

        dirpath, dirnames, filenames

    dirpath is a string, the path to the directory.  dirnames is a list of
    the names of the subdirectories in dirpath (excluding '.' and '..').
    filenames is a list of the names of the non-directory files in dirpath.
    Note that the names in the lists are just names, with no path components.
    To get a full path (which begins with top) to a file or directory in
    dirpath, do os.path.join(dirpath, name).

    If optional arg 'topdown' is true or not specified, the triple for a
    directory is generated before the triples for any of its subdirectories
    (directories are generated top down).  If topdown is false, the triple
    for a directory is generated after the triples for all of its
    subdirectories (directories are generated bottom up).

    When topdown is true, the caller can modify the dirnames list in-place
    (e.g., via del or slice assignment), and walk will only recurse into the
    subdirectories whose names remain in dirnames; this can be used to prune the
    search, or to impose a specific order of visiting.  Modifying dirnames when
    topdown is false is ineffective, since the directories in dirnames have
    already been generated by the time dirnames itself is generated. No matter
    the value of topdown, the list of subdirectories is retrieved before the
    tuples for the directory and its subdirectories are generated.

    By default errors from the os.scandir() call are ignored.  If
    optional arg 'onerror' is specified, it should be a function; it
    will be called with one argument, an OSError instance.  It can
    report the error to continue with the walk, or raise the exception
    to abort the walk.  Note that the filename is available as the
    filename attribute of the exception object.

    By default, os.walk does not follow symbolic links to subdirectories on
    systems that support them.  In order to get this functionality, set the
    optional argument 'followlinks' to true.

    Caution:  if you pass a relative pathname for top, don't change the
    current working directory between resumptions of walk.  walk never
    changes the current directory, and assumes that the client doesn't
    either.

    Example:

    import os
    from os.path import join, getsize
    for root, dirs, files in os.walk('python/Lib/email'):
        print(root, "consumes", end="")
        print(sum([getsize(join(root, name)) for name in files]), end="")
        print("bytes in", len(files), "non-directory files")
        if 'CVS' in dirs:
            dirs.remove('CVS')  # don't visit CVS directories

    """
    top = fspath(top)
    dirs = []
    nondirs = []
    # Paths to recurse into; only filled in when walking bottom-up.
    walk_dirs = []

    # We may not have read permission for top, in which case we can't
    # get a list of the files the directory contains.  os.walk
    # always suppressed the exception then, rather than blow up for a
    # minor reason when (say) a thousand readable directories are still
    # left to visit.  That logic is copied here.
    try:
        # Note that scandir is global in this module due
        # to earlier import-*.
        scandir_it = scandir(top)
    except OSError as error:
        if onerror is not None:
            onerror(error)
        return

    with scandir_it:
        while True:
            # next() is called by hand so that an OSError raised while
            # advancing the iterator can be reported through onerror; the
            # walk of this directory then ends without yielding anything.
            try:
                try:
                    entry = next(scandir_it)
                except StopIteration:
                    break
            except OSError as error:
                if onerror is not None:
                    onerror(error)
                return

            try:
                is_dir = entry.is_dir()
            except OSError:
                # If is_dir() raises an OSError, consider that the entry is not
                # a directory, same behaviour as os.path.isdir().
                is_dir = False

            if is_dir:
                dirs.append(entry.name)
            else:
                nondirs.append(entry.name)

            if not topdown and is_dir:
                # Bottom-up: recurse into sub-directory, but exclude symlinks to
                # directories if followlinks is False
                if followlinks:
                    walk_into = True
                else:
                    try:
                        is_symlink = entry.is_symlink()
                    except OSError:
                        # If is_symlink() raises an OSError, consider that the
                        # entry is not a symbolic link, same behaviour as
                        # os.path.islink().
                        is_symlink = False
                    walk_into = not is_symlink

                if walk_into:
                    walk_dirs.append(entry.path)

    # Yield before recursion if going top down
    if topdown:
        yield top, dirs, nondirs

        # Recurse into sub-directories
        islink, join = path.islink, path.join
        for dirname in dirs:
            new_path = join(top, dirname)
            # Issue #23605: os.path.islink() is used instead of caching
            # entry.is_symlink() result during the loop on os.scandir() because
            # the caller can replace the directory entry during the "yield"
            # above.
            if followlinks or not islink(new_path):
                yield from walk(new_path, topdown, onerror, followlinks)
    else:
        # Recurse into sub-directories
        for new_path in walk_dirs:
            yield from walk(new_path, topdown, onerror, followlinks)
        # Yield after recursion if going bottom up
        yield top, dirs, nondirs
417
# Export the directory tree generator.
__all__.append("walk")
419
# fwalk() is only defined when open() and stat() accept dir_fd and
# scandir() and stat() accept a file descriptor.
if {open, stat} <= supports_dir_fd and {scandir, stat} <= supports_fd:

    def fwalk(top=".", topdown=True, onerror=None, *, follow_symlinks=False, dir_fd=None):
        """Directory tree generator.

        This behaves exactly like walk(), except that it yields a 4-tuple

            dirpath, dirnames, filenames, dirfd

        `dirpath`, `dirnames` and `filenames` are identical to walk() output,
        and `dirfd` is a file descriptor referring to the directory `dirpath`.

        The advantage of fwalk() over walk() is that it's safe against symlink
        races (when follow_symlinks is False).

        If dir_fd is not None, it should be a file descriptor open to a directory,
          and top should be relative; top will then be relative to that directory.
          (dir_fd is always supported for fwalk.)

        Caution:
        Since fwalk() yields file descriptors, those are only valid until the
        next iteration step, so you should dup() them if you want to keep them
        for a longer period.

        Example:

        import os
        for root, dirs, files, rootfd in os.fwalk('python/Lib/email'):
            print(root, "consumes", end="")
            print(sum([os.stat(name, dir_fd=rootfd).st_size for name in files]),
                  end="")
            print("bytes in", len(files), "non-directory files")
            if 'CVS' in dirs:
                dirs.remove('CVS')  # don't visit CVS directories
        """
        # NOTE(review): because the two tests are joined with `or`, this
        # condition appears to reduce to `not isinstance(top, int)` (ints
        # always provide __index__), so the hasattr() test looks redundant
        # -- confirm the intended behaviour for non-int __index__ objects.
        if not isinstance(top, int) or not hasattr(top, '__index__'):
            top = fspath(top)
        # Note: To guard against symlink races, we use the standard
        # lstat()/open()/fstat() trick.
        if not follow_symlinks:
            orig_st = stat(top, follow_symlinks=False, dir_fd=dir_fd)
        topfd = open(top, O_RDONLY, dir_fd=dir_fd)
        try:
            # orig_st is only bound when follow_symlinks is false; the
            # short-circuiting `or` keeps it from being read otherwise.
            if (follow_symlinks or (st.S_ISDIR(orig_st.st_mode) and
                                    path.samestat(orig_st, stat(topfd)))):
                yield from _fwalk(topfd, top, isinstance(top, bytes),
                                  topdown, onerror, follow_symlinks)
        finally:
            close(topfd)

    def _fwalk(topfd, toppath, isbytes, topdown, onerror, follow_symlinks):
        # Recursive worker for fwalk(): topfd is an open descriptor for the
        # directory whose path (as reported to the caller) is toppath.
        #
        # Note: This uses O(depth of the directory tree) file descriptors: if
        # necessary, it can be adapted to only require O(1) FDs, see issue
        # #13734.

        scandir_it = scandir(topfd)
        dirs = []
        nondirs = []
        # DirEntry objects are kept (parallel to dirs) only for a bottom-up
        # walk that does not follow symlinks; they supply the lstat result
        # used for the symlink-race check below.
        entries = None if topdown or follow_symlinks else []
        for entry in scandir_it:
            name = entry.name
            if isbytes:
                name = fsencode(name)
            try:
                if entry.is_dir():
                    dirs.append(name)
                    if entries is not None:
                        entries.append(entry)
                else:
                    nondirs.append(name)
            except OSError:
                try:
                    # Add dangling symlinks, ignore disappeared files
                    if entry.is_symlink():
                        nondirs.append(name)
                except OSError:
                    pass

        if topdown:
            yield toppath, dirs, nondirs, topfd

        for name in dirs if entries is None else zip(dirs, entries):
            try:
                if not follow_symlinks:
                    if topdown:
                        # Stat by name relative to topfd (presumably because
                        # the caller may have edited dirs during the yield
                        # above -- confirm).
                        orig_st = stat(name, dir_fd=topfd, follow_symlinks=False)
                    else:
                        assert entries is not None
                        # In this mode the loop variable is a (name, entry)
                        # pair produced by zip().
                        name, entry = name
                        orig_st = entry.stat(follow_symlinks=False)
                dirfd = open(name, O_RDONLY, dir_fd=topfd)
            except OSError as err:
                if onerror is not None:
                    onerror(err)
                continue
            try:
                # Descend only if the opened descriptor refers to the same
                # file that was stat'ed without following symlinks.
                if follow_symlinks or path.samestat(orig_st, stat(dirfd)):
                    dirpath = path.join(toppath, name)
                    yield from _fwalk(dirfd, dirpath, isbytes,
                                      topdown, onerror, follow_symlinks)
            finally:
                close(dirfd)

        if not topdown:
            yield toppath, dirs, nondirs, topfd

    __all__.append("fwalk")
526 __all__.append("fwalk")
527
# Make sure os.environ exists, at least.  If no `environ` name has been
# bound by this point, fall back to an empty dict.
try:
    environ
except NameError:
    environ = {}
Guido van Rossuma28dab51997-08-29 22:36:47 +0000533
def execl(file, *args):
    """execl(file, *args)

    Replace the current process with the executable file, using the
    positional arguments args as its argument list. """
    argv = args
    execv(file, argv)
Guido van Rossume65cce51993-11-08 15:05:21 +0000540
def execle(file, *args):
    """execle(file, *args, env)

    Replace the current process with the executable file.  The last
    positional argument is the environment env; the arguments before it
    form the argument list. """
    argv, env = args[:-1], args[-1]
    execve(file, argv, env)
Guido van Rossume65cce51993-11-08 15:05:21 +0000548
def execlp(file, *args):
    """execlp(file, *args)

    Replace the current process with the executable file, which is looked
    up along $PATH, using the positional arguments args as its argument
    list. """
    argv = args
    execvp(file, argv)
Guido van Rossume65cce51993-11-08 15:05:21 +0000555
def execlpe(file, *args):
    """execlpe(file, *args, env)

    Replace the current process with the executable file, which is looked
    up along $PATH.  The last positional argument is the environment env;
    the arguments before it form the argument list. """
    argv, env = args[:-1], args[-1]
    execvpe(file, argv, env)
Guido van Rossum030afb11995-03-14 17:27:18 +0000564
def execvp(file, args):
    """execvp(file, args)

    Replace the current process with the executable file, which is looked
    up along $PATH, using args as its argument list.
    args may be a list or tuple of strings. """
    _execvpe(file, args, env=None)
Guido van Rossum030afb11995-03-14 17:27:18 +0000572
def execvpe(file, args, env):
    """execvpe(file, args, env)

    Replace the current process with the executable file, which is looked
    up along $PATH, using args as its argument list and env as its
    environment.
    args may be a list or tuple of strings. """
    _execvpe(file, args, env=env)
Guido van Rossum030afb11995-03-14 17:27:18 +0000581
# Export the exec* convenience wrappers.
__all__.extend(["execl","execle","execlp","execlpe","execvp","execvpe"])
583
def _execvpe(file, args, env=None):
    """Shared implementation of execvp() and execvpe().

    file -- program to execute.  If it has a directory component it is
            executed as given; otherwise every directory returned by
            get_exec_path() is tried in order.
    args -- argument list handed to the underlying exec call.
    env  -- environment for the new program.  When None, execv() is used
            and the search path is taken from os.environ.

    Does not return on success, because the process image is replaced.
    If every candidate fails, the first OSError that is neither ENOENT nor
    ENOTDIR is raised; if all failures were of those two kinds, the last
    one is raised.
    """
    if env is not None:
        exec_func = execve
        argrest = (args, env)
    else:
        exec_func = execv
        argrest = (args,)
        env = environ

    head, tail = path.split(file)
    if head:
        # An explicit directory component disables the PATH search.
        exec_func(file, *argrest)
        return

    # Exceptions keep their own __traceback__, so the exception objects are
    # all that needs to be remembered for re-raising after the loop.
    last_exc = saved_exc = None
    path_list = get_exec_path(env)
    if name != 'nt':
        file = fsencode(file)
        path_list = map(fsencode, path_list)
    for dir in path_list:
        fullname = path.join(dir, file)
        try:
            exec_func(fullname, *argrest)
        except OSError as e:
            last_exc = e
            # "Not found" errors just mean: try the next directory.  Any
            # other error is more informative, so remember the first one.
            if (saved_exc is None
                    and e.errno not in (errno.ENOENT, errno.ENOTDIR)):
                saved_exc = e
    if saved_exc is not None:
        raise saved_exc
    raise last_exc
Guido van Rossumd74fb6b2001-03-02 06:43:49 +0000617
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000618
def get_exec_path(env=None):
    """Return the list of directories searched for a named executable.

    *env* must be an environment mapping or None; os.environ is used when
    it is None.  The value is read from the 'PATH' key or, where bytes
    environments are supported, from the b'PATH' key (decoded with
    fsdecode()).  ValueError is raised if both keys are present.  When
    neither is set, os.defpath is used.  The result is the path string
    split on os.pathsep.
    """
    # Imported here rather than at module level: os is loaded at every
    # interpreter startup, so this keeps the set of modules loaded at
    # startup small.  It may also avoid a bootstrap issue.
    import warnings

    mapping = environ if env is None else env

    # Looking up a str key in a bytes-keyed dict (or the reverse) emits a
    # BytesWarning under "python -b" / "python -bb"; ignore it here.
    with warnings.catch_warnings():
        warnings.simplefilter("ignore", BytesWarning)

        try:
            search_path = mapping.get('PATH')
        except TypeError:
            search_path = None

        if supports_bytes_environ:
            try:
                raw_search_path = mapping[b'PATH']
            except (KeyError, TypeError):
                pass
            else:
                if search_path is not None:
                    raise ValueError(
                        "env cannot contain 'PATH' and b'PATH' keys")
                search_path = raw_search_path

            if isinstance(search_path, bytes):
                search_path = fsdecode(search_path)

    if search_path is None:
        search_path = defpath
    return search_path.split(pathsep)
Gregory P. Smithb6e8c7e2010-02-27 07:22:22 +0000661
662
Skip Montanaro289bc052007-08-17 02:30:27 +0000663# Change environ to automatically call putenv(), unsetenv if they exist.
Christian Heimesf1dc3ee2013-10-13 02:04:20 +0200664from _collections_abc import MutableMapping
Skip Montanaro289bc052007-08-17 02:30:27 +0000665
class _Environ(MutableMapping):
    """Mutable mapping over an environment dict that mirrors every change.

    Keys and values are stored in *data* in encoded form.  The four codec
    callables translate between the caller-facing and the stored
    representation, and *putenv* / *unsetenv* are called with the encoded
    key (and value) whenever an item is set or deleted.
    """

    def __init__(self, data, encodekey, decodekey, encodevalue, decodevalue,
                 putenv, unsetenv):
        self.encodekey = encodekey
        self.decodekey = decodekey
        self.encodevalue = encodevalue
        self.decodevalue = decodevalue
        self.putenv = putenv
        self.unsetenv = unsetenv
        self._data = data

    def __getitem__(self, key):
        try:
            value = self._data[self.encodekey(key)]
        except KeyError:
            # raise KeyError with the original key value
            raise KeyError(key) from None
        return self.decodevalue(value)

    def __setitem__(self, key, value):
        key = self.encodekey(key)
        value = self.encodevalue(value)
        # Call putenv first so the stored data is only updated when
        # putenv did not raise.
        self.putenv(key, value)
        self._data[key] = value

    def __delitem__(self, key):
        encodedkey = self.encodekey(key)
        self.unsetenv(encodedkey)
        try:
            del self._data[encodedkey]
        except KeyError:
            # raise KeyError with the original key value
            raise KeyError(key) from None

    def __iter__(self):
        # Iterate over a snapshot of the keys.  Walking self._data directly
        # raises "dictionary changed size during iteration" as soon as a
        # variable is set or deleted while the environment is being
        # iterated.
        keys = list(self._data)
        for key in keys:
            yield self.decodekey(key)

    def __len__(self):
        return len(self._data)

    def __repr__(self):
        return 'environ({{{}}})'.format(', '.join(
            ('{!r}: {!r}'.format(self.decodekey(key), self.decodevalue(value))
            for key, value in self._data.items())))

    def copy(self):
        """Return a plain dict holding the decoded keys and values."""
        return dict(self)

    def setdefault(self, key, value):
        """Set *key* to *value* if it is missing; return the stored value."""
        if key not in self:
            self[key] = value
        return self[key]
718
# Bind _putenv to the platform putenv() when there is one; otherwise use a
# stand-in that does nothing.
try:
    putenv
except NameError:
    _putenv = lambda key, value: None
else:
    _putenv = putenv
    if "putenv" not in __all__:
        __all__.append("putenv")

# Bind _unsetenv likewise; without a platform unsetenv() the fallback sets
# the variable to the empty string through _putenv.
try:
    unsetenv
except NameError:
    _unsetenv = lambda key: _putenv(key, "")
else:
    _unsetenv = unsetenv
    if "unsetenv" not in __all__:
        __all__.append("unsetenv")
Guido van Rossumc524d952001-10-19 01:31:59 +0000734
def _createenviron():
    """Wrap the raw platform environment in a str-based _Environ mapping.

    On 'nt' the variables are copied into a new dict keyed by the
    upper-cased name, and keys/values must be str.  Elsewhere the raw
    environ is used directly; str keys and values are encoded to and
    decoded from bytes with the filesystem encoding and the
    'surrogateescape' error handler.
    """
    if name == 'nt':
        # Where Env Var Names Must Be UPPERCASE
        def check_str(value):
            if isinstance(value, str):
                return value
            raise TypeError("str expected, not %s" % type(value).__name__)
        encode = check_str
        decode = str
        def encodekey(key):
            return encode(key).upper()
        data = {encodekey(key): value for key, value in environ.items()}
    else:
        # Where Env Var Names Can Be Mixed Case
        fs_encoding = sys.getfilesystemencoding()
        def encode(value):
            if isinstance(value, str):
                return value.encode(fs_encoding, 'surrogateescape')
            raise TypeError("str expected, not %s" % type(value).__name__)
        def decode(value):
            return value.decode(fs_encoding, 'surrogateescape')
        encodekey = encode
        data = environ
    return _Environ(data,
                    encodekey, decode,
                    encode, decode,
                    _putenv, _unsetenv)

# unicode environ: rebind the module-level name to the wrapper and drop
# the one-shot factory.
environ = _createenviron()
del _createenviron
Guido van Rossum61de0ac1997-12-05 21:24:30 +0000768
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000769
def getenv(key, default=None):
    """Return the value of the environment variable *key*.

    If the variable does not exist, *default* is returned instead (None
    unless another value is given).
    key, default and the result are str."""
    try:
        return environ[key]
    except KeyError:
        return default
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000775
# True on every platform except 'nt'.
supports_bytes_environ = name != 'nt'
__all__ += ["getenv", "supports_bytes_environ"]
778
if supports_bytes_environ:
    def _check_bytes(value):
        # Codec for the bytes view: pass bytes through, reject the rest.
        if isinstance(value, bytes):
            return value
        raise TypeError("bytes expected, not %s" % type(value).__name__)

    # bytes environ: shares the underlying data of the str-based environ.
    environb = _Environ(data=environ._data,
                        encodekey=_check_bytes, decodekey=bytes,
                        encodevalue=_check_bytes, decodevalue=bytes,
                        putenv=_putenv, unsetenv=_unsetenv)
    del _check_bytes

    def getenvb(key, default=None):
        """Return the value of the environment variable *key*.

        If the variable does not exist, *default* is returned instead
        (None unless another value is given).
        key, default and the result are bytes."""
        return environb.get(key, default)

    __all__ += ["environb", "getenvb"]
Victor Stinner84ae1182010-05-06 22:05:07 +0000799
def _fscodec():
    """Build fsencode() and fsdecode() bound to the filesystem codec.

    The encoding and error handler are read once, from
    sys.getfilesystemencoding() and sys.getfilesystemencodeerrors().
    """
    fs_encoding = sys.getfilesystemencoding()
    fs_errors = sys.getfilesystemencodeerrors()

    def fsencode(filename):
        """Encode filename (an os.PathLike, bytes, or str) to bytes.

        str is encoded with the filesystem encoding and the filesystem
        error handler (see sys.getfilesystemencodeerrors()); bytes is
        returned unchanged.
        """
        filename = fspath(filename)  # Does type-checking of `filename`.
        if not isinstance(filename, str):
            return filename
        return filename.encode(fs_encoding, fs_errors)

    def fsdecode(filename):
        """Decode filename (an os.PathLike, bytes, or str) to str.

        bytes is decoded with the filesystem encoding and the filesystem
        error handler (see sys.getfilesystemencodeerrors()); str is
        returned unchanged.
        """
        filename = fspath(filename)  # Does type-checking of `filename`.
        if not isinstance(filename, bytes):
            return filename
        return filename.decode(fs_encoding, fs_errors)

    return fsencode, fsdecode

# Publish the two codec functions and drop the one-shot factory.
fsencode, fsdecode = _fscodec()
del _fscodec
Victor Stinner449c4662010-05-08 11:10:09 +0000832
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000833# Supply spawn*() (probably only for Unix)
if _exists("fork") and not _exists("spawnv") and _exists("execv"):

    # Mode values accepted by the spawn*() functions.
    P_WAIT = 0
    P_NOWAIT = P_NOWAITO = 1

    __all__.extend(["P_WAIT", "P_NOWAIT", "P_NOWAITO"])

    # XXX Should we support P_DETACH?  I suppose it could fork()**2
    # and close the std I/O streams.  Also, P_OVERLAY is the same
    # as execv*()?

    def _spawnvef(mode, file, args, env, func):
        # Internal helper; func is the exec*() function to use.
        # env is only passed on to func when it is not None.
        if not isinstance(args, (tuple, list)):
            raise TypeError('argv must be a tuple or a list')
        if not args or not args[0]:
            raise ValueError('argv first element cannot be empty')
        pid = fork()
        if not pid:
            # Child: any exception raised by the exec call ends this
            # process with exit status 127.
            exec_args = (file, args) if env is None else (file, args, env)
            try:
                func(*exec_args)
            except:
                _exit(127)
            return None
        # Parent
        if mode == P_NOWAIT:
            return pid  # Caller is responsible for waiting!
        while True:
            _, status = waitpid(pid, 0)
            if WIFSTOPPED(status):
                # Only stopped, not finished: keep waiting.
                continue
            if WIFSIGNALED(status):
                return -WTERMSIG(status)
            if WIFEXITED(status):
                return WEXITSTATUS(status)
            raise OSError("Not stopped, signaled or exited???")

    def spawnv(mode, file, args):
        """spawnv(mode, file, args) -> integer

        Execute file with arguments from args in a subprocess.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        return _spawnvef(mode, file, args, None, execv)

    def spawnve(mode, file, args, env):
        """spawnve(mode, file, args, env) -> integer

        Execute file with arguments from args in a subprocess with the
        specified environment.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        return _spawnvef(mode, file, args, env, execve)

    # Note: spawnvp[e] isn't currently supported on Windows

    def spawnvp(mode, file, args):
        """spawnvp(mode, file, args) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        return _spawnvef(mode, file, args, None, execvp)

    def spawnvpe(mode, file, args, env):
        """spawnvpe(mode, file, args, env) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess with the supplied environment.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        return _spawnvef(mode, file, args, env, execvpe)


    __all__.extend(["spawnv", "spawnve", "spawnvp", "spawnvpe"])
919
920
if _exists("spawnv"):
    # These aren't supplied by the basic Windows code
    # but can be easily implemented in Python

    def spawnl(mode, file, *args):
        """spawnl(mode, file, *args) -> integer

        Execute file with arguments from args in a subprocess.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        return spawnv(mode, file, args)

    def spawnle(mode, file, *args):
        """spawnle(mode, file, *args, env) -> integer

        Execute file with arguments from args in a subprocess with the
        supplied environment.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        # The environment is passed as the final positional argument.
        return spawnve(mode, file, args[:-1], args[-1])


    __all__.extend(["spawnl", "spawnle"])
Andrew MacIntyre69e18c92004-04-04 07:11:43 +0000947
948
if _exists("spawnvp"):
    # At the moment, Windows doesn't implement spawnvp[e],
    # so it won't have spawnlp[e] either.
    def spawnlp(mode, file, *args):
        """spawnlp(mode, file, *args) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        return spawnvp(mode, file, args)

    def spawnlpe(mode, file, *args):
        """spawnlpe(mode, file, *args, env) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess with the supplied environment.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it.
        """
        # The environment is passed as the final positional argument.
        return spawnvpe(mode, file, args[:-1], args[-1])


    __all__.extend(["spawnlp", "spawnlpe"])
975
Skip Montanaro269b83b2001-02-06 01:07:02 +0000976
Guido van Rossumc2f93dc2007-05-24 00:50:02 +0000977# Supply os.popen()
def popen(cmd, mode="r", buffering=-1):
    """Run *cmd* through the shell and return a text stream piped to it.

    cmd       -- command line; must be a str, otherwise TypeError.
    mode      -- "r" to read the command's standard output, "w" to write
                 to its standard input; anything else raises ValueError.
    buffering -- passed to subprocess.Popen as bufsize; 0 and None raise
                 ValueError because unbuffered streams are unsupported.

    The returned object wraps the text stream in _wrap_close, whose
    close() also waits for the process.
    """
    if not isinstance(cmd, str):
        raise TypeError("invalid cmd type (%s, expected string)" % type(cmd))
    if mode not in ("r", "w"):
        raise ValueError("invalid mode %r" % mode)
    if buffering == 0 or buffering is None:
        raise ValueError("popen() does not support unbuffered streams")
    import subprocess, io
    # Reading attaches a pipe to the child's stdout, writing to its stdin.
    pipe_end = "stdout" if mode == "r" else "stdin"
    proc = subprocess.Popen(cmd,
                            shell=True,
                            bufsize=buffering,
                            **{pipe_end: subprocess.PIPE})
    return _wrap_close(io.TextIOWrapper(getattr(proc, pipe_end)), proc)
998
999# Helper for popen() -- a proxy for a file whose close waits for the process
class _wrap_close:
    """Proxy for a stream tied to a process; close() waits for the process.

    Attribute access and iteration are forwarded to the wrapped stream.
    """

    def __init__(self, stream, proc):
        self._stream, self._proc = stream, proc

    def close(self):
        """Close the stream, wait for the process and report its status.

        Returns None for a zero return code.  Otherwise returns the return
        code itself on 'nt' and the return code shifted left by 8 bits
        elsewhere.
        """
        self._stream.close()
        status = self._proc.wait()
        if status == 0:
            return None
        # Shift left to match old behavior
        return status if name == 'nt' else status << 8

    def __enter__(self):
        return self

    def __exit__(self, *args):
        self.close()

    def __getattr__(self, name):
        # Only reached for attributes not found on the proxy itself.
        return getattr(self._stream, name)

    def __iter__(self):
        return iter(self._stream)
Guido van Rossumc2f93dc2007-05-24 00:50:02 +00001021
Amaury Forgeot d'Arcbdbddf82008-08-01 00:06:49 +00001022# Supply os.fdopen()
def fdopen(fd, *args, **kwargs):
    """Open the file descriptor *fd* and return the resulting file object.

    *fd* must be an int, otherwise TypeError is raised.  All remaining
    positional and keyword arguments are passed unchanged to io.open().
    """
    if isinstance(fd, int):
        import io
        return io.open(fd, *args, **kwargs)
    raise TypeError("invalid fd type (%s, expected integer)" % type(fd))
Ethan Furmancdc08792016-06-02 15:06:09 -07001028
Brett Cannonc78ca1e2016-06-24 12:03:43 -07001029
1030# For testing purposes, make sure the function is available when the C
1031# implementation exists.
def _fspath(path):
    """Return the path representation of a path-like object.

    str and bytes objects are returned unchanged.  For anything else the
    __fspath__() method of the object's type is called and its result is
    returned, provided that result is str or bytes.

    TypeError is raised when the type has no __fspath__() method or when
    the method returns something other than str or bytes.
    """
    if isinstance(path, (str, bytes)):
        return path

    # Look the method up on the type, not the instance, to match the
    # method resolution of other magic methods.
    cls = type(path)
    try:
        result = cls.__fspath__(path)
    except AttributeError:
        if not hasattr(cls, '__fspath__'):
            raise TypeError("expected str, bytes or os.PathLike object, "
                            "not " + cls.__name__)
        # The method exists, so the AttributeError came from inside it.
        raise
    if not isinstance(result, (str, bytes)):
        raise TypeError("expected {}.__fspath__() to return str or bytes, "
                        "not {}".format(cls.__name__,
                                        type(result).__name__))
    return result
1060
1061# If there is no C implementation, make the pure Python version the
1062# implementation as transparently as possible.
if not _exists('fspath'):
    # No fspath is defined yet: publish the pure Python version under the
    # public name, including its __name__.
    _fspath.__name__ = "fspath"
    fspath = _fspath
Ethan Furmancdc08792016-06-02 15:06:09 -07001066
Ethan Furman958b3e42016-06-04 12:49:35 -07001067
class PathLike(abc.ABC):

    """Abstract base class for implementing the file system path protocol."""

    @abc.abstractmethod
    def __fspath__(self):
        """Return the file system path representation of the object."""
        raise NotImplementedError

    @classmethod
    def __subclasshook__(cls, subclass):
        """Treat any class that defines __fspath__ as a PathLike subclass.

        Returns True when *subclass* (or one of its bases) defines
        __fspath__.  In every other case NotImplemented is returned so
        the regular ABC machinery (real inheritance, register()) decides.
        """
        # The structural check belongs to PathLike itself; ABCs derived
        # from it may demand more than __fspath__.
        if cls is not PathLike:
            return NotImplemented
        for klass in subclass.__mro__:
            if '__fspath__' in klass.__dict__:
                # "__fspath__ = None" marks the protocol as unsupported.
                if klass.__dict__['__fspath__'] is None:
                    return NotImplemented
                return True
        return NotImplemented