blob: 807ddb56c065586f0d97697f2d8a67b01f112758 [file] [log] [blame]
Ned Deily5c867012014-06-26 23:40:06 -07001r"""OS routines for NT or Posix depending on what system we're on.
Guido van Rossum31104f41992-01-14 18:28:36 +00002
Guido van Rossum54f22ed2000-02-04 15:10:34 +00003This exports:
Larry Hastings10108a72016-09-05 15:11:23 -07004 - all functions from posix or nt, e.g. unlink, stat, etc.
Alexandre Vassalottieca20b62008-05-16 02:54:33 +00005 - os.path is either posixpath or ntpath
Larry Hastings10108a72016-09-05 15:11:23 -07006 - os.name is either 'posix' or 'nt'
Ned Deilybf090e32016-10-01 21:12:35 -04007 - os.curdir is a string representing the current directory (always '.')
8 - os.pardir is a string representing the parent directory (always '..')
9 - os.sep is the (or a most common) pathname separator ('/' or '\\')
Georg Brandled5b9b32008-12-05 07:45:54 +000010 - os.extsep is the extension separator (always '.')
Guido van Rossum4b8c6ea2000-02-04 15:39:30 +000011 - os.altsep is the alternate pathname separator (None or '/')
Guido van Rossum54f22ed2000-02-04 15:10:34 +000012 - os.pathsep is the component separator used in $PATH etc
Guido van Rossum4b8c6ea2000-02-04 15:39:30 +000013 - os.linesep is the line separator in text files ('\r' or '\n' or '\r\n')
Guido van Rossum54f22ed2000-02-04 15:10:34 +000014 - os.defpath is the default search path for executables
Martin v. Löwisbdec50f2004-06-08 08:29:33 +000015 - os.devnull is the file path of the null device ('/dev/null', etc.)
Guido van Rossum31104f41992-01-14 18:28:36 +000016
Guido van Rossum54f22ed2000-02-04 15:10:34 +000017Programs that import and use 'os' stand a better chance of being
18portable between different platforms. Of course, they must then
19only use functions that are defined by all platforms (e.g., unlink
20and opendir), and leave all pathname manipulation to os.path
21(e.g., split and join).
22"""
Guido van Rossum31104f41992-01-14 18:28:36 +000023
Skip Montanaro269b83b2001-02-06 01:07:02 +000024#'
Ethan Furman958b3e42016-06-04 12:49:35 -070025import abc
Christian Heimes45f9af32007-11-27 21:50:00 +000026import sys, errno
Charles-François Natali7372b062012-02-05 15:15:38 +010027import stat as st
Guido van Rossuma28dab51997-08-29 22:36:47 +000028
29_names = sys.builtin_module_names
30
Tim Petersc4e09402003-04-25 07:11:48 +000031# Note: more names are added to __all__ later.
Brett Cannon13962fc2008-08-18 01:45:29 +000032__all__ = ["altsep", "curdir", "pardir", "sep", "pathsep", "linesep",
Petri Lehtinen3bc37f22012-05-23 21:36:16 +030033 "defpath", "name", "path", "devnull", "SEEK_SET", "SEEK_CUR",
34 "SEEK_END", "fsencode", "fsdecode", "get_exec_path", "fdopen",
35 "popen", "extsep"]
Skip Montanaro269b83b2001-02-06 01:07:02 +000036
def _exists(name):
    """Return True if *name* is bound in this module's global namespace."""
    module_namespace = globals()
    return name in module_namespace
39
def _get_exports_list(module):
    """Return the public names of *module* as a new list.

    When the module defines ``__all__`` a copy of it is returned; otherwise
    every name reported by dir() that does not start with an underscore is
    returned.
    """
    try:
        exported = list(module.__all__)
    except AttributeError:
        # No explicit export list: fall back to the non-underscore names.
        exported = [attr for attr in dir(module) if attr[0] != '_']
    return exported
45
# Any new dependencies of the os module and/or changes in path separator
# require updating importlib as well.
Guido van Rossuma28dab51997-08-29 22:36:47 +000048if 'posix' in _names:
Guido van Rossum61de0ac1997-12-05 21:24:30 +000049 name = 'posix'
Guido van Rossume9387ea1998-05-22 15:26:04 +000050 linesep = '\n'
Guido van Rossum61de0ac1997-12-05 21:24:30 +000051 from posix import *
52 try:
53 from posix import _exit
Petri Lehtinen3bc37f22012-05-23 21:36:16 +030054 __all__.append('_exit')
Brett Cannoncd171c82013-07-04 17:43:24 -040055 except ImportError:
Guido van Rossum61de0ac1997-12-05 21:24:30 +000056 pass
Skip Montanaro117910d2003-02-14 19:35:31 +000057 import posixpath as path
Tim Petersf2715e02003-02-19 02:35:07 +000058
Larry Hastings9cf065c2012-06-22 16:30:09 -070059 try:
60 from posix import _have_functions
Brett Cannoncd171c82013-07-04 17:43:24 -040061 except ImportError:
Larry Hastings9cf065c2012-06-22 16:30:09 -070062 pass
Skip Montanaro269b83b2001-02-06 01:07:02 +000063
Yury Selivanov97e2e062014-09-26 12:33:06 -040064 import posix
65 __all__.extend(_get_exports_list(posix))
66 del posix
67
Guido van Rossuma28dab51997-08-29 22:36:47 +000068elif 'nt' in _names:
Guido van Rossum61de0ac1997-12-05 21:24:30 +000069 name = 'nt'
Guido van Rossume9387ea1998-05-22 15:26:04 +000070 linesep = '\r\n'
Guido van Rossum61de0ac1997-12-05 21:24:30 +000071 from nt import *
Tim Peters6757c1e2003-01-08 21:20:57 +000072 try:
73 from nt import _exit
Petri Lehtinen3bc37f22012-05-23 21:36:16 +030074 __all__.append('_exit')
Brett Cannoncd171c82013-07-04 17:43:24 -040075 except ImportError:
Tim Peters6757c1e2003-01-08 21:20:57 +000076 pass
Skip Montanaro117910d2003-02-14 19:35:31 +000077 import ntpath as path
Tim Petersf2715e02003-02-19 02:35:07 +000078
Skip Montanaro269b83b2001-02-06 01:07:02 +000079 import nt
80 __all__.extend(_get_exports_list(nt))
81 del nt
82
Larry Hastings9cf065c2012-06-22 16:30:09 -070083 try:
84 from nt import _have_functions
Brett Cannoncd171c82013-07-04 17:43:24 -040085 except ImportError:
Larry Hastings9cf065c2012-06-22 16:30:09 -070086 pass
87
Guido van Rossum2979b011994-08-01 11:18:30 +000088else:
Brett Cannoncd171c82013-07-04 17:43:24 -040089 raise ImportError('no os specific module found')
Guido van Rossume65cce51993-11-08 15:05:21 +000090
Skip Montanaro117910d2003-02-14 19:35:31 +000091sys.modules['os.path'] = path
Georg Brandled5b9b32008-12-05 07:45:54 +000092from os.path import (curdir, pardir, sep, pathsep, defpath, extsep, altsep,
93 devnull)
Skip Montanaro269b83b2001-02-06 01:07:02 +000094
Guido van Rossuma28dab51997-08-29 22:36:47 +000095del _names
96
Larry Hastings9cf065c2012-06-22 16:30:09 -070097
if _exists("_have_functions"):
    _globals = globals()

    def _collect(flagged_functions):
        """Return the set of module functions enabled by their build flag.

        *flagged_functions* is an iterable of (flag, function_name) pairs.  A
        function object is included only when a function of that name exists
        in this module's globals and its flag is listed in _have_functions.
        """
        return {
            _globals[fn_name]
            for flag, fn_name in flagged_functions
            if fn_name in _globals and flag in _have_functions
        }

    # Functions that accept the dir_fd parameter.
    supports_dir_fd = _collect([
        ("HAVE_FACCESSAT", "access"),
        ("HAVE_FCHMODAT", "chmod"),
        ("HAVE_FCHOWNAT", "chown"),
        ("HAVE_FSTATAT", "stat"),
        ("HAVE_FUTIMESAT", "utime"),
        ("HAVE_LINKAT", "link"),
        ("HAVE_MKDIRAT", "mkdir"),
        ("HAVE_MKFIFOAT", "mkfifo"),
        ("HAVE_MKNODAT", "mknod"),
        ("HAVE_OPENAT", "open"),
        ("HAVE_READLINKAT", "readlink"),
        ("HAVE_RENAMEAT", "rename"),
        ("HAVE_SYMLINKAT", "symlink"),
        ("HAVE_UNLINKAT", "unlink"),
        ("HAVE_UNLINKAT", "rmdir"),
        ("HAVE_UTIMENSAT", "utime"),
    ])

    # Functions that accept the effective_ids parameter.
    supports_effective_ids = _collect([
        ("HAVE_FACCESSAT", "access"),
    ])

    # Functions that accept an open file descriptor in place of a path.
    _set = _collect([
        ("HAVE_FCHDIR", "chdir"),
        ("HAVE_FCHMOD", "chmod"),
        ("HAVE_FCHOWN", "chown"),
        ("HAVE_FDOPENDIR", "listdir"),
        ("HAVE_FDOPENDIR", "scandir"),
        ("HAVE_FEXECVE", "execve"),
        ("HAVE_FTRUNCATE", "truncate"),
        ("HAVE_FUTIMENS", "utime"),
        ("HAVE_FUTIMES", "utime"),
        ("HAVE_FPATHCONF", "pathconf"),
    ])
    _set.add(stat)  # fstat always works
    if _exists("statvfs") and _exists("fstatvfs"):  # mac os x10.3
        _set |= _collect([("HAVE_FSTATVFS", "statvfs")])
    supports_fd = _set

    # Functions that accept the follow_symlinks parameter.
    #
    # Some platforms don't support lchmod().  Often the function exists
    # anyway, as a stub that always returns ENOSUP or perhaps EOPNOTSUPP.
    # (No, I don't know why that's a good design.)  ./configure will detect
    # this and reject it--so HAVE_LCHMOD still won't be defined on such
    # platforms.  This is Very Helpful.
    #
    # However, sometimes platforms without a working lchmod() *do* have
    # fchmodat().  (Examples: Linux kernel 3.2 with glibc 2.15,
    # OpenIndiana 3.x.)  And fchmodat() has a flag that theoretically makes
    # it behave like lchmod().  So in theory it would be a suitable
    # replacement for lchmod().  But when lchmod() doesn't work, fchmodat()'s
    # flag doesn't work *either*.  Sadly ./configure isn't sophisticated
    # enough to detect this condition--it only determines whether or not
    # fchmodat() minimally works.
    #
    # Therefore we simply ignore fchmodat() when deciding whether or not
    # os.chmod supports follow_symlinks.  Just checking lchmod() is
    # sufficient.  After all--if you have a working fchmodat(), your
    # lchmod() almost certainly works too.  That is why the pair
    # ("HAVE_FCHMODAT", "chmod") is deliberately absent from the list below.
    _set = _collect([
        ("HAVE_FACCESSAT", "access"),
        ("HAVE_FCHOWNAT", "chown"),
        ("HAVE_FSTATAT", "stat"),
        ("HAVE_LCHFLAGS", "chflags"),
        ("HAVE_LCHMOD", "chmod"),
        ("HAVE_LINKAT", "link"),
        ("HAVE_LUTIMES", "utime"),
        ("HAVE_LSTAT", "stat"),
        ("HAVE_UTIMENSAT", "utime"),
        ("MS_WINDOWS", "stat"),
    ])
    if _exists("lchown"):  # mac os x10.3
        _set |= _collect([("HAVE_LCHOWN", "chown")])
    supports_follow_symlinks = _set

    # Keep the module namespace free of the construction helpers.
    del _set
    del _have_functions
    del _globals
    del _collect
184
185
Martin v. Löwis22b457e2005-01-16 08:40:58 +0000186# Python uses fixed values for the SEEK_ constants; they are mapped
187# to native constants if necessary in posixmodule.c
Jesus Cea94363612012-06-22 18:32:07 +0200188# Other possible SEEK values are directly imported from posixmodule.c
Martin v. Löwis22b457e2005-01-16 08:40:58 +0000189SEEK_SET = 0
190SEEK_CUR = 1
191SEEK_END = 2
192
Guido van Rossum4def7de1998-07-24 20:48:03 +0000193# Super directory utilities.
194# (Inspired by Eric Raymond; the doc strings are mostly his)
195
def makedirs(name, mode=0o777, exist_ok=False):
    """makedirs(name [, mode=0o777][, exist_ok=False])

    Recursive mkdir: create the leaf directory *name* together with every
    missing intermediate directory.  It behaves like mkdir, except that any
    path segment (not only the last one) is created when absent.  If the
    target directory already exists an OSError is raised unless exist_ok is
    true, in which case nothing happens.  The implementation is recursive.

    """
    parent, leaf = path.split(name)
    if not leaf:
        # name ended with a separator; split again to find the real leaf.
        parent, leaf = path.split(parent)
    if parent and leaf and not path.exists(parent):
        try:
            makedirs(parent, exist_ok=exist_ok)
        except FileExistsError:
            # Someone else created the parent between the check and the
            # call; that is fine.
            pass
        here = bytes(curdir, 'ASCII') if isinstance(leaf, bytes) else curdir
        if leaf == here:
            # xxx/newdir/. exists if xxx/newdir exists
            return
    try:
        mkdir(name, mode)
    except OSError:
        # Cannot rely on checking for EEXIST, since the operating system
        # could give priority to other errors like EACCES or EROFS
        if exist_ok and path.isdir(name):
            return
        raise
Guido van Rossum4def7de1998-07-24 20:48:03 +0000227
def removedirs(name):
    """removedirs(name)

    Recursive rmdir: remove the leaf directory *name*, then walk up the
    path removing each parent in turn.  Removal of the leaf works exactly
    like rmdir (errors propagate).  Pruning of the parents stops silently at
    the first one that cannot be removed -- usually because it is not
    empty -- or when the whole path has been consumed.

    """
    rmdir(name)
    parent, leaf = path.split(name)
    if not leaf:
        # name ended with a separator; split again to find the real parent.
        parent, leaf = path.split(parent)
    while parent and leaf:
        try:
            rmdir(parent)
        except OSError:
            return
        parent, leaf = path.split(parent)
249
def renames(old, new):
    """renames(old, new)

    Recursive rename: works like rename, but first tries to create any
    intermediate directories needed for the new pathname, and afterwards
    prunes the directories of the old pathname from the right until the
    whole path is consumed or a non-empty directory is found.

    Note: this function can fail with the new directory structure made
    if you lack permissions needed to unlink the leaf directory or
    file.

    """
    dest_dir, dest_leaf = path.split(new)
    if dest_dir and dest_leaf and not path.exists(dest_dir):
        makedirs(dest_dir)
    rename(old, new)
    src_dir, src_leaf = path.split(old)
    if not (src_dir and src_leaf):
        return
    try:
        removedirs(src_dir)
    except OSError:
        # Pruning the old location is best effort only.
        pass
275
Skip Montanaro269b83b2001-02-06 01:07:02 +0000276__all__.extend(["makedirs", "removedirs", "renames"])
277
def walk(top, topdown=True, onerror=None, followlinks=False):
    """Directory tree generator.

    Yields one 3-tuple

        dirpath, dirnames, filenames

    for every directory in the tree rooted at top (top itself included,
    '.' and '..' excluded).

    dirpath is a string, the path to the directory.  dirnames lists the
    names of the subdirectories in dirpath (without '.' and '..') and
    filenames lists the names of the non-directory files in dirpath.  The
    lists hold bare names with no path components; use
    os.path.join(dirpath, name) to obtain a full path (which begins with
    top) to a file or directory in dirpath.

    When the optional argument 'topdown' is true or omitted, the triple for
    a directory is produced before the triples of its subdirectories
    (top-down order).  When topdown is false, the triple for a directory is
    produced after the triples of all its subdirectories (bottom-up order).

    In top-down mode the caller may modify dirnames in place (e.g. via del
    or slice assignment); walk only recurses into the subdirectories whose
    names remain in dirnames.  This can be used to prune the search or to
    impose a specific visiting order.  Modifying dirnames in bottom-up mode
    has no effect, because the subdirectories have already been generated
    by the time dirnames itself is generated.  Whatever the value of
    topdown, the list of subdirectories is retrieved before the tuples for
    the directory and its subdirectories are generated.

    Errors from the os.scandir() call are ignored by default.  If the
    optional argument 'onerror' is given it should be a function; it is
    called with one argument, an OSError instance.  It can report the error
    and let the walk continue, or raise the exception to abort the walk.
    The file name is available as the filename attribute of the exception
    object.

    By default, os.walk does not follow symbolic links to subdirectories
    on systems that support them.  Set the optional argument 'followlinks'
    to true to get that behaviour.

    Caution: if you pass a relative pathname for top, don't change the
    current working directory between resumptions of walk.  walk never
    changes the current directory, and assumes that the client doesn't
    either.

    Example:

    import os
    from os.path import join, getsize
    for root, dirs, files in os.walk('python/Lib/email'):
        print(root, "consumes", end="")
        print(sum([getsize(join(root, name)) for name in files]), end="")
        print("bytes in", len(files), "non-directory files")
        if 'CVS' in dirs:
            dirs.remove('CVS')  # don't visit CVS directories

    """
    top = fspath(top)
    subdirs = []
    files = []
    deferred = []  # full paths to descend into when walking bottom-up

    # We may not have read permission for top, in which case we can't
    # get a list of the files the directory contains.  os.walk
    # always suppressed the exception then, rather than blow up for a
    # minor reason when (say) a thousand readable directories are still
    # left to visit.  That logic is copied here.
    try:
        # Note that scandir is global in this module due
        # to earlier import-*.
        listing = scandir(top)
    except OSError as exc:
        if onerror is not None:
            onerror(exc)
        return

    with listing:
        while True:
            try:
                entry = next(listing)
            except StopIteration:
                break
            except OSError as exc:
                if onerror is not None:
                    onerror(exc)
                return

            try:
                is_dir = entry.is_dir()
            except OSError:
                # If is_dir() raises an OSError, consider that the entry is
                # not a directory, same behaviour as os.path.isdir().
                is_dir = False

            if not is_dir:
                files.append(entry.name)
                continue
            subdirs.append(entry.name)
            if topdown:
                continue

            # Bottom-up: recurse into sub-directory, but exclude symlinks to
            # directories if followlinks is False
            if not followlinks:
                try:
                    if entry.is_symlink():
                        continue
                except OSError:
                    # If is_symlink() raises an OSError, consider that the
                    # entry is not a symbolic link, same behaviour as
                    # os.path.islink().
                    pass
            deferred.append(entry.path)

    if not topdown:
        # Recurse into sub-directories, then yield after the recursion.
        for child in deferred:
            yield from walk(child, topdown, onerror, followlinks)
        yield top, subdirs, files
        return

    # Yield before recursion when going top down.
    yield top, subdirs, files

    is_link, join_path = path.islink, path.join
    for dirname in subdirs:
        child = join_path(top, dirname)
        # Issue #23605: os.path.islink() is used instead of caching
        # entry.is_symlink() result during the loop on os.scandir() because
        # the caller can replace the directory entry during the "yield"
        # above.
        if followlinks or not is_link(child):
            yield from walk(child, topdown, onerror, followlinks)
417
418__all__.append("walk")
419
if {open, stat} <= supports_dir_fd and {scandir, stat} <= supports_fd:

    def fwalk(top=".", topdown=True, onerror=None, *, follow_symlinks=False, dir_fd=None):
        """Directory tree generator.

        This behaves exactly like walk(), except that it yields a 4-tuple

            dirpath, dirnames, filenames, dirfd

        `dirpath`, `dirnames` and `filenames` are identical to walk() output,
        and `dirfd` is a file descriptor referring to the directory `dirpath`.

        The advantage of fwalk() over walk() is that it's safe against symlink
        races (when follow_symlinks is False).

        If dir_fd is not None, it should be a file descriptor open to a directory,
          and top should be relative; top will then be relative to that directory.
          (dir_fd is always supported for fwalk.)

        Caution:
        Since fwalk() yields file descriptors, those are only valid until the
        next iteration step, so you should dup() them if you want to keep them
        for a longer period.

        Example:

        import os
        for root, dirs, files, rootfd in os.fwalk('python/Lib/email'):
            print(root, "consumes", end="")
            print(sum([os.stat(name, dir_fd=rootfd).st_size for name in files]),
                  end="")
            print("bytes in", len(files), "non-directory files")
            if 'CVS' in dirs:
                dirs.remove('CVS')  # don't visit CVS directories
        """
        # Anything that is not an integer is normalised through fspath().
        # (Every int has __index__, so no separate check for it is needed.)
        if not isinstance(top, int):
            top = fspath(top)
        # Note: To guard against symlink races, we use the standard
        # lstat()/open()/fstat() trick.
        if not follow_symlinks:
            orig_st = stat(top, follow_symlinks=False, dir_fd=dir_fd)
        topfd = open(top, O_RDONLY, dir_fd=dir_fd)
        try:
            # orig_st is only bound (and only consulted) when symlinks are
            # not followed; the short-circuit below relies on that.
            if (follow_symlinks or (st.S_ISDIR(orig_st.st_mode) and
                                    path.samestat(orig_st, stat(topfd)))):
                yield from _fwalk(topfd, top, isinstance(top, bytes),
                                  topdown, onerror, follow_symlinks)
        finally:
            close(topfd)

    def _fwalk(topfd, toppath, isbytes, topdown, onerror, follow_symlinks):
        """Yield (dirpath, dirnames, filenames, dirfd) tuples below topfd.

        topfd is an open descriptor for the directory whose path, as reported
        to the caller, is toppath.  Names are converted with fsencode() when
        isbytes is true.  The remaining arguments have the same meaning as in
        fwalk().
        """
        # Note: This uses O(depth of the directory tree) file descriptors: if
        # necessary, it can be adapted to only require O(1) FDs, see issue
        # #13734.

        dirs = []
        nondirs = []
        # DirEntry objects are kept only for the bottom-up, non-following
        # case, where entry.stat() replaces a separate stat() call below.
        entries = None if topdown or follow_symlinks else []
        # The context manager closes the iterator even if reading the
        # directory fails part-way through.
        with scandir(topfd) as scandir_it:
            for entry in scandir_it:
                name = entry.name
                if isbytes:
                    name = fsencode(name)
                try:
                    if entry.is_dir():
                        dirs.append(name)
                        if entries is not None:
                            entries.append(entry)
                    else:
                        nondirs.append(name)
                except OSError:
                    try:
                        # Add dangling symlinks, ignore disappeared files
                        if entry.is_symlink():
                            nondirs.append(name)
                    except OSError:
                        pass

        if topdown:
            yield toppath, dirs, nondirs, topfd

        for name in dirs if entries is None else zip(dirs, entries):
            try:
                if not follow_symlinks:
                    if topdown:
                        orig_st = stat(name, dir_fd=topfd, follow_symlinks=False)
                    else:
                        assert entries is not None
                        # Here each item is a (name, DirEntry) pair.
                        name, entry = name
                        orig_st = entry.stat(follow_symlinks=False)
                dirfd = open(name, O_RDONLY, dir_fd=topfd)
            except OSError as err:
                if onerror is not None:
                    onerror(err)
                continue
            try:
                # Descend only if what was opened is the same file that was
                # stat'ed before the open (symlink-race guard).
                if follow_symlinks or path.samestat(orig_st, stat(dirfd)):
                    dirpath = path.join(toppath, name)
                    yield from _fwalk(dirfd, dirpath, isbytes,
                                      topdown, onerror, follow_symlinks)
            finally:
                close(dirfd)

        if not topdown:
            yield toppath, dirs, nondirs, topfd

    __all__.append("fwalk")
527
Guido van Rossuma28dab51997-08-29 22:36:47 +0000528# Make sure os.environ exists, at least
529try:
Guido van Rossum61de0ac1997-12-05 21:24:30 +0000530 environ
Guido van Rossuma28dab51997-08-29 22:36:47 +0000531except NameError:
Guido van Rossum61de0ac1997-12-05 21:24:30 +0000532 environ = {}
Guido van Rossuma28dab51997-08-29 22:36:47 +0000533
def execl(file, *args):
    """execl(file, *args)

    Replace the current process by executing the executable file, using
    the positional arguments as its argument list. """
    argv = args
    execv(file, argv)
Guido van Rossume65cce51993-11-08 15:05:21 +0000540
def execle(file, *args):
    """execle(file, *args, env)

    Replace the current process by executing the executable file.  The
    last positional argument is the environment env; the ones before it
    form the argument list. """
    execve(file, args[:-1], args[-1])
Guido van Rossume65cce51993-11-08 15:05:21 +0000548
def execlp(file, *args):
    """execlp(file, *args)

    Replace the current process by executing the executable file, which is
    looked up along $PATH, using the positional arguments as its argument
    list. """
    argv = args
    execvp(file, argv)
Guido van Rossume65cce51993-11-08 15:05:21 +0000555
def execlpe(file, *args):
    """execlpe(file, *args, env)

    Replace the current process by executing the executable file, which is
    looked up along $PATH.  The last positional argument is the
    environment env; the ones before it form the argument list. """
    execvpe(file, args[:-1], args[-1])
Guido van Rossum030afb11995-03-14 17:27:18 +0000564
def execvp(file, args):
    """execvp(file, args)

    Replace the current process by executing the executable file, which is
    looked up along $PATH, with the argument list args.
    args may be a list or tuple of strings. """
    # No environment is passed, so _execvpe uses its default (env=None).
    _execvpe(file, args)
Guido van Rossum030afb11995-03-14 17:27:18 +0000572
def execvpe(file, args, env):
    """execvpe(file, args, env)

    Replace the current process by executing the executable file, which is
    looked up along $PATH, with the argument list args and the
    environment env.
    args may be a list or tuple of strings. """
    _execvpe(file, args, env)
Guido van Rossum030afb11995-03-14 17:27:18 +0000581
Skip Montanaro269b83b2001-02-06 01:07:02 +0000582__all__.extend(["execl","execle","execlp","execlpe","execvp","execvpe"])
583
def _execvpe(file, args, env=None):
    """Execute *file* with *args*, searching the executable path if needed.

    When env is given, execve is used and env is passed on as the new
    environment; otherwise execv is used and the search path is taken from
    environ.  If file contains a directory part it is executed directly.
    Otherwise each directory returned by get_exec_path(env) is tried in
    order.

    If every attempt fails, the first error other than ENOENT/ENOTDIR is
    raised; when there is none, the error from the last directory tried is
    raised.
    """
    if env is not None:
        exec_func = execve
        argrest = (args, env)
    else:
        exec_func = execv
        argrest = (args,)
        env = environ

    head, tail = path.split(file)
    if head:
        # An explicit directory part disables the path search.
        exec_func(file, *argrest)
        return
    last_exc = saved_exc = None
    path_list = get_exec_path(env)
    if name != 'nt':
        file = fsencode(file)
        path_list = map(fsencode, path_list)
    for directory in path_list:
        fullname = path.join(directory, file)
        try:
            exec_func(fullname, *argrest)
        except OSError as e:
            last_exc = e
            # "Not found" errors are expected while searching; remember the
            # first error of any other kind, since it is more informative.
            if (e.errno != errno.ENOENT and e.errno != errno.ENOTDIR
                    and saved_exc is None):
                saved_exc = e
    # The caught exceptions still carry their own tracebacks, so they can
    # be re-raised as they are.
    if saved_exc is not None:
        raise saved_exc
    raise last_exc
Guido van Rossumd74fb6b2001-03-02 06:43:49 +0000617
Guido van Rossumcd16bf62007-06-13 18:07:49 +0000618
def get_exec_path(env=None):
    """Return the list of directories searched for a named executable
    (similar to a shell) when launching a process.

    *env* must be an environment variable dict or None.  If *env* is None,
    os.environ will be used.  The PATH entry is split on os.pathsep; when
    no PATH entry is found, os.defpath is split instead.

    Raises ValueError if *env* contains both a 'PATH' and a b'PATH' key.
    """
    # Imported here rather than at module level: os is always loaded at
    # interpreter startup, so this keeps the set of startup modules small
    # and may also avoid a bootstrap issue.
    import warnings

    mapping = environ if env is None else env

    # Looking up a str key in a bytes-keyed dict (or the reverse) emits a
    # BytesWarning under python -b / -bb; silence it for these lookups.
    with warnings.catch_warnings():
        warnings.simplefilter("ignore", BytesWarning)

        try:
            raw_path = mapping.get('PATH')
        except TypeError:
            raw_path = None

        if supports_bytes_environ:
            try:
                raw_path_bytes = mapping[b'PATH']
            except (KeyError, TypeError):
                pass
            else:
                if raw_path is not None:
                    raise ValueError(
                        "env cannot contain 'PATH' and b'PATH' keys")
                raw_path = raw_path_bytes

            if isinstance(raw_path, bytes):
                raw_path = fsdecode(raw_path)

    if raw_path is None:
        raw_path = defpath
    return raw_path.split(pathsep)
Gregory P. Smithb6e8c7e2010-02-27 07:22:22 +0000661
662
Skip Montanaro289bc052007-08-17 02:30:27 +0000663# Change environ to automatically call putenv(), unsetenv if they exist.
Christian Heimesf1dc3ee2013-10-13 02:04:20 +0200664from _collections_abc import MutableMapping
Skip Montanaro289bc052007-08-17 02:30:27 +0000665
class _Environ(MutableMapping):
    """Mutable mapping over a backing environment dictionary.

    Keys and values pass through the supplied encode/decode callables on
    their way into and out of *data*.  Every assignment is also forwarded
    to *putenv* and every deletion to *unsetenv*.
    """

    def __init__(self, data, encodekey, decodekey, encodevalue, decodevalue, putenv, unsetenv):
        self._data = data
        self.encodekey, self.decodekey = encodekey, decodekey
        self.encodevalue, self.decodevalue = encodevalue, decodevalue
        self.putenv, self.unsetenv = putenv, unsetenv

    def __getitem__(self, key):
        try:
            raw = self._data[self.encodekey(key)]
        except KeyError:
            # Report the key as the caller spelled it, not its encoded form.
            raise KeyError(key) from None
        return self.decodevalue(raw)

    def __setitem__(self, key, value):
        raw_key = self.encodekey(key)
        raw_value = self.encodevalue(value)
        self.putenv(raw_key, raw_value)
        self._data[raw_key] = raw_value

    def __delitem__(self, key):
        raw_key = self.encodekey(key)
        # unsetenv is called first, before the key is known to be present.
        self.unsetenv(raw_key)
        try:
            del self._data[raw_key]
        except KeyError:
            # Report the key as the caller spelled it, not its encoded form.
            raise KeyError(key) from None

    def __iter__(self):
        # Iterate over a snapshot: list() from dict object is an atomic
        # operation.
        for raw_key in list(self._data):
            yield self.decodekey(raw_key)

    def __len__(self):
        return len(self._data)

    def __repr__(self):
        pairs = (
            '{!r}: {!r}'.format(self.decodekey(raw_key),
                                self.decodevalue(raw_value))
            for raw_key, raw_value in self._data.items()
        )
        return 'environ({{{}}})'.format(', '.join(pairs))

    def copy(self):
        """Return a plain dict holding the decoded keys and values."""
        return dict(self)

    def setdefault(self, key, value):
        """Return self[key], first storing *value* if *key* is missing."""
        if key in self:
            return self[key]
        self[key] = value
        return self[key]
720
# Select the setter handed to _Environ.  If no putenv() name is defined in
# this module, fall back to a function that does nothing.
try:
    _putenv = putenv
except NameError:
    _putenv = lambda key, value: None
else:
    # putenv() exists: export it, without adding a duplicate entry.
    if "putenv" not in __all__:
        __all__.append("putenv")

# Select the deleter handed to _Environ.  If no unsetenv() name is defined,
# fall back to calling _putenv() with an empty string as the value.
try:
    _unsetenv = unsetenv
except NameError:
    _unsetenv = lambda key: _putenv(key, "")
else:
    # unsetenv() exists: export it, without adding a duplicate entry.
    if "unsetenv" not in __all__:
        __all__.append("unsetenv")
Guido van Rossumc524d952001-10-19 01:31:59 +0000736
def _createenviron():
    """Wrap the raw environ mapping in an _Environ that works with str.

    On 'nt' keys are upper-cased and the data is copied into a new dict.
    Elsewhere keys and values are encoded with the filesystem encoding and
    the 'surrogateescape' error handler, and the raw mapping is wrapped
    directly.
    """
    def require_str(value):
        if isinstance(value, str):
            return value
        raise TypeError("str expected, not %s" % type(value).__name__)

    if name == 'nt':
        # Where Env Var Names Must Be UPPERCASE
        encode = require_str
        decode = str

        def encodekey(key):
            return encode(key).upper()

        data = {encodekey(key): value for key, value in environ.items()}
    else:
        # Where Env Var Names Can Be Mixed Case
        encoding = sys.getfilesystemencoding()

        def encode(value):
            return require_str(value).encode(encoding, 'surrogateescape')

        def decode(value):
            return value.decode(encoding, 'surrogateescape')

        encodekey = encode
        data = environ

    return _Environ(data,
                    encodekey, decode,
                    encode, decode,
                    _putenv, _unsetenv)

# unicode environ: from here on the name refers to the str-based wrapper.
environ = _createenviron()
del _createenviron
Guido van Rossum61de0ac1997-12-05 21:24:30 +0000770
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000771
def getenv(key, default=None):
    """Return the value of the environment variable *key*.

    If the variable does not exist, *default* is returned instead, which
    is None unless the optional second argument says otherwise.
    key, default and the result are str."""
    value = environ.get(key, default)
    return value
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000777
# A bytes view of the environment is offered everywhere except on 'nt'.
supports_bytes_environ = (name != 'nt')
__all__.extend(("getenv", "supports_bytes_environ"))

if supports_bytes_environ:
    def _check_bytes(value):
        if isinstance(value, bytes):
            return value
        raise TypeError("bytes expected, not %s" % type(value).__name__)

    # bytes environ: shares its backing mapping with environ, so a change
    # made through either object is visible through the other.
    environb = _Environ(
        environ._data,
        _check_bytes, bytes,
        _check_bytes, bytes,
        _putenv, _unsetenv,
    )
    del _check_bytes

    def getenvb(key, default=None):
        """Return the value of the environment variable *key*.

        If the variable does not exist, *default* is returned instead,
        which is None unless the optional second argument says otherwise.
        key, default and the result are bytes."""
        value = environb.get(key, default)
        return value

    __all__.extend(("environb", "getenvb"))
Victor Stinner84ae1182010-05-06 22:05:07 +0000801
def _fscodec():
    """Build fsencode() and fsdecode() bound to the filesystem codec.

    The encoding and error handler are read once, from
    sys.getfilesystemencoding() and sys.getfilesystemencodeerrors().
    """
    fs_encoding = sys.getfilesystemencoding()
    fs_errors = sys.getfilesystemencodeerrors()

    def fsencode(filename):
        """Encode filename (an os.PathLike, bytes, or str) to the filesystem
        encoding, using the filesystem error handler; return bytes
        unchanged.
        """
        resolved = fspath(filename)  # Does type-checking of `filename`.
        if not isinstance(resolved, str):
            return resolved
        return resolved.encode(fs_encoding, fs_errors)

    def fsdecode(filename):
        """Decode filename (an os.PathLike, bytes, or str) from the
        filesystem encoding, using the filesystem error handler; return str
        unchanged.
        """
        resolved = fspath(filename)  # Does type-checking of `filename`.
        if not isinstance(resolved, bytes):
            return resolved
        return resolved.decode(fs_encoding, fs_errors)

    return fsencode, fsdecode

fsencode, fsdecode = _fscodec()
del _fscodec
Victor Stinner449c4662010-05-08 11:10:09 +0000834
Guido van Rossum5a2ca931999-11-02 13:27:32 +0000835# Supply spawn*() (probably only for Unix)
if _exists("fork") and not _exists("spawnv") and _exists("execv"):

    P_WAIT = 0
    P_NOWAIT = P_NOWAITO = 1

    __all__.extend(["P_WAIT", "P_NOWAIT", "P_NOWAITO"])

    # XXX Should we support P_DETACH?  I suppose it could fork()**2
    # and close the std I/O streams.  Also, P_OVERLAY is the same
    # as execv*()?

    def _spawnvef(mode, file, args, env, func):
        # Internal helper; func is the exec*() function to use
        if not isinstance(args, (tuple, list)):
            raise TypeError('argv must be a tuple or a list')
        if not args or not args[0]:
            raise ValueError('argv first element cannot be empty')
        child_pid = fork()
        if child_pid:
            # Parent
            if mode == P_NOWAIT:
                return child_pid  # Caller is responsible for waiting!
            while True:
                _, status = waitpid(child_pid, 0)
                if WIFSTOPPED(status):
                    # Only stopped, not finished: keep waiting.
                    continue
                if WIFSIGNALED(status):
                    return -WTERMSIG(status)
                if WIFEXITED(status):
                    return WEXITSTATUS(status)
                raise OSError("Not stopped, signaled or exited???")
        else:
            # Child
            exec_args = (file, args) if env is None else (file, args, env)
            try:
                func(*exec_args)
            except BaseException:
                # Deliberately catch everything: whatever went wrong, the
                # child exits with status 127 instead of propagating.
                _exit(127)

    def spawnv(mode, file, args):
        """spawnv(mode, file, args) -> integer

        Run file in a subprocess, passing it the arguments in args.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        return _spawnvef(mode, file, args, None, execv)

    def spawnve(mode, file, args, env):
        """spawnve(mode, file, args, env) -> integer

        Run file in a subprocess with the specified environment, passing
        it the arguments in args.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        return _spawnvef(mode, file, args, env, execve)

    # Note: spawnvp[e] isn't currently supported on Windows

    def spawnvp(mode, file, args):
        """spawnvp(mode, file, args) -> integer

        Run file (which is looked for along $PATH) in a subprocess,
        passing it the arguments in args.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        return _spawnvef(mode, file, args, None, execvp)

    def spawnvpe(mode, file, args, env):
        """spawnvpe(mode, file, args, env) -> integer

        Run file (which is looked for along $PATH) in a subprocess with
        the supplied environment, passing it the arguments in args.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        return _spawnvef(mode, file, args, env, execvpe)


    __all__.extend(["spawnv", "spawnve", "spawnvp", "spawnvpe"])
921
922
if _exists("spawnv"):
    # These aren't supplied by the basic Windows code
    # but can be easily implemented in Python

    def spawnl(mode, file, *args):
        """spawnl(mode, file, *args) -> integer

        Run file in a subprocess, passing it the arguments in args.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        return spawnv(mode, file, args)

    def spawnle(mode, file, *args):
        """spawnle(mode, file, *args, env) -> integer

        Run file in a subprocess with the supplied environment, passing
        it the arguments in args.  The environment is the last positional
        argument.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        # The trailing positional argument is the environment; everything
        # before it is the argument list.
        return spawnve(mode, file, args[:-1], args[-1])


    __all__.extend(["spawnl", "spawnle"])
Andrew MacIntyre69e18c92004-04-04 07:11:43 +0000949
950
if _exists("spawnvp"):
    # At the moment, Windows doesn't implement spawnvp[e],
    # so it won't have spawnlp[e] either.
    def spawnlp(mode, file, *args):
        """spawnlp(mode, file, *args) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess.  No environment argument is taken: the call
        is forwarded to spawnvp(mode, file, args).
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        return spawnvp(mode, file, args)

    def spawnlpe(mode, file, *args):
        """spawnlpe(mode, file, *args, env) -> integer

        Execute file (which is looked for along $PATH) with arguments from
        args in a subprocess with the supplied environment.  The
        environment is the last positional argument.
        If mode == P_NOWAIT return the pid of the process.
        If mode == P_WAIT return the process's exit code if it exits
        normally; otherwise return -SIG, where SIG is the signal that
        killed it."""
        # The trailing positional argument is the environment; everything
        # before it is the argument list.
        env = args[-1]
        return spawnvpe(mode, file, args[:-1], env)


    __all__.extend(["spawnlp", "spawnlpe"])
977
Skip Montanaro269b83b2001-02-06 01:07:02 +0000978
Guido van Rossumc2f93dc2007-05-24 00:50:02 +0000979# Supply os.popen()
def popen(cmd, mode="r", buffering=-1):
    """Run *cmd* through the shell and return a text file object connected
    to a pipe on the command.

    With mode "r" the file reads the command's standard output; with mode
    "w" it writes to the command's standard input.  The returned proxy
    waits for the process when it is closed.

    Raises TypeError if *cmd* is not a str, and ValueError for any other
    mode or for an unbuffered request (buffering of 0 or None).
    """
    if not isinstance(cmd, str):
        raise TypeError("invalid cmd type (%s, expected string)" % type(cmd))
    if mode not in ("r", "w"):
        raise ValueError("invalid mode %r" % mode)
    if buffering == 0 or buffering is None:
        raise ValueError("popen() does not support unbuffered streams")
    import subprocess, io
    # Reading attaches the pipe to the child's stdout, writing to its stdin.
    pipe_name = "stdout" if mode == "r" else "stdin"
    proc = subprocess.Popen(cmd,
                            shell=True,
                            bufsize=buffering,
                            **{pipe_name: subprocess.PIPE})
    return _wrap_close(io.TextIOWrapper(getattr(proc, pipe_name)), proc)
1000
1001# Helper for popen() -- a proxy for a file whose close waits for the process
class _wrap_close:
    """Proxy for a popen() stream whose close() waits for the process.

    Unknown attributes and iteration are delegated to the wrapped stream.
    """

    def __init__(self, stream, proc):
        self._stream, self._proc = stream, proc

    def close(self):
        """Close the stream, wait for the process and report its status.

        Returns None for a zero return code.  Otherwise returns the return
        code as is on 'nt', and shifted left by 8 bits elsewhere.
        """
        self._stream.close()
        status = self._proc.wait()
        if status == 0:
            return None
        # Shift left to match old behavior
        return status if name == 'nt' else status << 8

    def __enter__(self):
        return self

    def __exit__(self, *args):
        self.close()

    def __getattr__(self, name):
        return getattr(self._stream, name)

    def __iter__(self):
        return iter(self._stream)
Guido van Rossumc2f93dc2007-05-24 00:50:02 +00001023
Amaury Forgeot d'Arcbdbddf82008-08-01 00:06:49 +00001024# Supply os.fdopen()
def fdopen(fd, *args, **kwargs):
    """Return an open file object for the file descriptor *fd*.

    All further arguments are passed straight through to io.open().
    Raises TypeError if *fd* is not an int.
    """
    if isinstance(fd, int):
        import io
        return io.open(fd, *args, **kwargs)
    raise TypeError("invalid fd type (%s, expected integer)" % type(fd))
Ethan Furmancdc08792016-06-02 15:06:09 -07001030
Brett Cannonc78ca1e2016-06-24 12:03:43 -07001031
1032# For testing purposes, make sure the function is available when the C
1033# implementation exists.
def _fspath(path):
    """Return the path representation of a path-like object.

    A str or bytes argument is handed back as is.  Any other object is
    asked for its representation through the os.PathLike interface, that
    is, the __fspath__() method of its type.

    TypeError is raised if the object is not str, bytes or os.PathLike, or
    if __fspath__() returns something other than str or bytes.
    """
    if isinstance(path, (str, bytes)):
        return path

    # Look the method up on the type, not the instance, to match method
    # resolution of other magic methods.
    cls = type(path)
    try:
        result = cls.__fspath__(path)
    except AttributeError:
        if not hasattr(cls, '__fspath__'):
            raise TypeError("expected str, bytes or os.PathLike object, "
                            "not " + cls.__name__)
        # The method exists, so the AttributeError came from inside it.
        raise
    if not isinstance(result, (str, bytes)):
        raise TypeError("expected {}.__fspath__() to return str or bytes, "
                        "not {}".format(cls.__name__,
                                        type(result).__name__))
    return result
1062
# If there is no C implementation, make the pure Python version the
# implementation as transparently as possible.
if not _exists('fspath'):
    fspath = _fspath
    # Rename the function object so it reports itself as "fspath" rather
    # than "_fspath".
    fspath.__name__ = "fspath"
Ethan Furmancdc08792016-06-02 15:06:09 -07001068
Ethan Furman958b3e42016-06-04 12:49:35 -07001069
class PathLike(abc.ABC):

    """Abstract base class for implementing the file system path protocol."""

    @abc.abstractmethod
    def __fspath__(self):
        """Return the file system path representation of the object."""
        raise NotImplementedError

    @classmethod
    def __subclasshook__(cls, subclass):
        # Structural check: any class that exposes a __fspath__ attribute
        # is accepted, with no explicit registration or inheritance.
        # NOTE(review): `cls` is not consulted, so the same answer is given
        # when the hook is reached through a subclass of PathLike.
        return hasattr(subclass, '__fspath__')