blob: 421db50a3b7f56947229b63409c81348d0ac6a9e [file] [log] [blame]
Guido van Rossum15e22e11997-12-05 19:03:01 +00001# Module 'ntpath' -- common operations on WinNT/Win95 pathnames
Tim Peters2344fae2001-01-15 00:50:52 +00002"""Common pathname manipulations, WindowsNT/95 version.
Guido van Rossum534972b1999-02-03 17:20:50 +00003
4Instead of importing this module directly, import os and refer to this
5module as os.path.
Guido van Rossum15e22e11997-12-05 19:03:01 +00006"""
Guido van Rossum555915a1994-02-24 11:32:59 +00007
Serhiy Storchaka34601982018-01-07 17:54:31 +02008# strings representing various path-related bits and pieces
9# These are primarily for export; internally, they are hardcoded.
10# Should be set before imports for resolving cyclic dependency.
# Lexical building blocks of a Windows path.
curdir, pardir, extsep = '.', '..', '.'
sep, altsep, pathsep = '\\', '/', ';'
# Default search path and the name of the null device.
defpath, devnull = '.;C:\\bin', 'nul'
19
Guido van Rossum555915a1994-02-24 11:32:59 +000020import os
Mark Hammond8696ebc2002-10-08 02:44:31 +000021import sys
Christian Heimes05e8be12008-02-23 18:30:17 +000022import stat
Guido van Rossumd8faa362007-04-27 19:54:29 +000023import genericpath
Thomas Wouters89f507f2006-12-13 04:49:30 +000024from genericpath import *
Skip Montanaro4d5d5bf2000-07-13 01:01:03 +000025
# Names exported by "from ntpath import *".
__all__ = [
    "normcase", "isabs", "join", "splitdrive", "split", "splitext",
    "basename", "dirname", "commonprefix", "getsize", "getmtime",
    "getatime", "getctime", "islink", "exists", "lexists", "isdir", "isfile",
    "ismount", "expanduser", "expandvars", "normpath", "abspath",
    "curdir", "pardir", "sep", "pathsep", "defpath", "altsep",
    "extsep", "devnull", "realpath", "supports_unicode_filenames", "relpath",
    "samefile", "sameopenfile", "samestat", "commonpath",
]
Guido van Rossum555915a1994-02-24 11:32:59 +000033
Amaury Forgeot d'Arcc72ef8b2008-10-03 18:38:26 +000034def _get_bothseps(path):
35 if isinstance(path, bytes):
36 return b'\\/'
37 else:
38 return '\\/'
39
Guido van Rossume2ad88c1997-08-12 14:46:58 +000040# Normalize the case of a pathname and map slashes to backslashes.
41# Other normalizations (such as optimizing '../' away) are not done
Guido van Rossum555915a1994-02-24 11:32:59 +000042# (this is done by normpath).
Guido van Rossume2ad88c1997-08-12 14:46:58 +000043
def normcase(s):
    """Normalize case of pathname.

    Forward slashes become backslashes and the result is lowercased.
    Accepts str, bytes or an os.PathLike object.
    """
    s = os.fspath(s)
    if isinstance(s, bytes):
        slash, backslash = b'/', b'\\'
    else:
        slash, backslash = '/', '\\'
    return s.replace(slash, backslash).lower()
Guido van Rossum555915a1994-02-24 11:32:59 +000053
Guido van Rossum77e1db31997-06-02 23:11:57 +000054
Fred Drakeef0b5dd2000-02-17 17:30:40 +000055# Return whether a path is absolute.
Mark Hammond5a607a32009-05-06 08:04:54 +000056# Trivial in Posix, harder on Windows.
57# For Windows it is absolute if it starts with a slash or backslash (current
58# volume), or if a pathname after the volume-letter-and-colon or UNC-resource
Guido van Rossum534972b1999-02-03 17:20:50 +000059# starts with a slash or backslash.
Guido van Rossum555915a1994-02-24 11:32:59 +000060
def isabs(s):
    """Test whether a path is absolute"""
    s = os.fspath(s)
    if isinstance(s, bytes):
        slash, backslash, literal_prefix = b'/', b'\\', b'\\\\?\\'
    else:
        slash, backslash, literal_prefix = '/', '\\', '\\\\?\\'
    # Paths beginning with \\?\ are always absolute, but do not
    # necessarily contain a drive.
    if s.replace(slash, backslash).startswith(literal_prefix):
        return True
    # Otherwise the part after the drive must start with a separator.
    rest = splitdrive(s)[1]
    return len(rest) > 0 and rest[0] in _get_bothseps(rest)
Guido van Rossum555915a1994-02-24 11:32:59 +000074
75
Guido van Rossum77e1db31997-06-02 23:11:57 +000076# Join two (or more) paths.
def join(path, *paths):
    """Join two or more pathname components.

    A later component that is absolute, or that names a different drive,
    replaces what was accumulated so far.  A backslash is inserted between
    components where one is needed.
    """
    path = os.fspath(path)
    if isinstance(path, bytes):
        sep, seps, colon = b'\\', b'\\/', b':'
    else:
        sep, seps, colon = '\\', '\\/', ':'
    try:
        if not paths:
            path[:0] + sep  #23780: Ensure compatible data type even if p is null.
        drive, tail = splitdrive(path)
        for piece in map(os.fspath, paths):
            piece_drive, piece_tail = splitdrive(piece)
            if piece_tail and piece_tail[0] in seps:
                # This component is absolute: it replaces the path, and
                # the drive too unless only the earlier part had one.
                if piece_drive or not drive:
                    drive = piece_drive
                tail = piece_tail
                continue
            if piece_drive and piece_drive != drive:
                if piece_drive.lower() != drive.lower():
                    # Different drives => ignore the first path entirely
                    drive, tail = piece_drive, piece_tail
                    continue
                # Same drive in different case
                drive = piece_drive
            # This component is relative to what we have so far.
            if tail and tail[-1] not in seps:
                tail += sep
            tail += piece_tail
        # Add a separator between a UNC drive and a non-absolute path.
        if (tail and tail[0] not in seps and
                drive and drive[-1:] != colon):
            return drive + sep + tail
        return drive + tail
    except (TypeError, AttributeError, BytesWarning):
        genericpath._check_arg_types('join', path, *paths)
        raise
Guido van Rossum555915a1994-02-24 11:32:59 +0000119
120
121# Split a path in a drive specification (a drive letter followed by a
Guido van Rossumf3c695c1999-04-06 19:32:19 +0000122# colon) and the path specification.
Guido van Rossum555915a1994-02-24 11:32:59 +0000123# It is always true that drivespec + pathspec == p
def splitdrive(p):
    """Split a pathname into drive/UNC sharepoint and relative path specifiers.
    Returns a 2-tuple (drive_or_unc, path); either part may be empty.

    For any input, result[0] + result[1] == p.

    A drive letter yields everything up to and including the colon,
    e.g. splitdrive("c:/dir") returns ("c:", "/dir").

    A UNC path yields the host name and share, up to but not including
    the fourth directory separator character,
    e.g. splitdrive("//host/computer/dir") returns ("//host/computer", "/dir").

    Paths cannot contain both a drive letter and a UNC path.

    """
    p = os.fspath(p)
    no_drive = (p[:0], p)
    if len(p) < 2:
        return no_drive
    if isinstance(p, bytes):
        sep, altsep, colon = b'\\', b'/', b':'
    else:
        sep, altsep, colon = '\\', '/', ':'
    normp = p.replace(altsep, sep)
    if normp[0:2] == sep * 2 and normp[2:3] != sep:
        # UNC path:
        # vvvvvvvvvvvvvvvvvvvv drive letter or UNC path
        # \\machine\mountpoint\directory\etc\...
        #           directory ^^^^^^^^^^^^^^^
        host_end = normp.find(sep, 2)
        if host_end == -1:
            return no_drive
        share_end = normp.find(sep, host_end + 1)
        # a UNC path can't have two slashes in a row
        # (after the initial two)
        if share_end == host_end + 1:
            return no_drive
        if share_end == -1:
            share_end = len(p)
        return p[:share_end], p[share_end:]
    if normp[1:2] == colon:
        return p[:2], p[2:]
    return no_drive
Guido van Rossumf3c695c1999-04-06 19:32:19 +0000173
174
Guido van Rossum555915a1994-02-24 11:32:59 +0000175# Split a path in head (everything up to the last '/') and tail (the
Guido van Rossum8f0fa9e1999-03-19 21:05:12 +0000176# rest). After the trailing '/' is stripped, the invariant
Guido van Rossum555915a1994-02-24 11:32:59 +0000177# join(head, tail) == p holds.
178# The resulting head won't end in '/' unless it is the root.
179
def split(p):
    """Split a pathname.

    Return tuple (head, tail) where tail is everything after the final slash.
    Either part may be empty."""
    p = os.fspath(p)
    seps = _get_bothseps(p)
    drive, rest = splitdrive(p)
    # Index just past the last separator of either kind (0 if there is none).
    cut = max(rest.rfind(seps[0:1]), rest.rfind(seps[1:2])) + 1
    head, tail = rest[:cut], rest[cut:]  # tail has no slashes
    # Drop trailing slashes from head, unless head is nothing but slashes.
    trimmed = head.rstrip(seps)
    if trimmed:
        head = trimmed
    return drive + head, tail
Guido van Rossum555915a1994-02-24 11:32:59 +0000196
197
198# Split a path in root and extension.
Guido van Rossum73e122f1997-01-22 00:17:26 +0000199# The extension is everything starting at the last dot in the last
Guido van Rossum555915a1994-02-24 11:32:59 +0000200# pathname component; the root is everything before that.
201# It is always true that root + ext == p.
202
def splitext(p):
    # The docstring is copied from genericpath._splitext just below.
    p = os.fspath(p)
    if isinstance(p, bytes):
        seps_and_dot = (b'\\', b'/', b'.')
    else:
        seps_and_dot = ('\\', '/', '.')
    return genericpath._splitext(p, *seps_and_dot)
splitext.__doc__ = genericpath._splitext.__doc__
Guido van Rossum555915a1994-02-24 11:32:59 +0000210
211
212# Return the tail (basename) part of a path.
213
def basename(p):
    """Returns the final component of a pathname"""
    _head, tail = split(p)
    return tail
Guido van Rossum555915a1994-02-24 11:32:59 +0000217
218
219# Return the head (dirname) part of a path.
220
def dirname(p):
    """Returns the directory component of a pathname"""
    head, _tail = split(p)
    return head
Guido van Rossum555915a1994-02-24 11:32:59 +0000224
Guido van Rossum555915a1994-02-24 11:32:59 +0000225# Is a path a symbolic link?
Brian Curtind40e6f72010-07-08 21:39:08 +0000226# This will always return false on systems where os.lstat doesn't exist.
Guido van Rossum555915a1994-02-24 11:32:59 +0000227
def islink(path):
    """Test whether a path is a symbolic link.
    This will always return false for Windows prior to 6.0.
    """
    try:
        info = os.lstat(path)
    except (OSError, ValueError, AttributeError):
        # A path that cannot be stat'ed is reported as "not a link".
        return False
    else:
        return stat.S_ISLNK(info.st_mode)
Guido van Rossum555915a1994-02-24 11:32:59 +0000237
Brian Curtind40e6f72010-07-08 21:39:08 +0000238# Being true for dangling symbolic links is also useful.
239
def lexists(path):
    """Test whether a path exists.  Returns True for broken symbolic links"""
    try:
        os.lstat(path)
    except (OSError, ValueError):
        return False
    else:
        return True
Johannes Gijsbersae882f72004-08-30 10:19:56 +0000247
Tim Golden6b528062013-08-01 12:44:00 +0100248# Is a path a mount point?
249# Any drive letter root (eg c:\)
250# Any share UNC (eg \\server\share)
251# Any volume mounted on a filesystem folder
252#
253# No one method detects all three situations. Historically we've lexically
254# detected drive letter roots and share UNCs. The canonical approach to
255# detecting mounted volumes (querying the reparse tag) fails for the most
256# common case: drive letter roots. The alternative which uses GetVolumePathName
257# fails if the drive letter is the result of a SUBST.
try:
    from nt import _getvolumepathname
except ImportError:
    # No native helper available; ismount() then relies on lexical checks only.
    _getvolumepathname = None
def ismount(path):
    """Test whether a path is a mount point (a drive root, the root of a
    share, or a mounted volume)"""
    path = os.fspath(path)
    seps = _get_bothseps(path)
    path = abspath(path)
    root, rest = splitdrive(path)
    if root and root[0] in seps:
        # UNC drive: a mount point only when nothing follows the share.
        return not rest or rest in seps
    if rest in seps:
        # Drive-letter root.
        return True
    if not _getvolumepathname:
        return False
    # Mounted volume: the path is its own volume path, ignoring any
    # trailing separators.
    return path.rstrip(seps) == _getvolumepathname(path).rstrip(seps)
279
Guido van Rossum555915a1994-02-24 11:32:59 +0000280# Expand paths beginning with '~' or '~user'.
281# '~' means $HOME; '~user' means that user's home directory.
282# If the path doesn't begin with '~', or if the user or $HOME is unknown,
283# the path is returned unchanged (leaving error reporting to whatever
284# function is called with the expanded path as argument).
285# See also module 'glob' for expansion of *, ? and [...] in pathnames.
286# (A function should also be defined to do full *sh-style environment
287# variable expansion.)
288
def expanduser(path):
    """Expand ~ and ~user constructs.

    The home directory is taken from USERPROFILE, or else from
    HOMEDRIVE + HOMEPATH.  If neither is available, or the home of
    another user cannot be guessed, the path is returned unchanged.
    The result has the same type (str or bytes) as the input.
    """
    path = os.fspath(path)
    if isinstance(path, bytes):
        tilde = b'~'
    else:
        tilde = '~'
    if not path.startswith(tilde):
        return path
    # Find the end of the "~" or "~user" component.
    seps = _get_bothseps(path)
    i, n = 1, len(path)
    while i < n and path[i] not in seps:
        i += 1

    if 'USERPROFILE' in os.environ:
        userhome = os.environ['USERPROFILE']
    elif 'HOMEPATH' not in os.environ:
        return path
    else:
        drive = os.environ.get('HOMEDRIVE', '')
        userhome = join(drive, os.environ['HOMEPATH'])

    if i != 1:  # ~user
        target_user = path[1:i]
        if isinstance(target_user, bytes):
            target_user = os.fsdecode(target_user)
        current_user = os.environ.get('USERNAME')

        # "~user" naming the current user needs no guessing: userhome is
        # already that user's home directory.
        if target_user != current_user:
            # Try to guess the other user's home directory.  By default
            # all user directories are located in the same place and are
            # named by the corresponding usernames.  If the current
            # user's home points to a nonstandard place, this guess is
            # likely wrong, and so we bail out.
            if current_user != basename(userhome):
                return path
            userhome = join(dirname(userhome), target_user)

    if isinstance(path, bytes):
        userhome = os.fsencode(userhome)

    return userhome + path[i:]
Guido van Rossum555915a1994-02-24 11:32:59 +0000334
335
336# Expand paths containing shell variable substitutions.
337# The following rules apply:
Guido van Rossum15e22e11997-12-05 19:03:01 +0000338# - no expansion within single quotes
Guido van Rossumd8faa362007-04-27 19:54:29 +0000339# - '$$' is translated into '$'
340# - '%%' is translated into '%' if '%%' are not seen in %var1%%var2%
Guido van Rossum15e22e11997-12-05 19:03:01 +0000341# - ${varname} is accepted.
Guido van Rossumd8faa362007-04-27 19:54:29 +0000342# - $varname is accepted.
343# - %varname% is accepted.
344# - varnames can be made out of letters, digits and the characters '_-'
#   (though this is not verified in the ${varname} and %varname% cases)
Guido van Rossum555915a1994-02-24 11:32:59 +0000346# XXX With COMMAND.COM you can use any characters in a variable name,
347# XXX except '^|<>='.
348
def expandvars(path):
    """Expand shell variables of the forms $var, ${var} and %var%.

    Text between single quotes is copied verbatim, '$$' becomes '$' and
    '%%' becomes '%'.  Unknown variables and unterminated constructs are
    left unchanged."""
    path = os.fspath(path)
    if isinstance(path, bytes):
        if b'$' not in path and b'%' not in path:
            return path
        import string
        varchars = bytes(string.ascii_letters + string.digits + '_-', 'ascii')
        quote, percent, dollar = b'\'', b'%', b'$'
        brace, rbrace = b'{', b'}'
        # None (no os.environb) selects the decode/lookup/encode path below.
        environ = getattr(os, 'environb', None)
    else:
        if '$' not in path and '%' not in path:
            return path
        import string
        varchars = string.ascii_letters + string.digits + '_-'
        quote, percent, dollar = '\'', '%', '$'
        brace, rbrace = '{', '}'
        environ = os.environ

    def lookup(name, fallback):
        # Value of variable *name*, or *fallback* when it is not set.
        try:
            if environ is None:
                return os.fsencode(os.environ[os.fsdecode(name)])
            return environ[name]
        except KeyError:
            return fallback

    pieces = []
    pos = 0
    end = len(path)
    while pos < end:
        ch = path[pos:pos + 1]
        following = path[pos + 1:pos + 2]
        if ch == quote:  # no expansion within single quotes
            close = path.find(quote, pos + 1)
            if close < 0:
                # Unterminated quote: the rest is copied as is.
                pieces.append(path[pos:])
                break
            pieces.append(path[pos:close + 1])
            pos = close + 1
        elif ch == percent:  # variable or '%'
            if following == percent:
                pieces.append(percent)
                pos += 2
                continue
            close = path.find(percent, pos + 1)
            if close < 0:
                pieces.append(path[pos:])
                break
            name = path[pos + 1:close]
            pieces.append(lookup(name, percent + name + percent))
            pos = close + 1
        elif ch == dollar:  # variable or '$$'
            if following == dollar:
                pieces.append(dollar)
                pos += 2
            elif following == brace:
                close = path.find(rbrace, pos + 2)
                if close < 0:
                    pieces.append(path[pos:])
                    break
                name = path[pos + 2:close]
                pieces.append(lookup(name, dollar + brace + name + rbrace))
                pos = close + 1
            else:
                # $varname: the name runs as long as characters are in varchars.
                stop = pos + 1
                while stop < end and path[stop:stop + 1] in varchars:
                    stop += 1
                name = path[pos + 1:stop]
                pieces.append(lookup(name, dollar + name))
                pos = stop
        else:
            pieces.append(ch)
            pos += 1
    return path[:0].join(pieces)
Guido van Rossum555915a1994-02-24 11:32:59 +0000456
457
Tim Peters54a14a32001-08-30 22:05:26 +0000458# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A\B.
Guido van Rossum3df7b5a1996-08-26 16:35:26 +0000459# Previously, this function also truncated pathnames to 8+3 format,
460# but as this module is called "ntpath", that's obviously wrong!
Guido van Rossum555915a1994-02-24 11:32:59 +0000461
def normpath(path):
    """Normalize path, eliminating double slashes, etc."""
    path = os.fspath(path)
    if isinstance(path, bytes):
        sep, altsep = b'\\', b'/'
        curdir, pardir = b'.', b'..'
        special_prefixes = (b'\\\\.\\', b'\\\\?\\')
    else:
        sep, altsep = '\\', '/'
        curdir, pardir = '.', '..'
        special_prefixes = ('\\\\.\\', '\\\\?\\')
    if path.startswith(special_prefixes):
        # in the case of paths with these prefixes:
        # \\.\ -> device names
        # \\?\ -> literal paths
        # do not do any normalization, but return the path
        # unchanged apart from the call to os.fspath()
        return path
    prefix, path = splitdrive(path.replace(altsep, sep))

    # collapse initial backslashes
    if path.startswith(sep):
        prefix += sep
        path = path.lstrip(sep)

    kept = []
    for comp in path.split(sep):
        if not comp or comp == curdir:
            continue
        if comp != pardir:
            kept.append(comp)
        elif kept and kept[-1] != pardir:
            # '..' cancels the preceding real component.
            kept.pop()
        elif not kept and prefix.endswith(sep):
            # '..' directly under the root is dropped.
            pass
        else:
            kept.append(comp)
    # If the path is now empty, substitute '.'
    if not prefix and not kept:
        kept.append(curdir)
    return prefix + sep.join(kept)
Guido van Rossume294cf61999-01-29 18:05:18 +0000511
def _abspath_fallback(path):
    """Return the absolute version of a path as a fallback function in case
    `nt._getfullpathname` is not available or raises OSError. See bpo-31047 for
    more.

    """
    path = os.fspath(path)
    if isabs(path):
        return normpath(path)
    # Relative path: anchor it at the current directory, using the
    # getcwd variant that matches the argument's type.
    cwd = os.getcwdb() if isinstance(path, bytes) else os.getcwd()
    return normpath(join(cwd, path))
Guido van Rossume294cf61999-01-29 18:05:18 +0000527
528# Return an absolute path.
try:
    from nt import _getfullpathname
except ImportError:
    # not running on Windows - mock up something sensible
    abspath = _abspath_fallback
else:
    # use native Windows method on Windows
    def abspath(path):
        """Return the absolute version of a path."""
        try:
            full = _getfullpathname(path)
            return normpath(full)
        except (OSError, ValueError):
            return _abspath_fallback(path)
Guido van Rossum83eeef42001-09-17 15:16:09 +0000542
Steve Dower75e06492019-08-21 13:43:06 -0700543try:
544 from nt import _getfinalpathname, readlink as _nt_readlink
545except ImportError:
546 # realpath is a no-op on systems without _getfinalpathname support.
547 realpath = abspath
548else:
def _readlink_deep(path):
    # Follow a chain of links starting at *path* and return the last path
    # reached.  Stops when a path repeats (compared via normcase), when
    # reading the link fails with one of the error codes below, or when a
    # ValueError is raised.
    #
    # These error codes indicate that we should stop reading links and
    # return the path we currently have.
    # 1: ERROR_INVALID_FUNCTION
    # 2: ERROR_FILE_NOT_FOUND
    # 3: ERROR_DIRECTORY_NOT_FOUND
    # 5: ERROR_ACCESS_DENIED
    # 21: ERROR_NOT_READY (implies drive with no media)
    # 32: ERROR_SHARING_VIOLATION (probably an NTFS paging file)
    # 50: ERROR_NOT_SUPPORTED (implies no support for reparse points)
    # 67: ERROR_BAD_NET_NAME (implies remote server unavailable)
    # 87: ERROR_INVALID_PARAMETER
    # 4390: ERROR_NOT_A_REPARSE_POINT
    # 4392: ERROR_INVALID_REPARSE_DATA
    # 4393: ERROR_REPARSE_TAG_INVALID
    allowed_winerror = 1, 2, 3, 5, 21, 32, 50, 67, 87, 4390, 4392, 4393

    visited = set()
    key = normcase(path)
    while key not in visited:
        visited.add(key)
        previous = path
        try:
            path = _nt_readlink(previous)
            # Links may be relative, so resolve them against their
            # own location
            if not isabs(path):
                # If it's something other than a symlink, we don't know
                # what it's actually going to be resolved against, so
                # just return the old path.
                if not islink(previous):
                    return previous
                path = normpath(join(dirname(previous), path))
        except OSError as ex:
            if ex.winerror in allowed_winerror:
                break
            raise
        except ValueError:
            # Stop on reparse points that are not symlinks
            break
        key = normcase(path)
    return path
590
591 def _getfinalpathname_nonstrict(path):
Steve Dower89b89332019-09-16 15:25:11 +0100592 # These error codes indicate that we should stop resolving the path
593 # and return the value we currently have.
594 # 1: ERROR_INVALID_FUNCTION
595 # 2: ERROR_FILE_NOT_FOUND
596 # 3: ERROR_DIRECTORY_NOT_FOUND
597 # 5: ERROR_ACCESS_DENIED
598 # 21: ERROR_NOT_READY (implies drive with no media)
599 # 32: ERROR_SHARING_VIOLATION (probably an NTFS paging file)
600 # 50: ERROR_NOT_SUPPORTED
601 # 67: ERROR_BAD_NET_NAME (implies remote server unavailable)
602 # 87: ERROR_INVALID_PARAMETER
603 # 123: ERROR_INVALID_NAME
Steve Dowera0e3d272019-10-03 08:31:03 -0700604 # 1920: ERROR_CANT_ACCESS_FILE
Steve Dower89b89332019-09-16 15:25:11 +0100605 # 1921: ERROR_CANT_RESOLVE_FILENAME (implies unfollowable symlink)
Steve Dowera0e3d272019-10-03 08:31:03 -0700606 allowed_winerror = 1, 2, 3, 5, 21, 32, 50, 67, 87, 123, 1920, 1921
Steve Dower75e06492019-08-21 13:43:06 -0700607
608 # Non-strict algorithm is to find as much of the target directory
609 # as we can and join the rest.
610 tail = ''
Steve Dower75e06492019-08-21 13:43:06 -0700611 while path:
612 try:
Steve Dower75e06492019-08-21 13:43:06 -0700613 path = _getfinalpathname(path)
614 return join(path, tail) if tail else path
615 except OSError as ex:
616 if ex.winerror not in allowed_winerror:
617 raise
Steve Dowerabde52c2019-11-15 09:49:21 -0800618 try:
619 # The OS could not resolve this path fully, so we attempt
620 # to follow the link ourselves. If we succeed, join the tail
621 # and return.
622 new_path = _readlink_deep(path)
623 if new_path != path:
624 return join(new_path, tail) if tail else new_path
625 except OSError:
626 # If we fail to readlink(), let's keep traversing
627 pass
Steve Dower75e06492019-08-21 13:43:06 -0700628 path, name = split(path)
Steve Dower89b89332019-09-16 15:25:11 +0100629 # TODO (bpo-38186): Request the real file name from the directory
630 # entry using FindFirstFileW. For now, we will return the path
631 # as best we have it
Steve Dower75e06492019-08-21 13:43:06 -0700632 if path and not name:
Steve Dowerabde52c2019-11-15 09:49:21 -0800633 return path + tail
Steve Dower75e06492019-08-21 13:43:06 -0700634 tail = join(name, tail) if tail else name
Steve Dowerabde52c2019-11-15 09:49:21 -0800635 return tail
Steve Dower75e06492019-08-21 13:43:06 -0700636
def realpath(path):
    """Return the final, absolute form of *path* with links resolved.

    The path is normalised, made absolute against the current working
    directory when necessary, and handed to _getfinalpathname().  When
    that call raises OSError, _getfinalpathname_nonstrict() is used
    instead.  The extended-length prefix that _getfinalpathname() adds is
    removed again unless the caller supplied it.  Works for both str and
    bytes paths; the result has the same type as the argument.
    """
    path = normpath(path)
    if isinstance(path, bytes):
        long_prefix = b'\\\\?\\'
        long_unc_prefix = b'\\\\?\\UNC\\'
        plain_unc_prefix = b'\\\\'
        cwd = os.getcwdb()
        null_name = os.fsencode(devnull)
        null_device = b'\\\\.\\NUL'
    else:
        long_prefix = '\\\\?\\'
        long_unc_prefix = '\\\\?\\UNC\\'
        plain_unc_prefix = '\\\\'
        cwd = os.getcwd()
        null_name = devnull
        null_device = '\\\\.\\NUL'

    # bpo-38081: Special case for realpath('nul') / realpath(b'nul')
    if normcase(path) == normcase(null_name):
        return null_device

    had_prefix = path.startswith(long_prefix)
    if not (had_prefix or isabs(path)):
        path = join(cwd, path)

    try:
        resolved = _getfinalpathname(path)
    except OSError as exc:
        # Remember why strict resolution failed; it is compared below with
        # the error produced by the prefix-less path.
        first_winerror = exc.winerror
        resolved = _getfinalpathname_nonstrict(path)
    else:
        first_winerror = 0

    # The path returned by _getfinalpathname will always start with \\?\ -
    # keep it only when the caller passed it in, or when there is nothing
    # to strip.
    if had_prefix or not resolved.startswith(long_prefix):
        return resolved

    # For UNC paths the prefix is actually \\?\UNC\ and is replaced by a
    # plain double backslash.
    if resolved.startswith(long_unc_prefix):
        stripped = plain_unc_prefix + resolved[len(long_unc_prefix):]
    else:
        stripped = resolved[len(long_prefix):]

    # Only use the short form if it resolves to the same path, or if it
    # fails in exactly the way the original lookup did (i.e. the path did
    # not exist then and does not exist now).
    try:
        use_stripped = _getfinalpathname(stripped) == resolved
    except OSError as exc:
        use_stripped = exc.winerror == first_winerror
    return stripped if use_stripped else resolved
684
685
# Unicode filenames are unavailable on the Win9x family and earlier; those
# report a platform value (index 3 of getwindowsversion()) below 2.  When
# sys.getwindowsversion does not exist at all the flag is False.
supports_unicode_filenames = (
    sys.getwindowsversion()[3] >= 2
    if hasattr(sys, "getwindowsversion")
    else False
)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000689
def relpath(path, start=None):
    """Return *path* expressed relative to *start*.

    *start* defaults to the current directory.  Both arguments may be str
    or bytes (or path-like objects); the result has the type of *path*.
    Components are compared with normcase().

    Raises ValueError when *path* is empty or when the two locations are
    on different drives.
    """
    path = os.fspath(path)
    if isinstance(path, bytes):
        sep, curdir, pardir = b'\\', b'.', b'..'
    else:
        sep, curdir, pardir = '\\', '.', '..'

    if start is None:
        start = curdir

    if not path:
        raise ValueError("no path specified")

    start = os.fspath(start)
    try:
        abs_start = abspath(normpath(start))
        abs_path = abspath(normpath(path))
        start_drive, start_rest = splitdrive(abs_start)
        path_drive, path_rest = splitdrive(abs_path)
        if normcase(start_drive) != normcase(path_drive):
            raise ValueError("path is on mount %r, start on mount %r" % (
                path_drive, start_drive))

        # Drop the empty strings produced by leading/doubled separators.
        start_parts = list(filter(None, start_rest.split(sep)))
        path_parts = list(filter(None, path_rest.split(sep)))

        # Count the leading components shared by both locations.
        limit = min(len(start_parts), len(path_parts))
        shared = 0
        while (shared < limit and
               normcase(start_parts[shared]) == normcase(path_parts[shared])):
            shared += 1

        # Climb out of what remains of start, then descend into path.
        climb = [pardir] * (len(start_parts) - shared)
        rel_parts = climb + path_parts[shared:]
        return join(*rel_parts) if rel_parts else curdir
    except (TypeError, ValueError, AttributeError, BytesWarning, DeprecationWarning):
        # Give the shared argument checker a chance to report a clearer
        # error before the original exception propagates.
        genericpath._check_arg_types('relpath', path, start)
        raise
Brian Curtind40e6f72010-07-08 21:39:08 +0000734
735
Serhiy Storchaka38220932015-03-31 15:31:53 +0300736# Return the longest common sub-path of the sequence of paths given as input.
737# The function is case-insensitive and 'separator-insensitive', i.e. if the
738# only difference between two paths is the use of '\' versus '/' as separator,
739# they are deemed to be equal.
740#
741# However, the returned path will have the standard '\' separator (even if the
742# given paths had the alternative '/' separator) and will have the case of the
743# first path given in the sequence. Additionally, any trailing separator is
744# stripped from the returned path.
745
def commonpath(paths):
    """Given a sequence of path names, returns the longest common sub-path.

    Any iterable of str, bytes or path-like objects is accepted, including
    one-shot iterators and generators.  Paths are compared lower-cased and
    with the alternative separator converted to the standard one.  The
    result uses the standard separator, carries the case of the first path
    and has no trailing separator.

    Raises ValueError if *paths* is empty, if absolute and relative paths
    are mixed, or if the paths are not all on the same drive.  When a
    TypeError or AttributeError occurs, the arguments are passed to
    genericpath._check_arg_types() before the error is re-raised.
    """
    # Materialise the argument before trusting its truth value: iterators
    # and generators are always truthy, so an empty one would otherwise
    # slip through and fail with IndexError on paths[0] below.  The first
    # test keeps the historical ValueError for falsy non-iterable input.
    if paths:
        paths = tuple(map(os.fspath, paths))
    if not paths:
        raise ValueError('commonpath() arg is an empty sequence')

    if isinstance(paths[0], bytes):
        sep = b'\\'
        altsep = b'/'
        curdir = b'.'
    else:
        sep = '\\'
        altsep = '/'
        curdir = '.'

    try:
        drivesplits = [splitdrive(p.replace(altsep, sep).lower()) for p in paths]
        split_paths = [p.split(sep) for d, p in drivesplits]

        # Unpacking a one-element set succeeds only when every path agrees
        # on whether it starts with a separator.
        try:
            rooted, = {p[:1] == sep for d, p in drivesplits}
        except ValueError:
            raise ValueError("Can't mix absolute and relative paths") from None

        # Check that all drive letters or UNC paths match. The check is made only
        # now otherwise type errors for mixing strings and bytes would not be
        # caught.
        if len({d for d, p in drivesplits}) != 1:
            raise ValueError("Paths don't have the same drive")

        # The answer is cut from the first path so its original case is kept.
        drive, path = splitdrive(paths[0].replace(altsep, sep))
        common = [c for c in path.split(sep) if c and c != curdir]

        split_paths = [[c for c in s if c and c != curdir] for s in split_paths]
        # The lexicographically smallest and largest component lists bound
        # all the others, so their shared prefix is shared by every path.
        s1 = min(split_paths)
        s2 = max(split_paths)
        for i, c in enumerate(s1):
            if c != s2[i]:
                common = common[:i]
                break
        else:
            common = common[:len(s1)]

        prefix = drive + sep if rooted else drive
        return prefix + sep.join(common)
    except (TypeError, AttributeError):
        genericpath._check_arg_types('commonpath', *paths)
        raise
796
797
Brian Curtin9c669cc2011-06-08 18:17:18 -0500798try:
799 # The genericpath.isdir implementation uses os.stat and checks the mode
800 # attribute to tell whether or not the path is a directory.
801 # This is overkill on Windows - just pass the path to GetFileAttributes
802 # and check the attribute from there.
Brian Curtin95d028f2011-06-09 09:10:38 -0500803 from nt import _isdir as isdir
Brett Cannoncd171c82013-07-04 17:43:24 -0400804except ImportError:
Brian Curtin95d028f2011-06-09 09:10:38 -0500805 # Use genericpath.isdir as imported above.
806 pass