blob: 6f771773a7d1b5d600ea172b322a09e7997086fa [file] [log] [blame]
# Module 'ntpath' -- common operations on WinNT/Win95 pathnames
"""Common pathname manipulations, WindowsNT/95 version.

Instead of importing this module directly, import os and refer to this
module as os.path.
"""
Guido van Rossum555915a1994-02-24 11:32:59 +00007
# strings representing various path-related bits and pieces
# These are primarily for export; internally, they are hardcoded.
# Should be set before imports for resolving cyclic dependency.
curdir = '.'            # component that normpath() drops as "current directory"
pardir = '..'           # component that normpath() resolves as "parent directory"
extsep = '.'            # character splitext() treats as the extension separator
sep = '\\'              # primary directory separator
pathsep = ';'           # separator between entries of a search path (see defpath)
altsep = '/'            # alternative directory separator, accepted on input
defpath = '.;C:\\bin'   # default search path
devnull = 'nul'         # name of the null device (special-cased by realpath())
19
Guido van Rossum555915a1994-02-24 11:32:59 +000020import os
Mark Hammond8696ebc2002-10-08 02:44:31 +000021import sys
Christian Heimes05e8be12008-02-23 18:30:17 +000022import stat
Guido van Rossumd8faa362007-04-27 19:54:29 +000023import genericpath
Thomas Wouters89f507f2006-12-13 04:49:30 +000024from genericpath import *
Skip Montanaro4d5d5bf2000-07-13 01:01:03 +000025
# Names exported by ``from ntpath import *``.  Several of them (for example
# commonprefix, getsize, exists, isdir, isfile, samefile) are not defined in
# this file; they are expected to arrive via ``from genericpath import *``.
__all__ = ["normcase","isabs","join","splitdrive","split","splitext",
           "basename","dirname","commonprefix","getsize","getmtime",
           "getatime","getctime", "islink","exists","lexists","isdir","isfile",
           "ismount", "expanduser","expandvars","normpath","abspath",
           "curdir","pardir","sep","pathsep","defpath","altsep",
           "extsep","devnull","realpath","supports_unicode_filenames","relpath",
           "samefile", "sameopenfile", "samestat", "commonpath"]
Guido van Rossum555915a1994-02-24 11:32:59 +000033
def _get_bothseps(path):
    """Return both directory separators, typed (bytes or str) like *path*."""
    return b'\\/' if isinstance(path, bytes) else '\\/'
39
# Normalize the case of a pathname and map slashes to backslashes.
# Other normalizations (such as optimizing '../' away) are not done
# (this is done by normpath).

def normcase(s):
    """Normalize case of pathname.

    Makes all characters lowercase and all slashes into backslashes."""
    s = os.fspath(s)
    # Pick literals of the same type as the input so that bytes stay bytes.
    slash, backslash = (b'/', b'\\') if isinstance(s, bytes) else ('/', '\\')
    return s.replace(slash, backslash).lower()
Guido van Rossum555915a1994-02-24 11:32:59 +000053
Guido van Rossum77e1db31997-06-02 23:11:57 +000054
# Return whether a path is absolute.
# Trivial in Posix, harder on Windows.
# For Windows it is absolute if it starts with a slash or backslash (current
# volume), or if a pathname after the volume-letter-and-colon or UNC-resource
# starts with a slash or backslash.

def isabs(s):
    """Test whether a path is absolute"""
    s = os.fspath(s)
    if isinstance(s, bytes):
        altsep, sep, literal_prefix = b'/', b'\\', b'\\\\?\\'
    else:
        altsep, sep, literal_prefix = '/', '\\', '\\\\?\\'
    # Paths beginning with \\?\ are always absolute, but do not
    # necessarily contain a drive.
    if s.replace(altsep, sep).startswith(literal_prefix):
        return True
    # Otherwise the part after the drive/UNC share must be rooted.
    rest = splitdrive(s)[1]
    return len(rest) > 0 and rest[0] in _get_bothseps(rest)
Guido van Rossum555915a1994-02-24 11:32:59 +000074
75
# Join two (or more) paths.
def join(path, *paths):
    """Join *path* with each of *paths*, inserting backslashes as needed.

    A later component that is rooted, or that names a different drive,
    discards what was accumulated before it.  If the arguments mix str and
    bytes (or are of an unsupported type), the error is re-raised after
    genericpath._check_arg_types() has had the chance to raise a more
    descriptive one.
    """
    path = os.fspath(path)
    if isinstance(path, bytes):
        sep, seps, colon = b'\\', b'\\/', b':'
    else:
        sep, seps, colon = '\\', '\\/', ':'
    try:
        if not paths:
            path[:0] + sep  #23780: Ensure compatible data type even if p is null.
        drive, tail = splitdrive(path)
        for part in map(os.fspath, paths):
            part_drive, part_tail = splitdrive(part)
            if part_tail and part_tail[0] in seps:
                # The component is rooted: it replaces the accumulated path,
                # and also the drive unless it has none and we already do.
                if part_drive or not drive:
                    drive = part_drive
                tail = part_tail
                continue
            if part_drive and part_drive != drive:
                if part_drive.lower() != drive.lower():
                    # Different drives => ignore the first path entirely
                    drive, tail = part_drive, part_tail
                    continue
                # Same drive in different case: adopt the newer spelling.
                drive = part_drive
            # The component is relative to what we have so far.
            if tail and tail[-1] not in seps:
                tail += sep
            tail += part_tail
        # Add a separator between a UNC share and a non-absolute path.
        unc_needs_sep = (tail and tail[0] not in seps and
                         drive and drive[-1:] != colon)
        if unc_needs_sep:
            return drive + sep + tail
        return drive + tail
    except (TypeError, AttributeError, BytesWarning):
        genericpath._check_arg_types('join', path, *paths)
        raise
Guido van Rossum555915a1994-02-24 11:32:59 +0000119
120
# Split a path in a drive specification (a drive letter followed by a
# colon) and the path specification.
# It is always true that drivespec + pathspec == p
def splitdrive(p):
    """Split a pathname into drive/UNC sharepoint and relative path specifiers.
    Returns a 2-tuple (drive_or_unc, path); either part may be empty.

    If you assign
        result = splitdrive(p)
    It is always true that:
        result[0] + result[1] == p

    If the path contained a drive letter, drive_or_unc will contain everything
    up to and including the colon.  e.g. splitdrive("c:/dir") returns ("c:", "/dir")

    If the path contained a UNC path, the drive_or_unc will contain the host name
    and share up to but not including the fourth directory separator character.
    e.g. splitdrive("//host/computer/dir") returns ("//host/computer", "/dir")

    Paths cannot contain both a drive letter and a UNC path.

    """
    p = os.fspath(p)
    no_drive = p[:0]
    if len(p) < 2:
        # Too short to carry either "X:" or a "\\" UNC introducer.
        return no_drive, p
    if isinstance(p, bytes):
        sep, altsep, colon = b'\\', b'/', b':'
    else:
        sep, altsep, colon = '\\', '/', ':'
    # Search in a backslash-only copy, but always slice the original so the
    # caller's separators are preserved in the result.
    normalized = p.replace(altsep, sep)
    if normalized.startswith(sep * 2) and normalized[2:3] != sep:
        # is a UNC path:
        # vvvvvvvvvvvvvvvvvvvv drive letter or UNC path
        # \\machine\mountpoint\directory\etc\...
        #           directory ^^^^^^^^^^^^^^^
        host_end = normalized.find(sep, 2)
        if host_end == -1:
            return no_drive, p
        share_end = normalized.find(sep, host_end + 1)
        # a UNC path can't have two slashes in a row
        # (after the initial two)
        if share_end == host_end + 1:
            return no_drive, p
        if share_end == -1:
            share_end = len(p)
        return p[:share_end], p[share_end:]
    if normalized[1:2] == colon:
        return p[:2], p[2:]
    return no_drive, p
Guido van Rossumf3c695c1999-04-06 19:32:19 +0000173
174
# Split a path in head (everything up to the last '/') and tail (the
# rest).  After the trailing '/' is stripped, the invariant
# join(head, tail) == p holds.
# The resulting head won't end in '/' unless it is the root.

def split(p):
    """Split a pathname.

    Return tuple (head, tail) where tail is everything after the final slash.
    Either part may be empty."""
    p = os.fspath(p)
    seps = _get_bothseps(p)
    drive, rest = splitdrive(p)
    # Index just past the last separator of either kind (0 if there is none,
    # because rfind() yields -1 for both).
    cut = 1 + max(rest.rfind(seps[:1]), rest.rfind(seps[1:]))
    head, tail = rest[:cut], rest[cut:]  # now tail has no slashes
    # remove trailing slashes from head, unless it's all slashes
    head = head.rstrip(seps) or head
    return drive + head, tail
Guido van Rossum555915a1994-02-24 11:32:59 +0000196
197
# Split a path in root and extension.
# The extension is everything starting at the last dot in the last
# pathname component; the root is everything before that.
# It is always true that root + ext == p.

def splitext(p):
    p = os.fspath(p)
    # (sep, altsep, extsep) literals typed like the input path.
    if isinstance(p, bytes):
        markers = (b'\\', b'/', b'.')
    else:
        markers = ('\\', '/', '.')
    return genericpath._splitext(p, *markers)
splitext.__doc__ = genericpath._splitext.__doc__
Guido van Rossum555915a1994-02-24 11:32:59 +0000210
211
# Return the tail (basename) part of a path.

def basename(p):
    """Returns the final component of a pathname"""
    _head, tail = split(p)
    return tail
Guido van Rossum555915a1994-02-24 11:32:59 +0000217
218
# Return the head (dirname) part of a path.

def dirname(p):
    """Returns the directory component of a pathname"""
    head, _tail = split(p)
    return head
Guido van Rossum555915a1994-02-24 11:32:59 +0000224
# Is a path a symbolic link?
# This will always return false on systems where os.lstat doesn't exist.

def islink(path):
    """Test whether a path is a symbolic link.
    This will always return false for Windows prior to 6.0.
    """
    try:
        info = os.lstat(path)
    except (OSError, ValueError, AttributeError):
        # Missing path, unrepresentable path, or no os.lstat at all.
        return False
    else:
        return stat.S_ISLNK(info.st_mode)
Guido van Rossum555915a1994-02-24 11:32:59 +0000237
# Being true for dangling symbolic links is also useful.

def lexists(path):
    """Test whether a path exists.  Returns True for broken symbolic links"""
    try:
        # Only success or failure matters; the stat result itself is not
        # needed, so it is not bound to a name.
        os.lstat(path)
    except (OSError, ValueError):
        # OSError: the path could not be stat'ed.
        # ValueError: os.lstat() rejected the path value itself.
        return False
    return True
Johannes Gijsbersae882f72004-08-30 10:19:56 +0000247
# Is a path a mount point?
# Any drive letter root (eg c:\)
# Any share UNC (eg \\server\share)
# Any volume mounted on a filesystem folder
#
# No one method detects all three situations. Historically we've lexically
# detected drive letter roots and share UNCs. The canonical approach to
# detecting mounted volumes (querying the reparse tag) fails for the most
# common case: drive letter roots. The alternative which uses GetVolumePathName
# fails if the drive letter is the result of a SUBST.
try:
    from nt import _getvolumepathname
except ImportError:
    _getvolumepathname = None
def ismount(path):
    """Test whether a path is a mount point (a drive root, the root of a
    share, or a mounted volume)"""
    path = os.fspath(path)
    seps = _get_bothseps(path)
    path = abspath(path)
    root, rest = splitdrive(path)
    if root and root[0] in seps:
        # UNC share: a mount point only if nothing, or just a separator,
        # follows the share name.
        return (not rest) or (rest in seps)
    if rest in seps:
        # Drive letter root such as "c:\".
        return True

    if not _getvolumepathname:
        return False
    # Mounted volume: the path is its own volume path (ignoring any
    # trailing separators).
    return path.rstrip(seps) == _getvolumepathname(path).rstrip(seps)
Guido van Rossum555915a1994-02-24 11:32:59 +0000278
279
# Expand paths beginning with '~' or '~user'.
# '~' means $HOME; '~user' means that user's home directory.
# If the path doesn't begin with '~', or if the user or $HOME is unknown,
# the path is returned unchanged (leaving error reporting to whatever
# function is called with the expanded path as argument).
# See also module 'glob' for expansion of *, ? and [...] in pathnames.

def expanduser(path):
    """Expand ~ and ~user constructs.

    If user or $HOME is unknown, do nothing.

    The home directory is taken from the USERPROFILE environment variable,
    or failing that from HOMEDRIVE + HOMEPATH.  The result has the same type
    (str or bytes) as *path*."""
    path = os.fspath(path)
    tilde = b'~' if isinstance(path, bytes) else '~'
    if not path.startswith(tilde):
        return path

    # Find the end of the '~' or '~user' prefix: the first separator, or the
    # end of the string.  The separator set is computed once, outside the loop.
    seps = _get_bothseps(path)
    i, n = 1, len(path)
    while i < n and path[i] not in seps:
        i += 1

    if 'USERPROFILE' in os.environ:
        userhome = os.environ['USERPROFILE']
    elif 'HOMEPATH' not in os.environ:
        return path
    else:
        drive = os.environ.get('HOMEDRIVE', '')
        userhome = join(drive, os.environ['HOMEPATH'])

    if isinstance(path, bytes):
        userhome = os.fsencode(userhome)

    if i != 1:  # ~user
        # NOTE: this takes the named user's home to be a sibling of the
        # current user's home directory; the account is not looked up.
        userhome = join(dirname(userhome), path[1:i])

    return userhome + path[i:]
Guido van Rossum555915a1994-02-24 11:32:59 +0000322
323
# Expand paths containing shell variable substitutions.
# The following rules apply:
#       - no expansion within single quotes
#       - '$$' is translated into '$'
#       - '%%' is translated into '%' if '%%' are not seen in %var1%%var2%
#       - ${varname} is accepted.
#       - $varname is accepted.
#       - %varname% is accepted.
#       - varnames can be made out of letters, digits and the characters '_-'
#         (though is not verified in the ${varname} and %varname% cases)
# XXX With COMMAND.COM you can use any characters in a variable name,
# XXX except '^|<>='.

def expandvars(path):
    """Expand shell variables of the forms $var, ${var} and %var%.

    Unknown variables are left unchanged."""
    path = os.fspath(path)
    is_bytes = isinstance(path, bytes)
    if is_bytes:
        quote, percent, dollar = b'\'', b'%', b'$'
        brace, rbrace = b'{', b'}'
    else:
        quote, percent, dollar = '\'', '%', '$'
        brace, rbrace = '{', '}'
    if dollar not in path and percent not in path:
        # Nothing that could introduce a variable reference.
        return path

    import string
    varchars = string.ascii_letters + string.digits + '_-'
    if is_bytes:
        varchars = bytes(varchars, 'ascii')
        # os.environb is not available everywhere; None selects the
        # decode/encode route through os.environ in lookup() below.
        environ = getattr(os, 'environb', None)
    else:
        environ = os.environ

    def lookup(name, fallback):
        # Value of the variable *name*, or *fallback* if it is not set.
        try:
            if environ is None:
                return os.fsencode(os.environ[os.fsdecode(name)])
            return environ[name]
        except KeyError:
            return fallback

    out = path[:0]
    pos = 0
    end = len(path)
    # Whenever a delimited construct is entered, *path* is cut down to the
    # text after its opening delimiter and *pos* is re-based onto that tail.
    while pos < end:
        ch = path[pos:pos + 1]
        nxt = path[pos + 1:pos + 2]
        if ch == quote:   # no expansion within single quotes
            path = path[pos + 1:]
            end = len(path)
            pos = path.find(ch)
            if pos < 0:
                # Unterminated quote: copy the remainder verbatim.
                out += ch + path
                pos = end - 1
            else:
                out += ch + path[:pos + 1]
        elif ch == percent:  # variable or '%'
            if nxt == percent:
                out += ch
                pos += 1
            else:
                path = path[pos + 1:]
                end = len(path)
                pos = path.find(percent)
                if pos < 0:
                    out += percent + path
                    pos = end - 1
                else:
                    name = path[:pos]
                    out += lookup(name, percent + name + percent)
        elif ch == dollar:  # variable or '$$'
            if nxt == dollar:
                out += ch
                pos += 1
            elif nxt == brace:
                path = path[pos + 2:]
                end = len(path)
                pos = path.find(rbrace)
                if pos < 0:
                    out += dollar + brace + path
                    pos = end - 1
                else:
                    name = path[:pos]
                    out += lookup(name, dollar + brace + name + rbrace)
            else:
                # $name: consume the longest run of variable-name characters.
                name = path[:0]
                pos += 1
                ch = path[pos:pos + 1]
                while ch and ch in varchars:
                    name += ch
                    pos += 1
                    ch = path[pos:pos + 1]
                out += lookup(name, dollar + name)
                if ch:
                    # Step back so the terminating character is processed by
                    # the next iteration.
                    pos -= 1
        else:
            out += ch
        pos += 1
    return out
Guido van Rossum555915a1994-02-24 11:32:59 +0000444
445
# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A\B.
# Previously, this function also truncated pathnames to 8+3 format,
# but as this module is called "ntpath", that's obviously wrong!

def normpath(path):
    """Normalize path, eliminating double slashes, etc."""
    path = os.fspath(path)
    if isinstance(path, bytes):
        sep, altsep, curdir, pardir = b'\\', b'/', b'.', b'..'
        special_prefixes = (b'\\\\.\\', b'\\\\?\\')
    else:
        sep, altsep, curdir, pardir = '\\', '/', '.', '..'
        special_prefixes = ('\\\\.\\', '\\\\?\\')
    if path.startswith(special_prefixes):
        # in the case of paths with these prefixes:
        # \\.\ -> device names
        # \\?\ -> literal paths
        # do not do any normalization, but return the path
        # unchanged apart from the call to os.fspath()
        return path
    path = path.replace(altsep, sep)
    prefix, path = splitdrive(path)

    # collapse initial backslashes
    if path.startswith(sep):
        prefix += sep
        path = path.lstrip(sep)

    # Rebuild the component list, treating *kept* as a stack.
    kept = []
    for comp in path.split(sep):
        if not comp or comp == curdir:
            # Empty components (doubled separators) and '.' vanish.
            continue
        if comp == pardir:
            if kept and kept[-1] != pardir:
                # '..' cancels the preceding real component.
                kept.pop()
                continue
            if not kept and prefix.endswith(sep):
                # '..' directly under the root is dropped.
                continue
            # Otherwise this is a leading '..' of a relative path: keep it.
        kept.append(comp)
    # If the path is now empty, substitute '.'
    if not prefix and not kept:
        kept.append(curdir)
    return prefix + sep.join(kept)
Guido van Rossume294cf61999-01-29 18:05:18 +0000499
def _abspath_fallback(path):
    """Return the absolute version of a path as a fallback function in case
    `nt._getfullpathname` is not available or raises OSError. See bpo-31047 for
    more.

    """

    path = os.fspath(path)
    if isabs(path):
        return normpath(path)
    # Relative path: anchor it at the current directory, using the getcwd
    # flavour that matches the type of the input.
    cwd = os.getcwdb() if isinstance(path, bytes) else os.getcwd()
    return normpath(join(cwd, path))
Guido van Rossume294cf61999-01-29 18:05:18 +0000515
# Return an absolute path.
# abspath is bound at import time: to the pure-Python fallback when the nt
# module cannot supply _getfullpathname, otherwise to a wrapper around it.
try:
    from nt import _getfullpathname

except ImportError: # not running on Windows - mock up something sensible
    abspath = _abspath_fallback

else:  # use native Windows method on Windows
    def abspath(path):
        """Return the absolute version of a path."""
        try:
            return normpath(_getfullpathname(path))
        except (OSError, ValueError):
            # The native call rejected the path; compute the result from
            # the current directory instead.
            return _abspath_fallback(path)
Guido van Rossum83eeef42001-09-17 15:16:09 +0000530
try:
    from nt import _getfinalpathname, readlink as _nt_readlink
except ImportError:
    # realpath is a no-op on systems without _getfinalpathname support.
    realpath = abspath
else:
    def _readlink_deep(path):
        """Follow a chain of links starting at *path* and return where it ends.

        Stops, returning the path reached so far, when a link cycle is
        detected, when readlink fails with one of the tolerated Windows error
        codes, or when the reparse point is not a symlink.  Any other OSError
        propagates to the caller.
        """
        # These error codes indicate that we should stop reading links and
        # return the path we currently have.
        # 1: ERROR_INVALID_FUNCTION
        # 2: ERROR_FILE_NOT_FOUND
        # 3: ERROR_DIRECTORY_NOT_FOUND
        # 5: ERROR_ACCESS_DENIED
        # 21: ERROR_NOT_READY (implies drive with no media)
        # 32: ERROR_SHARING_VIOLATION (probably an NTFS paging file)
        # 50: ERROR_NOT_SUPPORTED (implies no support for reparse points)
        # 67: ERROR_BAD_NET_NAME (implies remote server unavailable)
        # 87: ERROR_INVALID_PARAMETER
        # 4390: ERROR_NOT_A_REPARSE_POINT
        # 4392: ERROR_INVALID_REPARSE_DATA
        # 4393: ERROR_REPARSE_TAG_INVALID
        allowed_winerror = 1, 2, 3, 5, 21, 32, 50, 67, 87, 4390, 4392, 4393

        # Case-normalized paths already visited; used to break link cycles.
        seen = set()
        while normcase(path) not in seen:
            seen.add(normcase(path))
            try:
                old_path = path
                path = _nt_readlink(path)
                # Links may be relative, so resolve them against their
                # own location
                if not isabs(path):
                    # If it's something other than a symlink, we don't know
                    # what it's actually going to be resolved against, so
                    # just return the old path.
                    if not islink(old_path):
                        path = old_path
                        break
                    path = normpath(join(dirname(old_path), path))
            except OSError as ex:
                if ex.winerror in allowed_winerror:
                    break
                raise
            except ValueError:
                # Stop on reparse points that are not symlinks
                break
        return path

    def _getfinalpathname_nonstrict(path):
        """Resolve as much of *path* as the OS can, and re-join the rest.

        Components are peeled off the end of *path* until the remaining head
        can be resolved (by _getfinalpathname or by following links manually);
        the peeled components are then appended unchanged.  The result has
        the same type (str or bytes) as *path*.  OSErrors whose winerror is
        not in the tolerated set propagate.
        """
        # These error codes indicate that we should stop resolving the path
        # and return the value we currently have.
        # 1: ERROR_INVALID_FUNCTION
        # 2: ERROR_FILE_NOT_FOUND
        # 3: ERROR_DIRECTORY_NOT_FOUND
        # 5: ERROR_ACCESS_DENIED
        # 21: ERROR_NOT_READY (implies drive with no media)
        # 32: ERROR_SHARING_VIOLATION (probably an NTFS paging file)
        # 50: ERROR_NOT_SUPPORTED
        # 67: ERROR_BAD_NET_NAME (implies remote server unavailable)
        # 87: ERROR_INVALID_PARAMETER
        # 123: ERROR_INVALID_NAME
        # 1920: ERROR_CANT_ACCESS_FILE
        # 1921: ERROR_CANT_RESOLVE_FILENAME (implies unfollowable symlink)
        allowed_winerror = 1, 2, 3, 5, 21, 32, 50, 67, 87, 123, 1920, 1921

        # Non-strict algorithm is to find as much of the target directory
        # as we can and join the rest.
        # The tail must start out as an empty value of the same type as the
        # path: a literal '' would make "path + tail" raise TypeError, and
        # "return tail" yield a str, whenever the path is bytes.
        tail = path[:0]
        while path:
            try:
                path = _getfinalpathname(path)
                return join(path, tail) if tail else path
            except OSError as ex:
                if ex.winerror not in allowed_winerror:
                    raise
                try:
                    # The OS could not resolve this path fully, so we attempt
                    # to follow the link ourselves. If we succeed, join the tail
                    # and return.
                    new_path = _readlink_deep(path)
                    if new_path != path:
                        return join(new_path, tail) if tail else new_path
                except OSError:
                    # If we fail to readlink(), let's keep traversing
                    pass
                path, name = split(path)
                # TODO (bpo-38186): Request the real file name from the directory
                # entry using FindFirstFileW. For now, we will return the path
                # as best we have it
                if path and not name:
                    # Nothing left to peel off (e.g. a bare root): give up
                    # and return what we have.
                    return path + tail
                tail = join(name, tail) if tail else name
        return tail

    def realpath(path):
        """Return the canonical version of *path*, resolving links.

        Paths that cannot be resolved completely are resolved as far as
        possible.  The \\\\?\\ prefix added by the OS is stripped again unless
        the caller supplied it or stripping it would change what the path
        refers to.
        """
        path = normpath(path)
        if isinstance(path, bytes):
            prefix = b'\\\\?\\'
            unc_prefix = b'\\\\?\\UNC\\'
            new_unc_prefix = b'\\\\'
            cwd = os.getcwdb()
            # bpo-38081: Special case for realpath(b'nul')
            if normcase(path) == normcase(os.fsencode(devnull)):
                return b'\\\\.\\NUL'
        else:
            prefix = '\\\\?\\'
            unc_prefix = '\\\\?\\UNC\\'
            new_unc_prefix = '\\\\'
            cwd = os.getcwd()
            # bpo-38081: Special case for realpath('nul')
            if normcase(path) == normcase(devnull):
                return '\\\\.\\NUL'
        had_prefix = path.startswith(prefix)
        if not had_prefix and not isabs(path):
            path = join(cwd, path)
        try:
            path = _getfinalpathname(path)
            initial_winerror = 0
        except OSError as ex:
            # Remember why strict resolution failed; it is compared with the
            # error of the prefix-stripping check below.
            initial_winerror = ex.winerror
            path = _getfinalpathname_nonstrict(path)
        # The path returned by _getfinalpathname will always start with \\?\ -
        # strip off that prefix unless it was already provided on the original
        # path.
        if not had_prefix and path.startswith(prefix):
            # For UNC paths, the prefix will actually be \\?\UNC\
            # Handle that case as well.
            if path.startswith(unc_prefix):
                spath = new_unc_prefix + path[len(unc_prefix):]
            else:
                spath = path[len(prefix):]
            # Ensure that the non-prefixed path resolves to the same path
            try:
                if _getfinalpathname(spath) == path:
                    path = spath
            except OSError as ex:
                # If the path does not exist and originally did not exist, then
                # strip the prefix anyway.
                if ex.winerror == initial_winerror:
                    path = spath
        return path
672
673
# Win9x family and earlier have no Unicode filename support.
# sys.getwindowsversion() is only looked up when the attribute exists;
# without it the flag is simply False.
supports_unicode_filenames = (
    sys.getwindowsversion()[3] >= 2
    if hasattr(sys, "getwindowsversion")
    else False
)
Guido van Rossumd8faa362007-04-27 19:54:29 +0000677
def relpath(path, start=None):
    """Return a relative version of *path*, computed against *start*.

    *start* defaults to the current directory ('.' or b'.', matching the
    type of *path*).  Both arguments are made absolute before comparison,
    and components are compared through normcase().

    Raises ValueError if *path* is empty or if *path* and *start* are on
    different drives.  When a TypeError, ValueError, AttributeError,
    BytesWarning or DeprecationWarning escapes the computation, the argument
    types are checked via genericpath._check_arg_types() before the original
    exception is re-raised.
    """
    path = os.fspath(path)
    if isinstance(path, bytes):
        sep, curdir, pardir = b'\\', b'.', b'..'
    else:
        sep, curdir, pardir = '\\', '.', '..'

    if start is None:
        start = curdir

    if not path:
        raise ValueError("no path specified")

    start = os.fspath(start)
    try:
        abs_start = abspath(normpath(start))
        abs_path = abspath(normpath(path))
        start_drive, start_rest = splitdrive(abs_start)
        path_drive, path_rest = splitdrive(abs_path)
        if normcase(start_drive) != normcase(path_drive):
            raise ValueError("path is on mount %r, start on mount %r" % (
                path_drive, start_drive))

        # Drop the empty strings produced by leading/repeated separators.
        start_parts = list(filter(None, start_rest.split(sep)))
        path_parts = list(filter(None, path_rest.split(sep)))

        # Work out how much of the filepath is shared by start and path.
        limit = min(len(start_parts), len(path_parts))
        shared = 0
        while (shared < limit and
               normcase(start_parts[shared]) == normcase(path_parts[shared])):
            shared += 1

        # Climb out of the unshared part of start, then descend into path.
        climb = [pardir] * (len(start_parts) - shared)
        rel_parts = climb + path_parts[shared:]
        return join(*rel_parts) if rel_parts else curdir
    except (TypeError, ValueError, AttributeError, BytesWarning, DeprecationWarning):
        genericpath._check_arg_types('relpath', path, start)
        raise
Brian Curtind40e6f72010-07-08 21:39:08 +0000722
723
Serhiy Storchaka38220932015-03-31 15:31:53 +0300724# Return the longest common sub-path of the sequence of paths given as input.
725# The function is case-insensitive and 'separator-insensitive', i.e. if the
726# only difference between two paths is the use of '\' versus '/' as separator,
727# they are deemed to be equal.
728#
729# However, the returned path will have the standard '\' separator (even if the
730# given paths had the alternative '/' separator) and will have the case of the
731# first path given in the sequence. Additionally, any trailing separator is
732# stripped from the returned path.
733
def commonpath(paths):
    """Given an iterable of path names, returns the longest common sub-path.

    Comparison is case-insensitive and treats '/' and '\\' as the same
    separator.  The result uses '\\' as separator, keeps the case of the
    first path given, and has no trailing separator.

    Raises ValueError if *paths* is empty (including an empty or exhausted
    one-shot iterable), if absolute and relative paths are mixed, or if the
    paths are not all on the same drive.  On TypeError or AttributeError the
    argument types are checked via genericpath._check_arg_types() before
    the original exception is re-raised.
    """

    # Materialize before testing for emptiness: an iterator or generator is
    # always truthy, so checking only the raw argument would let an empty
    # one through and fail later with IndexError on paths[0].  Falsy
    # arguments (empty list, None, ...) are still reported as ValueError.
    paths = tuple(map(os.fspath, paths)) if paths else ()
    if not paths:
        raise ValueError('commonpath() arg is an empty sequence')

    if isinstance(paths[0], bytes):
        sep = b'\\'
        altsep = b'/'
        curdir = b'.'
    else:
        sep = '\\'
        altsep = '/'
        curdir = '.'

    try:
        # Lower-cased, separator-normalized (drive, rest) pairs are used for
        # comparison only; the returned text comes from paths[0] below.
        drivesplits = [splitdrive(p.replace(altsep, sep).lower()) for p in paths]
        split_paths = [p.split(sep) for d, p in drivesplits]

        # The set has exactly one element only if every path agrees on
        # being absolute or relative; otherwise the unpacking fails.
        try:
            is_absolute, = {p[:1] == sep for d, p in drivesplits}
        except ValueError:
            raise ValueError("Can't mix absolute and relative paths") from None

        # Check that all drive letters or UNC paths match. The check is made only
        # now otherwise type errors for mixing strings and bytes would not be
        # caught.
        if len({d for d, p in drivesplits}) != 1:
            raise ValueError("Paths don't have the same drive")

        drive, path = splitdrive(paths[0].replace(altsep, sep))
        common = [c for c in path.split(sep) if c and c != curdir]

        split_paths = [[c for c in s if c and c != curdir] for s in split_paths]
        # The common prefix of the lexicographically smallest and largest
        # component lists is the common prefix of all of them.
        s1 = min(split_paths)
        s2 = max(split_paths)
        for i, c in enumerate(s1):
            if c != s2[i]:
                common = common[:i]
                break
        else:
            common = common[:len(s1)]

        prefix = drive + sep if is_absolute else drive
        return prefix + sep.join(common)
    except (TypeError, AttributeError):
        genericpath._check_arg_types('commonpath', *paths)
        raise
783 raise
784
785
Brian Curtin9c669cc2011-06-08 18:17:18 -0500786try:
787 # The genericpath.isdir implementation uses os.stat and checks the mode
788 # attribute to tell whether or not the path is a directory.
789 # This is overkill on Windows - just pass the path to GetFileAttributes
790 # and check the attribute from there.
Brian Curtin95d028f2011-06-09 09:10:38 -0500791 from nt import _isdir as isdir
Brett Cannoncd171c82013-07-04 17:43:24 -0400792except ImportError:
Brian Curtin95d028f2011-06-09 09:10:38 -0500793 # Use genericpath.isdir as imported above.
794 pass