blob: 661d8dbb76c5637fdb70266c5498b3af28fd72ed [file] [log] [blame]
"""Common operations on Posix pathnames.

Instead of importing this module directly, import os and refer to
this module as os.path.  The "os.path" name is an alias for this
module on Posix systems; on other systems (e.g. Mac, Windows),
os.path provides the same operations in a manner specific to that
platform, and is an alias to another module (e.g. macpath, ntpath).

Some of this can actually be useful on non-Posix systems too, e.g.
for manipulation of the pathname component of URLs.
"""
Guido van Rossumc6360141990-10-13 19:23:40 +000012
Guido van Rossumd3876d31996-07-23 03:47:28 +000013import os
Guido van Rossum40d93041990-10-21 16:17:34 +000014import stat
Martin v. Löwis05c075d2007-03-07 11:04:33 +000015import genericpath
Jack Diederich7b604642006-08-26 18:42:06 +000016from genericpath import *
Guido van Rossumc6360141990-10-13 19:23:40 +000017
# Public API of this module.  Several of these names (commonprefix, exists,
# getsize, getmtime, getatime, getctime, isdir, isfile) are not defined here;
# they arrive through "from genericpath import *".
__all__ = [
    "normcase", "isabs", "join", "splitdrive", "split", "splitext",
    "basename", "dirname", "commonprefix",
    "getsize", "getmtime", "getatime", "getctime",
    "islink", "exists", "lexists", "isdir", "isfile", "ismount",
    "walk", "expanduser", "expandvars", "normpath", "abspath",
    "samefile", "sameopenfile", "samestat",
    "curdir", "pardir", "sep", "pathsep", "defpath", "altsep", "extsep",
    "devnull", "realpath", "supports_unicode_filenames",
]
Guido van Rossumc6360141990-10-13 19:23:40 +000025
# Strings representing various path-related bits and pieces.
curdir = '.'                 # name of the current directory
pardir = '..'                # name of the parent directory
extsep = '.'                 # separator between base name and extension
sep = '/'                    # separator between pathname components
pathsep = ':'                # separator between entries of a search path
defpath = ':/bin:/usr/bin'   # default search path for executables
altsep = None                # Posix has no alternative component separator
devnull = '/dev/null'        # path of the null device
Skip Montanaro117910d2003-02-14 19:35:31 +000035
# Normalize the case of a pathname.  Trivial in Posix, string.lower on Mac.
# On MS-DOS this may also turn slashes into backslashes; however, other
# normalizations (such as optimizing '../' away) are not allowed
# (another function should be defined to do that).
40
def normcase(s):
    """Return the pathname *s* unchanged.

    Case is significant on Posix, so there is nothing to normalize."""
    return s
Guido van Rossum7ac48781992-01-14 18:29:32 +000044
45
Jeremy Hyltona05e2932000-06-28 14:48:01 +000046# Return whether a path is absolute.
Guido van Rossum7ac48781992-01-14 18:29:32 +000047# Trivial in Posix, harder on the Mac or MS-DOS.
48
def isabs(s):
    """Return True if the pathname *s* begins with a slash."""
    has_leading_slash = s.startswith('/')
    return has_leading_slash
Guido van Rossum7ac48781992-01-14 18:29:32 +000052
53
Barry Warsaw384d2491997-02-18 21:53:25 +000054# Join pathnames.
55# Ignore the previous parts if a part is absolute.
Guido van Rossum4d0fdc31991-08-16 13:27:58 +000056# Insert a '/' unless the first part is empty or already ends in '/'.
Guido van Rossum7ac48781992-01-14 18:29:32 +000057
def join(a, *p):
    """Join pathname components, inserting '/' where needed.

    A component that starts with '/' is absolute and discards everything
    joined before it.  No separator is inserted after an empty result or
    after one that already ends in '/'."""
    result = a
    for part in p:
        if part.startswith('/'):
            # Absolute component: start over from here.
            result = part
            continue
        if result and not result.endswith('/'):
            result += '/'
        result += part
    return result
Guido van Rossumc6360141990-10-13 19:23:40 +000069
70
# Split a path into head (everything up to the last '/') and tail (the
# rest).  If the path ends in '/', tail will be empty.  If there is no
# '/' in the path, head will be empty.
# Trailing '/'es are stripped from head unless it is the root.
Guido van Rossum7ac48781992-01-14 18:29:32 +000075
def split(p):
    """Split the pathname *p* into a "(head, tail)" tuple.

    tail is everything after the final slash and head is everything before
    it; either part may be empty.  Trailing slashes are removed from head
    unless head consists only of slashes (i.e. it is the root)."""
    cut = p.rfind('/') + 1
    head = p[:cut]
    tail = p[cut:]
    trimmed = head.rstrip('/')
    if trimmed:
        # head held something besides slashes, so drop the trailing ones.
        head = trimmed
    return head, tail
Guido van Rossumc6360141990-10-13 19:23:40 +000084
85
# Split a path into root and extension.
# The extension is everything starting at the last dot in the last
# pathname component; the root is everything before that.
# It is always true that root + ext == p.
90
def splitext(p):
    # Delegate to the shared implementation, passing this module's
    # separator settings.
    root_and_ext = genericpath._splitext(p, sep, altsep, extsep)
    return root_and_ext
# Reuse the docstring of the shared implementation.
splitext.__doc__ = genericpath._splitext.__doc__
Guido van Rossum4d0fdc31991-08-16 13:27:58 +000094
Guido van Rossum221df241995-08-07 20:17:55 +000095# Split a pathname into a drive specification and the rest of the
96# path. Useful on DOS/Windows/NT; on Unix, the drive is always empty.
97
def splitdrive(p):
    """Split the pathname *p* into a "(drive, path)" tuple.

    Posix has no drive specifications, so drive is always the empty string
    and path is *p* itself."""
    drive = ''
    return drive, p
Guido van Rossum221df241995-08-07 20:17:55 +0000102
103
Georg Brandl65ad0432006-10-12 13:08:16 +0000104# Return the tail (basename) part of a path, same as split(path)[1].
Guido van Rossum7ac48781992-01-14 18:29:32 +0000105
def basename(p):
    """Return the final component of the pathname *p*.

    This is everything after the last slash, and is empty when *p* ends in
    a slash."""
    tail_start = p.rfind('/') + 1
    tail = p[tail_start:]
    return tail
Guido van Rossumc6360141990-10-13 19:23:40 +0000110
111
Georg Brandl65ad0432006-10-12 13:08:16 +0000112# Return the head (dirname) part of a path, same as split(path)[0].
Guido van Rossumc629d341992-11-05 10:43:02 +0000113
def dirname(p):
    """Return the directory component of the pathname *p*.

    This is everything up to the last slash, with trailing slashes removed
    unless the result consists only of slashes (i.e. it is the root)."""
    head = p[:p.rfind('/') + 1]
    trimmed = head.rstrip('/')
    if trimmed:
        # head held something besides slashes, so drop the trailing ones.
        return trimmed
    return head
Guido van Rossumc629d341992-11-05 10:43:02 +0000121
122
Guido van Rossum7ac48781992-01-14 18:29:32 +0000123# Is a path a symbolic link?
Guido van Rossumd3876d31996-07-23 03:47:28 +0000124# This will always return false on systems where os.lstat doesn't exist.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000125
def islink(path):
    """Return True if *path* is a symbolic link.

    Returns False when the path cannot be examined, or when os.lstat is
    not available on this platform."""
    try:
        info = os.lstat(path)
    except (os.error, AttributeError):
        is_link = False
    else:
        is_link = stat.S_ISLNK(info.st_mode)
    return is_link
Guido van Rossum7ac48781992-01-14 18:29:32 +0000133
Johannes Gijsbersae882f72004-08-30 10:19:56 +0000134# Being true for dangling symbolic links is also useful.
135
def lexists(path):
    """Return True if *path* exists, including broken symbolic links.

    The check uses os.lstat, so a dangling link still counts as existing."""
    try:
        os.lstat(path)
    except os.error:
        found = False
    else:
        found = True
    return found
143
144
Guido van Rossumd3778f91991-11-12 15:37:40 +0000145# Are two filenames really pointing to the same file?
Guido van Rossum7ac48781992-01-14 18:29:32 +0000146
def samefile(f1, f2):
    """Return True if the pathnames *f1* and *f2* refer to the same file.

    Both paths are examined with os.stat, so an error from os.stat
    propagates to the caller."""
    first = os.stat(f1)
    second = os.stat(f2)
    return samestat(first, second)
Guido van Rossumd3778f91991-11-12 15:37:40 +0000152
153
154# Are two open files really referencing the same file?
155# (Not necessarily the same file descriptor!)
Guido van Rossum7ac48781992-01-14 18:29:32 +0000156
def sameopenfile(fp1, fp2):
    """Return True if *fp1* and *fp2* refer to the same file.

    Both arguments are passed to os.fstat; they need not be the same
    descriptor to compare equal."""
    first = os.fstat(fp1)
    second = os.fstat(fp2)
    return samestat(first, second)
Guido van Rossumd3778f91991-11-12 15:37:40 +0000162
163
164# Are two stat buffers (obtained from stat, fstat or lstat)
165# describing the same file?
Guido van Rossum7ac48781992-01-14 18:29:32 +0000166
def samestat(s1, s2):
    """Return True if the stat buffers *s1* and *s2* describe the same file.

    Two buffers match when both the i-node number and the device agree."""
    identity1 = (s1.st_ino, s1.st_dev)
    identity2 = (s2.st_ino, s2.st_dev)
    return identity1 == identity2
Guido van Rossumc6360141990-10-13 19:23:40 +0000171
172
173# Is a path a mount point?
Guido van Rossumd3876d31996-07-23 03:47:28 +0000174# (Does this work for all UNIXes? Is it even guaranteed to work by Posix?)
Guido van Rossum7ac48781992-01-14 18:29:32 +0000175
def ismount(path):
    """Return True if *path* is a mount point.

    A path is a mount point when its parent, path/.., is on a different
    device, or when path and path/.. are the same i-node (as for the root).
    Returns False when the path or its parent cannot be examined, and for
    symbolic links."""
    try:
        s1 = os.lstat(path)
    except os.error:
        return False        # It doesn't exist -- so not a mount point :-)
    if stat.S_ISLNK(s1.st_mode):
        # A symlink can never be a mount point.  Without this check a link
        # pointing at a mount point (e.g. a link to '/') would be reported
        # as one, because the checks below would examine its target.
        return False
    try:
        s2 = os.lstat(join(path, '..'))
    except os.error:
        return False
    if s1.st_dev != s2.st_dev:
        return True         # path/.. is on a different device than path
    # path/.. being the same i-node as path means path is the root.
    return s1.st_ino == s2.st_ino
Guido van Rossumc6360141990-10-13 19:23:40 +0000192
193
# Directory tree walk.
# For each directory under top (including top itself, but excluding
# '.' and '..'), func(arg, dirname, filenames) is called, where
# dirname is the name of the directory and filenames is the list
# of files (and subdirectories etc.) in the directory.
# The func may modify the filenames list, to implement a filter,
# or to impose a different order of visiting.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000201
def walk(top, func, arg):
    """Walk a directory tree, calling a function for every directory.

    For each directory in the tree rooted at top (including top itself),
    call func(arg, dirname, fnames).  dirname is the name of the directory
    and fnames is the list of names returned by os.listdir for it.  func
    may modify fnames in place (e.g. via del or slice assignment); walk
    only recurses into the subdirectories whose names remain in the list,
    so this can implement a filter or impose a visiting order.  arg is
    passed through to func untouched; passing None is common.

    Directories that cannot be listed and entries that cannot be examined
    are skipped.  Symbolic links to directories are not followed."""
    try:
        entries = os.listdir(top)
    except os.error:
        return
    func(arg, top, entries)
    # Iterate the same list object func received, so that its in-place
    # edits control which subdirectories are visited.
    for entry in entries:
        child = join(top, entry)
        try:
            mode = os.lstat(child).st_mode
        except os.error:
            continue
        if stat.S_ISDIR(mode):
            walk(child, func, arg)
Guido van Rossum7ac48781992-01-14 18:29:32 +0000230
231
# Expand paths beginning with '~' or '~user'.
# '~' means $HOME; '~user' means that user's home directory.
# If the path doesn't begin with '~', or if the user or $HOME is unknown,
# the path is returned unchanged (leaving error reporting to whatever
# function is called with the expanded path as argument).
# See also module 'glob' for expansion of *, ? and [...] in pathnames.
# (A function should also be defined to do full *sh-style environment
# variable expansion.)
240
def expanduser(path):
    """Expand an initial ~ or ~user in *path*.

    '~' is replaced by $HOME, or by the current user's home directory from
    the password database when HOME is not set.  '~user' is replaced by
    that user's home directory.  If the path does not start with '~', or
    the home directory cannot be determined, the path is returned
    unchanged."""
    if not path.startswith('~'):
        return path
    # i marks the end of the "~" or "~user" prefix.
    i = path.find('/', 1)
    if i < 0:
        i = len(path)
    if i == 1:
        if 'HOME' in os.environ:
            userhome = os.environ['HOME']
        else:
            import pwd
            try:
                userhome = pwd.getpwuid(os.getuid()).pw_dir
            except KeyError:
                # The current uid has no password database entry.
                return path
    else:
        import pwd
        try:
            pwent = pwd.getpwnam(path[1:i])
        except KeyError:
            return path
        userhome = pwent.pw_dir
    userhome = userhome.rstrip('/')
    # A home directory of '/' strips to '', so a bare '~' would expand to
    # the empty string; fall back to the root in that case.
    return (userhome + path[i:]) or '/'
Guido van Rossum4732ccf1992-08-09 13:54:50 +0000264
265
# Expand paths containing shell variable substitutions.
# This expands the forms $variable and ${variable} only.
# Non-existent variables are left unchanged.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000269
# Compiled pattern for $var / ${var}; built on the first call that needs it.
_varprog = None

def expandvars(path):
    """Expand shell variables of the forms $var and ${var} in *path*.

    Values are taken from os.environ.  References to unknown variables
    are left unchanged, and substituted values are not expanded again."""
    global _varprog
    if '$' not in path:
        return path
    if not _varprog:
        import re
        _varprog = re.compile(r'\$(\w+|\{[^}]*\})')
    pos = 0
    match = _varprog.search(path, pos)
    while match:
        start, end = match.span(0)
        var = match.group(1)
        if var.startswith('{') and var.endswith('}'):
            var = var[1:-1]
        if var in os.environ:
            rest = path[end:]
            path = path[:start] + os.environ[var]
            # Resume after the inserted value so it is not rescanned.
            pos = len(path)
            path += rest
        else:
            pos = end
        match = _varprog.search(path, pos)
    return path
Guido van Rossumc629d341992-11-05 10:43:02 +0000298
299
# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A/B.
# It should be understood that this may change the meaning of the path
# if it contains symbolic links!
303
def normpath(path):
    """Normalize *path*: collapse repeated slashes and resolve '.' and '..'.

    An empty path, or one that normalizes to nothing, becomes '.'.  The
    result is computed purely from the string; the filesystem is not
    consulted."""
    if path == '':
        return '.'
    # POSIX allows one or two initial slashes, but treats three or more
    # as a single slash.
    if not path.startswith('/'):
        lead = 0
    elif path.startswith('//') and not path.startswith('///'):
        lead = 2
    else:
        lead = 1
    kept = []
    for piece in path.split('/'):
        if piece == '' or piece == '.':
            continue
        if piece == '..':
            if kept and kept[-1] != '..':
                # '..' cancels the preceding real component.
                kept.pop()
                continue
            if lead and not kept:
                # '..' directly under the root stays at the root.
                continue
        kept.append(piece)
    return ('/' * lead + '/'.join(kept)) or '.'
Guido van Rossume294cf61999-01-29 18:05:18 +0000329
330
def abspath(path):
    """Return a normalized, absolute version of *path*.

    A relative path is joined onto the current working directory before
    it is normalized."""
    if isabs(path):
        return normpath(path)
    return normpath(join(os.getcwd(), path))
Guido van Rossum83eeef42001-09-17 15:16:09 +0000336
337
338# Return a canonical path (i.e. the absolute location of a file on the
339# filesystem).
340
def realpath(filename):
    """Return the canonical path of *filename*, eliminating any symbolic
    links encountered in the path."""
    parts = filename.split('/')
    if isabs(filename):
        # The split leaves an empty first element; make it the root.
        parts[0] = '/'
    else:
        parts.insert(0, '')

    # Test each successively longer prefix of the path for being a link.
    for end in range(2, len(parts) + 1):
        prefix = join(*parts[:end])
        if not islink(prefix):
            continue
        remainder = parts[end:]
        target = _resolve_link(prefix)
        if target is None:
            # Infinite loop -- return original component + rest of the path
            return abspath(join(prefix, *remainder))
        # Start over on the path with the link replaced by its target.
        return realpath(join(target, *remainder))

    return abspath(filename)
Johannes Gijsbers4ec40642004-08-14 15:01:53 +0000361 return abspath(filename)
Tim Petersa45cacf2004-08-20 03:47:14 +0000362
Brett Cannonf50299c2004-07-10 22:55:15 +0000363
def _resolve_link(path):
    """Internal helper: follow the chain of symlinks starting at *path*.

    Returns the first path reached that is not a symlink, or None if a
    path is encountered twice (meaning that there's a loop)."""
    visited = []
    while islink(path):
        if path in visited:
            # Already seen this path, so we must have a symlink loop
            return None
        visited.append(path)
        # Resolve where the link points to
        target = os.readlink(path)
        if isabs(target):
            path = normpath(target)
        else:
            # A relative target is relative to the link's own directory.
            path = normpath(join(dirname(path), target))
    return path
383
# Flag advertised to callers: this module reports no support for
# arbitrary Unicode strings as file names.
supports_unicode_filenames = False