blob: cceb2d2be71e9b669d39b0710dacb5120d3cfd19 [file] [log] [blame]
Guido van Rossum54f22ed2000-02-04 15:10:34 +00001"""Common operations on Posix pathnames.
2
3Instead of importing this module directly, import os and refer to
4this module as os.path. The "os.path" name is an alias for this
5module on Posix systems; on other systems (e.g. Mac, Windows),
6os.path provides the same operations in a manner specific to that
7platform, and is an alias to another module (e.g. macpath, ntpath).
8
9Some of this can actually be useful on non-Posix systems too, e.g.
10for manipulation of the pathname component of URLs.
Guido van Rossum346f7af1997-12-05 19:04:51 +000011"""
Guido van Rossumc6360141990-10-13 19:23:40 +000012
Guido van Rossumd3876d31996-07-23 03:47:28 +000013import os
Guido van Rossum40d93041990-10-21 16:17:34 +000014import stat
Guido van Rossumc6360141990-10-13 19:23:40 +000015
# Names exported by "from posixpath import *".  realpath is part of the
# public interface defined in this module, so it is listed as well.
__all__ = ["normcase","isabs","join","splitdrive","split","splitext",
           "basename","dirname","commonprefix","getsize","getmtime",
           "getatime","islink","exists","isdir","isfile","ismount",
           "walk","expanduser","expandvars","normpath","abspath",
           "samefile","sameopenfile","samestat","realpath"]
Guido van Rossumc6360141990-10-13 19:23:40 +000021
Guido van Rossum7ac48781992-01-14 18:29:32 +000022# Normalize the case of a pathname. Trivial in Posix, string.lower on Mac.
23# On MS-DOS this may also turn slashes into backslashes; however, other
24# normalizations (such as optimizing '../' away) are not allowed
25# (another function should be defined to do that).
26
def normcase(s):
    """Normalize the case of a pathname.

    Posix needs no case normalization, so the argument is handed back
    exactly as it was received.
    """
    return s
Guido van Rossum7ac48781992-01-14 18:29:32 +000030
31
Jeremy Hyltona05e2932000-06-28 14:48:01 +000032# Return whether a path is absolute.
Guido van Rossum7ac48781992-01-14 18:29:32 +000033# Trivial in Posix, harder on the Mac or MS-DOS.
34
def isabs(s):
    """Return true if the pathname is absolute, i.e. begins with a slash."""
    # Slicing (rather than indexing) keeps the empty string safe.
    leading = s[:1]
    return leading == '/'
Guido van Rossum7ac48781992-01-14 18:29:32 +000038
39
Barry Warsaw384d2491997-02-18 21:53:25 +000040# Join pathnames.
41# Ignore the previous parts if a part is absolute.
Guido van Rossum4d0fdc31991-08-16 13:27:58 +000042# Insert a '/' unless the first part is empty or already ends in '/'.
Guido van Rossum7ac48781992-01-14 18:29:32 +000043
def join(a, *p):
    """Join one or more pathname components with '/' separators.

    A component that starts with '/' is absolute and discards everything
    accumulated before it.  Otherwise a single '/' is inserted between
    the accumulated path and the component, unless the accumulated path
    is empty or already ends in '/'.
    """
    result = a
    for part in p:
        if part[:1] == '/':
            # Absolute component: start over from here.
            result = part
            continue
        needs_sep = result != '' and result[-1:] != '/'
        if needs_sep:
            result = result + '/'
        result = result + part
    return result
Guido van Rossumc6360141990-10-13 19:23:40 +000055
56
Guido van Rossum26847381992-03-31 18:54:35 +000057# Split a path in head (everything up to the last '/') and tail (the
Guido van Rossuma89b1ba1995-09-01 20:32:21 +000058# rest). If the path ends in '/', tail will be empty. If there is no
59# '/' in the path, head will be empty.
60# Trailing '/'es are stripped from head unless it is the root.
Guido van Rossum7ac48781992-01-14 18:29:32 +000061
def split(p):
    """Split a pathname into a "(head, tail)" tuple.

    tail is everything after the final slash and never contains a slash;
    head is everything before it.  Trailing slashes are removed from head
    unless head consists only of slashes (the root).  Either part may be
    empty.
    """
    cut = p.rfind('/') + 1
    head = p[:cut]
    tail = p[cut:]
    # An empty result from rstrip means head was empty or all slashes;
    # in both cases head must be kept untouched.
    trimmed = head.rstrip('/')
    if trimmed:
        head = trimmed
    return head, tail
Guido van Rossumc6360141990-10-13 19:23:40 +000071
72
Guido van Rossum4d0fdc31991-08-16 13:27:58 +000073# Split a path in root and extension.
Guido van Rossum422869a1996-08-20 20:24:17 +000074# The extension is everything starting at the last dot in the last
Guido van Rossum4d0fdc31991-08-16 13:27:58 +000075# pathname component; the root is everything before that.
Guido van Rossum7ac48781992-01-14 18:29:32 +000076# It is always true that root + ext == p.
77
def splitext(p):
    """Split the extension from a pathname.

    Returns "(root, ext)" such that root + ext == p.  ext starts at the
    last dot of the last pathname component and runs to the end of p; it
    is empty when that component contains no dot.  A dot that leads the
    last component counts as the start of an extension.  Either part may
    be empty.
    """
    dot = p.rfind('.')
    # A dot only counts when it lies after the last slash, i.e. inside
    # the final component.  This also covers "no dot at all" (dot == -1).
    if dot <= p.rfind('/'):
        return p, ''
    return p[:dot], p[dot:]
Guido van Rossum4d0fdc31991-08-16 13:27:58 +000095
96
Guido van Rossum221df241995-08-07 20:17:55 +000097# Split a pathname into a drive specification and the rest of the
98# path. Useful on DOS/Windows/NT; on Unix, the drive is always empty.
99
def splitdrive(p):
    """Split a pathname into a "(drive, path)" tuple.

    Posix pathnames carry no drive specification, so drive is always the
    empty string and path is p itself.
    """
    drive = ''
    return drive, p
Guido van Rossum221df241995-08-07 20:17:55 +0000104
105
Guido van Rossumc6360141990-10-13 19:23:40 +0000106# Return the tail (basename) part of a path.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000107
def basename(p):
    """Return the final component of a pathname.

    This is whatever follows the last slash, which is the same value as
    the tail produced by split(p).  It is empty when p ends in a slash.
    """
    cut = p.rfind('/') + 1
    return p[cut:]
Guido van Rossumc6360141990-10-13 19:23:40 +0000111
112
Guido van Rossumc629d341992-11-05 10:43:02 +0000113# Return the head (dirname) part of a path.
114
def dirname(p):
    """Return the directory component of a pathname.

    This is the same value as the head produced by split(p): everything
    up to the last slash, with trailing slashes removed unless the result
    consists only of slashes.  It is empty when p contains no slash.
    """
    cut = p.rfind('/') + 1
    head = p[:cut]
    # rstrip yields '' when head is empty or all slashes; keep head then.
    trimmed = head.rstrip('/')
    if trimmed:
        return trimmed
    return head
Guido van Rossumc629d341992-11-05 10:43:02 +0000118
119
Guido van Rossumc6360141990-10-13 19:23:40 +0000120# Return the longest prefix of all list elements.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000121
def commonprefix(m):
    """Return the longest prefix shared by every item of the list m.

    The comparison is done element by element (character by character
    for strings), not per pathname component, so the result need not end
    on a '/' boundary.  An empty list, or items that share no leading
    element, give ''.
    """
    if not m:
        return ''
    prefix = m[0]
    for item in m:
        # Count how many leading elements prefix and item agree on.
        limit = min(len(prefix), len(item))
        k = 0
        while k < limit and prefix[k] == item[k]:
            k += 1
        if k < len(prefix):
            if k == 0:
                # Nothing in common; no later item can change that.
                return ''
            prefix = prefix[:k]
    return prefix
Guido van Rossumc6360141990-10-13 19:23:40 +0000133
134
Guido van Rossum2bc1f8f1998-07-24 20:49:26 +0000135# Get size, mtime, atime of files.
136
def getsize(filename):
    """Return the size of a file, taken from the ST_SIZE field of os.stat().

    Any error raised by os.stat() propagates to the caller.
    """
    return os.stat(filename)[stat.ST_SIZE]
141
def getmtime(filename):
    """Return the last modification time of a file (ST_MTIME of os.stat()).

    Any error raised by os.stat() propagates to the caller.
    """
    return os.stat(filename)[stat.ST_MTIME]
146
def getatime(filename):
    """Return the last access time of a file (ST_ATIME of os.stat()).

    Any error raised by os.stat() propagates to the caller.
    """
    return os.stat(filename)[stat.ST_ATIME]
Guido van Rossum2bc1f8f1998-07-24 20:49:26 +0000151
152
Guido van Rossum7ac48781992-01-14 18:29:32 +0000153# Is a path a symbolic link?
Guido van Rossumd3876d31996-07-23 03:47:28 +0000154# This will always return false on systems where os.lstat doesn't exist.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000155
def islink(path):
    """Test whether a path is a symbolic link.

    Uses os.lstat(), so the link itself is examined rather than its
    target.  Returns False when the path cannot be examined or when
    os.lstat is not available on this platform.
    """
    try:
        st = os.lstat(path)
    except (os.error, AttributeError):
        # AttributeError covers platforms whose os module lacks lstat.
        return False
    return stat.S_ISLNK(st[stat.ST_MODE])
Guido van Rossum7ac48781992-01-14 18:29:32 +0000163
164
165# Does a path exist?
166# This is false for dangling symbolic links.
167
def exists(path):
    """Test whether a path exists.

    The check is whether os.stat() succeeds, which follows symbolic
    links, so a broken symbolic link is reported as False.
    """
    try:
        os.stat(path)
    except os.error:
        return False
    else:
        return True
Guido van Rossumc6360141990-10-13 19:23:40 +0000175
176
Guido van Rossumd3876d31996-07-23 03:47:28 +0000177# Is a path a directory?
Guido van Rossum7ac48781992-01-14 18:29:32 +0000178# This follows symbolic links, so both islink() and isdir() can be true
179# for the same path.
180
def isdir(path):
    """Test whether a path is a directory.

    Uses os.stat(), which follows symbolic links, so a link pointing at
    a directory also counts.  Returns False when the path cannot be
    examined (for example because it does not exist).
    """
    try:
        st = os.stat(path)
    except os.error:
        return False
    return stat.S_ISDIR(st[stat.ST_MODE])
Guido van Rossumc6360141990-10-13 19:23:40 +0000188
189
Guido van Rossum26847381992-03-31 18:54:35 +0000190# Is a path a regular file?
Guido van Rossumb6775db1994-08-01 11:34:53 +0000191# This follows symbolic links, so both islink() and isfile() can be true
Guido van Rossum7ac48781992-01-14 18:29:32 +0000192# for the same path.
193
def isfile(path):
    """Test whether a path is a regular file.

    Uses os.stat(), which follows symbolic links, so a link pointing at
    a regular file also counts.  Returns False when the path cannot be
    examined (for example because it does not exist).
    """
    try:
        st = os.stat(path)
    except os.error:
        return False
    return stat.S_ISREG(st[stat.ST_MODE])
Guido van Rossumc6360141990-10-13 19:23:40 +0000201
202
Guido van Rossumd3778f91991-11-12 15:37:40 +0000203# Are two filenames really pointing to the same file?
Guido van Rossum7ac48781992-01-14 18:29:32 +0000204
def samefile(f1, f2):
    """Test whether two pathnames refer to the same actual file.

    Both paths are examined with os.stat() and the results compared with
    samestat().  Errors from os.stat() propagate to the caller.
    """
    return samestat(os.stat(f1), os.stat(f2))
Guido van Rossumd3778f91991-11-12 15:37:40 +0000210
211
212# Are two open files really referencing the same file?
213# (Not necessarily the same file descriptor!)
Guido van Rossum7ac48781992-01-14 18:29:32 +0000214
def sameopenfile(fp1, fp2):
    """Test whether two open files refer to the same actual file.

    Both arguments are handed straight to os.fstat() and the results
    compared with samestat().
    NOTE(review): os.fstat() is documented to take file descriptors, so
    fp1 and fp2 are presumably descriptors rather than file objects --
    confirm against callers.
    """
    return samestat(os.fstat(fp1), os.fstat(fp2))
Guido van Rossumd3778f91991-11-12 15:37:40 +0000220
221
222# Are two stat buffers (obtained from stat, fstat or lstat)
223# describing the same file?
Guido van Rossum7ac48781992-01-14 18:29:32 +0000224
def samestat(s1, s2):
    """Test whether two stat buffers describe the same file.

    Two buffers (as returned by stat, fstat or lstat) match when both
    their i-node numbers and their device numbers are equal.
    """
    if s1[stat.ST_INO] != s2[stat.ST_INO]:
        return False
    return s1[stat.ST_DEV] == s2[stat.ST_DEV]
Guido van Rossumc6360141990-10-13 19:23:40 +0000229
230
231# Is a path a mount point?
Guido van Rossumd3876d31996-07-23 03:47:28 +0000232# (Does this work for all UNIXes? Is it even guaranteed to work by Posix?)
Guido van Rossum7ac48781992-01-14 18:29:32 +0000233
def ismount(path):
    """Test whether a path is a mount point.

    path is compared with its parent "path/..": it is taken to be a mount
    point when the two live on different devices, or when they are the
    very same i-node on the same device.  Returns False when either of
    them cannot be examined.
    """
    try:
        here = os.stat(path)
        parent = os.stat(join(path, '..'))
    except os.error:
        # It doesn't exist -- so not a mount point.
        return False
    if here[stat.ST_DEV] != parent[stat.ST_DEV]:
        # path/.. is on a different device than path.
        return True
    # Same device: a mount point only if path/.. is the same i-node.
    return here[stat.ST_INO] == parent[stat.ST_INO]
Guido van Rossumc6360141990-10-13 19:23:40 +0000250
251
252# Directory tree walk.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000253# For each directory under top (including top itself, but excluding
254# '.' and '..'), func(arg, dirname, filenames) is called, where
255# dirname is the name of the directory and filenames is the list
Guido van Rossum346f7af1997-12-05 19:04:51 +0000256# of files (and subdirectories etc.) in the directory.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000257# The func may modify the filenames list, to implement a filter,
Guido van Rossumc6360141990-10-13 19:23:40 +0000258# or to impose a different order of visiting.
Guido van Rossum7ac48781992-01-14 18:29:32 +0000259
def walk(top, func, arg):
    """Walk a directory tree, calling func once per directory.

    For top and every directory found below it, func(arg, dirname, fnames)
    is called, where dirname is the directory's path and fnames is the
    list returned by os.listdir() for it.  func is called before the
    entries are visited and may modify fnames in place (e.g. with del or
    slice assignment); only the names still in the list afterwards are
    considered for recursion, in list order, so this can filter or
    reorder the walk.

    arg is passed through to func untouched; walk attaches no meaning to
    it.  Entries are examined with os.lstat(), so a symbolic link to a
    directory is not descended into.  A directory that cannot be listed
    is skipped without calling func, and an entry that cannot be examined
    is ignored.
    """
    try:
        names = os.listdir(top)
    except os.error:
        return
    func(arg, top, names)
    # Iterate only after func has run so its in-place edits take effect.
    for entry in names:
        child = join(top, entry)
        try:
            mode = os.lstat(child)[stat.ST_MODE]
        except os.error:
            continue
        if stat.S_ISDIR(mode):
            walk(child, func, arg)
Guido van Rossum7ac48781992-01-14 18:29:32 +0000288
289
290# Expand paths beginning with '~' or '~user'.
291# '~' means $HOME; '~user' means that user's home directory.
292# If the path doesn't begin with '~', or if the user or $HOME is unknown,
293# the path is returned unchanged (leaving error reporting to whatever
294# function is called with the expanded path as argument).
295# See also module 'glob' for expansion of *, ? and [...] in pathnames.
296# (A function should also be defined to do full *sh-style environment
297# variable expansion.)
298
def expanduser(path):
    """Expand a leading '~' or '~user' into a home directory.

    '~' alone is replaced by the value of $HOME; '~user' is replaced by
    that user's home directory from the password database.  The path is
    returned unchanged when it does not start with '~', when $HOME is not
    set, or when the user is unknown.
    """
    if path[:1] != '~':
        return path
    # i is the end of the '~' or '~user' prefix: the first '/' after the
    # tilde, or the end of the string when there is none.
    i = path.find('/', 1)
    if i < 0:
        i = len(path)
    if i == 1:
        if 'HOME' not in os.environ:
            return path
        userhome = os.environ['HOME']
    else:
        # Imported lazily; only needed for the '~user' form.
        import pwd
        try:
            pwent = pwd.getpwnam(path[1:i])
        except KeyError:
            return path
        userhome = pwent[5]
    # If the home directory already ends in '/', skip the '/' following
    # the prefix so the result does not contain a doubled slash.
    if userhome[-1:] == '/':
        i = i + 1
    return userhome + path[i:]
Guido van Rossum4732ccf1992-08-09 13:54:50 +0000320
321
322# Expand paths containing shell variable substitutions.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000323# This expands the forms $variable and ${variable} only.
Jeremy Hyltona05e2932000-06-28 14:48:01 +0000324# Non-existent variables are left unchanged.
Guido van Rossumb6775db1994-08-01 11:34:53 +0000325
# Compiled pattern for $var / ${var}; built on first use by expandvars().
_varprog = None


def expandvars(path):
    """Expand shell variables of the forms $var and ${var}.

    Each reference is replaced by the value of the environment variable
    of that name.  References to variables that are not set are left in
    place unchanged.  Substituted values are not scanned again, so a
    value containing '$' is inserted literally.
    """
    global _varprog
    if '$' not in path:
        return path
    if not _varprog:
        # Compile lazily so importing this module does not pull in re.
        import re
        _varprog = re.compile(r'\$(\w+|\{[^}]*\})')
    i = 0
    while 1:
        m = _varprog.search(path, i)
        if not m:
            break
        i, j = m.span(0)
        name = m.group(1)
        if name[:1] == '{' and name[-1:] == '}':
            name = name[1:-1]
        if name in os.environ:
            tail = path[j:]
            path = path[:i] + os.environ[name]
            # Resume searching after the inserted value, not inside it.
            i = len(path)
            path = path + tail
        else:
            # Unknown variable: leave the reference and move past it.
            i = j
    return path
353 return path
Guido van Rossumc629d341992-11-05 10:43:02 +0000354
355
356# Normalize a path, e.g. A//B, A/./B and A/foo/../B all become A/B.
357# It should be understood that this may change the meaning of the path
358# if it contains symbolic links!
359
def normpath(path):
    """Normalize a pathname.

    Repeated slashes, '.' components and 'name/..' pairs are collapsed,
    so A//B, A/./B and A/foo/../B all become A/B.  Leading '..'
    components of a relative path are kept; '..' directly under the root
    is dropped.  An empty path, or one that collapses to nothing, becomes
    '.'.  This is purely textual and may change the meaning of a path
    that contains symbolic links.
    """
    if path == '':
        return '.'
    # POSIX allows one or two initial slashes, but treats three or more
    # as a single slash.
    if not path.startswith('/'):
        leading = 0
    elif path.startswith('//') and not path.startswith('///'):
        leading = 2
    else:
        leading = 1
    kept = []
    for comp in path.split('/'):
        if comp == '' or comp == '.':
            continue
        if comp == '..':
            if kept and kept[-1] != '..':
                # Cancels the preceding real component.
                kept.pop()
                continue
            if leading and not kept:
                # '..' at the root of an absolute path goes nowhere.
                continue
        kept.append(comp)
    result = '/' * leading + '/'.join(kept)
    return result or '.'
Guido van Rossume294cf61999-01-29 18:05:18 +0000385
386
def abspath(path):
    """Return a normalized, absolute version of a pathname.

    A relative path is first joined onto the current working directory;
    the result is then passed through normpath().
    """
    if isabs(path):
        return normpath(path)
    return normpath(join(os.getcwd(), path))
Guido van Rossum83eeef42001-09-17 15:16:09 +0000392
393
394# Return a canonical path (i.e. the absolute location of a file on the
395# filesystem).
396
def realpath(filename):
    """Return the canonical path of filename, with symbolic links resolved.

    The path is made absolute, then examined one leading prefix at a
    time.  At the first prefix that is a symbolic link, the link target
    is read, interpreted relative to the link's directory, and the rest
    of the path is re-attached; the whole procedure then starts over on
    that new path.  When no prefix is a link, the absolute path is
    returned.

    NOTE: there is no cycle detection, so a loop of symbolic links keeps
    recursing.
    """
    filename = abspath(filename)

    parts = ['/'] + filename.split('/')[1:]
    for end in range(2, len(parts) + 1):
        prefix = join(*parts[:end])
        if not islink(prefix):
            continue
        target = os.readlink(prefix)
        # A relative target is relative to the directory holding the link.
        parent = split(prefix)[0]
        expanded = normpath(join(parent, target))
        return realpath(join(*([expanded] + parts[end:])))

    return filename
Guido van Rossum83eeef42001-09-17 15:16:09 +0000412 return filename