blob: 2a304a2f4aa6ad13abb5cefd133c825ec98c6c2e [file] [log] [blame]
\section{\module{os.path} ---
         Common pathname manipulations}
\declaremodule{standard}{os.path}

\modulesynopsis{Common pathname manipulations.}

This module implements some useful functions on pathnames.
\index{path!operations}

\warning{On Windows, many of these functions do not properly
support UNC pathnames. \function{splitunc()} and \function{ismount()}
do handle them correctly.}


\begin{funcdesc}{abspath}{path}
Return a normalized absolutized version of the pathname \var{path}.
On most platforms, this is equivalent to
\code{normpath(join(os.getcwd(), \var{path}))}.
\versionadded{1.5.2}
\end{funcdesc}

\begin{funcdesc}{basename}{path}
Return the base name of pathname \var{path}. This is the second half
of the pair returned by \code{split(\var{path})}. Note that the
result of this function is different from the
\UNIX{} \program{basename} program; where \program{basename} for
\code{'/foo/bar/'} returns \code{'bar'}, the \function{basename()}
function returns an empty string (\code{''}).
\end{funcdesc}

\begin{funcdesc}{commonprefix}{list}
Return the longest path prefix (taken character-by-character) that is a
prefix of all paths in
\var{list}. If \var{list} is empty, return the empty string
(\code{''}). Note that this may return invalid paths because it works a
character at a time.
\end{funcdesc}

\begin{funcdesc}{dirname}{path}
Return the directory name of pathname \var{path}. This is the first
half of the pair returned by \code{split(\var{path})}.
\end{funcdesc}

\begin{funcdesc}{exists}{path}
Return \code{True} if \var{path} refers to an existing path.
Returns \code{False} for broken symbolic links.
\end{funcdesc}

\begin{funcdesc}{lexists}{path}
Return \code{True} if \var{path} refers to an existing path.
Returns \code{True} for broken symbolic links.
Equivalent to \function{exists()} on platforms lacking
\function{os.lstat()}.
\versionadded{2.4}
\end{funcdesc}

\begin{funcdesc}{expanduser}{path}
Return the argument with an initial component of \samp{\~} or
\samp{\~\var{user}} replaced by that \var{user}'s home directory. An
initial \samp{\~{}} is replaced by the environment variable
\envvar{HOME}; an initial \samp{\~\var{user}} is looked up in the
password directory through the built-in module
\refmodule{pwd}\refbimodindex{pwd}. If the expansion fails, or if the
path does not begin with a tilde, the path is returned unchanged.
\end{funcdesc}

\begin{funcdesc}{expandvars}{path}
Return the argument with environment variables expanded. Substrings
of the form \samp{\$\var{name}} or \samp{\$\{\var{name}\}} are
replaced by the value of environment variable \var{name}. Malformed
variable names and references to non-existing variables are left
unchanged.
\end{funcdesc}

\begin{funcdesc}{getatime}{path}
Return the time of last access of \var{path}. The return
value is a number giving the number of seconds since the epoch (see the
\refmodule{time} module). Raise \exception{os.error} if the file does
not exist or is inaccessible.
\versionadded{1.5.2}
\versionchanged[If \function{os.stat_float_times()} returns \code{True}, the result is a floating point number]{2.3}
\end{funcdesc}

\begin{funcdesc}{getmtime}{path}
Return the time of last modification of \var{path}. The return
value is a number giving the number of seconds since the epoch (see the
\refmodule{time} module). Raise \exception{os.error} if the file does
not exist or is inaccessible.
\versionadded{1.5.2}
\versionchanged[If \function{os.stat_float_times()} returns \code{True}, the result is a floating point number]{2.3}
\end{funcdesc}

\begin{funcdesc}{getctime}{path}
Return the system's ctime which, on some systems (like \UNIX), is the
time of the last change, and, on others (like Windows), is the
creation time for \var{path}. The return
value is a number giving the number of seconds since the epoch (see the
\refmodule{time} module). Raise \exception{os.error} if the file does
not exist or is inaccessible.
\versionadded{2.3}
\end{funcdesc}

\begin{funcdesc}{getsize}{path}
Return the size, in bytes, of \var{path}. Raise
\exception{os.error} if the file does not exist or is inaccessible.
\versionadded{1.5.2}
\end{funcdesc}

\begin{funcdesc}{isabs}{path}
Return \code{True} if \var{path} is an absolute pathname (begins with a
slash).
\end{funcdesc}

\begin{funcdesc}{isfile}{path}
Return \code{True} if \var{path} is an existing regular file. This follows
symbolic links, so both \function{islink()} and \function{isfile()}
can be true for the same path.
\end{funcdesc}

\begin{funcdesc}{isdir}{path}
Return \code{True} if \var{path} is an existing directory. This follows
symbolic links, so both \function{islink()} and \function{isdir()} can
be true for the same path.
\end{funcdesc}

\begin{funcdesc}{islink}{path}
Return \code{True} if \var{path} refers to a directory entry that is a
symbolic link. Always \code{False} if symbolic links are not supported.
\end{funcdesc}

\begin{funcdesc}{ismount}{path}
Return \code{True} if pathname \var{path} is a \dfn{mount point}: a point in
a file system where a different file system has been mounted. The
function checks whether \var{path}'s parent, \file{\var{path}/..}, is
on a different device than \var{path}, or whether \file{\var{path}/..}
and \var{path} point to the same i-node on the same device --- this
should detect mount points for all \UNIX{} and \POSIX{} variants.
\end{funcdesc}

\begin{funcdesc}{join}{path1\optional{, path2\optional{, ...}}}
Join one or more path components intelligently. If any component is
an absolute path, all previous components are thrown away, and joining
continues. The return value is the concatenation of \var{path1}, and
optionally \var{path2}, etc., with exactly one directory separator
(\code{os.sep}) inserted between components, unless \var{path2} is
empty. Note that on Windows, since there is a current directory for
each drive, \function{os.path.join("c:", "foo")} represents a path
relative to the current directory on drive \file{C:} (\file{c:foo}), not
\file{c:\textbackslash{}foo}.
\end{funcdesc}

\begin{funcdesc}{normcase}{path}
Normalize the case of a pathname. On \UNIX, this returns the path
unchanged; on case-insensitive filesystems, it converts the path to
lowercase. On Windows, it also converts forward slashes to backward
slashes.
\end{funcdesc}

\begin{funcdesc}{normpath}{path}
Normalize a pathname. This collapses redundant separators and
up-level references, e.g.\ \code{A//B}, \code{A/./B} and
\code{A/foo/../B} all become \code{A/B}. It does not normalize the
case (use \function{normcase()} for that). On Windows, it converts
forward slashes to backward slashes. It should be understood that this may
change the meaning of the path if it contains symbolic links!
\end{funcdesc}

\begin{funcdesc}{realpath}{path}
Return the canonical path of the specified filename, eliminating any
symbolic links encountered in the path.
Availability: \UNIX.
\versionadded{2.2}
\end{funcdesc}

\begin{funcdesc}{samefile}{path1, path2}
Return \code{True} if both pathname arguments refer to the same file or
directory (as indicated by device number and i-node number).
Raise an exception if an \function{os.stat()} call on either pathname
fails.
Availability: Macintosh, \UNIX.
\end{funcdesc}

\begin{funcdesc}{sameopenfile}{fp1, fp2}
Return \code{True} if the file objects \var{fp1} and \var{fp2} refer to the
same file. The two file objects may represent different file
descriptors.
Availability: Macintosh, \UNIX.
\end{funcdesc}

\begin{funcdesc}{samestat}{stat1, stat2}
Return \code{True} if the stat tuples \var{stat1} and \var{stat2} refer to
the same file. These structures may have been returned by
\function{fstat()}, \function{lstat()}, or \function{stat()}. This
function implements the underlying comparison used by
\function{samefile()} and \function{sameopenfile()}.
Availability: Macintosh, \UNIX.
\end{funcdesc}

\begin{funcdesc}{split}{path}
Split the pathname \var{path} into a pair, \code{(\var{head},
\var{tail})} where \var{tail} is the last pathname component and
\var{head} is everything leading up to that. The \var{tail} part will
never contain a slash; if \var{path} ends in a slash, \var{tail} will
be empty. If there is no slash in \var{path}, \var{head} will be
empty. If \var{path} is empty, both \var{head} and \var{tail} are
empty. Trailing slashes are stripped from \var{head} unless it is the
root (one or more slashes only). In nearly all cases,
\code{join(\var{head}, \var{tail})} equals \var{path} (the only
exception being when there were multiple slashes separating \var{head}
from \var{tail}).
\end{funcdesc}

\begin{funcdesc}{splitdrive}{path}
Split the pathname \var{path} into a pair \code{(\var{drive},
\var{tail})} where \var{drive} is either a drive specification or the
empty string. On systems which do not use drive specifications,
\var{drive} will always be the empty string. In all cases,
\code{\var{drive} + \var{tail}} will be the same as \var{path}.
\versionadded{1.3}
\end{funcdesc}

\begin{funcdesc}{splitext}{path}
Split the pathname \var{path} into a pair \code{(\var{root}, \var{ext})}
such that \code{\var{root} + \var{ext} == \var{path}},
and \var{ext} is empty or begins with a period and contains
at most one period.
\end{funcdesc}

\begin{funcdesc}{walk}{path, visit, arg}
Calls the function \var{visit} with arguments
\code{(\var{arg}, \var{dirname}, \var{names})} for each directory in the
directory tree rooted at \var{path} (including \var{path} itself, if it
is a directory). The argument \var{dirname} specifies the visited
directory, the argument \var{names} lists the files in the directory
(gotten from \code{os.listdir(\var{dirname})}).
The \var{visit} function may modify \var{names} to
influence the set of directories visited below \var{dirname}, e.g., to
avoid visiting certain parts of the tree. (The object referred to by
\var{names} must be modified in place, using \keyword{del} or slice
assignment.)

\begin{notice}
Symbolic links to directories are not treated as subdirectories, and
\function{walk()} therefore will not visit them. To visit linked
directories you must identify them with
\code{os.path.islink(\var{file})} and
\code{os.path.isdir(\var{file})}, and invoke \function{walk()} as
necessary.
\end{notice}

\note{The newer \function{\refmodule{os}.walk()} generator supplies
      similar functionality and can be easier to use.}
\end{funcdesc}

\begin{datadesc}{supports_unicode_filenames}
\code{True} if arbitrary Unicode strings can be used as file names (within
limitations imposed by the file system), and if
\function{os.listdir()} returns Unicode strings for a Unicode
argument.
\versionadded{2.3}
\end{datadesc}