blob: 1f602656d0881bb3758638ef7b73151acda4038a [file] [log] [blame]
Guido van Rossumab096c91997-04-02 05:47:11 +00001"""Filename globbing utility."""
Guido van Rossum65a96201991-01-01 18:17:49 +00002
Guido van Rossumbba77af1992-01-12 23:26:24 +00003import os
Guido van Rossum9694fca1997-10-22 21:00:49 +00004import re
Guido van Rossumd8faa362007-04-27 19:54:29 +00005import fnmatch
Guido van Rossum65a96201991-01-01 18:17:49 +00006
Johannes Gijsbers836f5432005-01-08 13:13:19 +00007__all__ = ["glob", "iglob"]
Guido van Rossumbba77af1992-01-12 23:26:24 +00008
def glob(pathname):
    """Collect every path that matches a pathname pattern into a list.

    This is the eager counterpart of iglob(): the iterator it returns
    is consumed completely and its items are returned as a list.

    The pattern may use the simple shell-style wildcards understood by
    fnmatch.  Unlike fnmatch, however, filenames that begin with a dot
    are treated specially and are not matched by '*' and '?' patterns.

    """
    matches = iglob(pathname)
    return list(matches)
19
def iglob(pathname):
    """Lazily yield each path that matches a pathname pattern.

    The pattern may use the simple shell-style wildcards understood by
    fnmatch.  Unlike fnmatch, however, filenames that begin with a dot
    are treated specially and are not matched by '*' and '?' patterns.

    """
    # A pattern without wildcards names at most one path: report it only
    # if it exists (lexists() also accepts broken symlinks).
    if not has_magic(pathname):
        if os.path.lexists(pathname):
            yield pathname
        return

    head, tail = os.path.split(pathname)

    # No directory component: match the pattern against the current
    # directory and yield the bare names.
    if not head:
        yield from glob1(None, tail)
        return

    # `os.path.split()` hands back its argument unchanged as the directory
    # part when that argument is a drive or UNC path.  Recursing only when
    # the head differs from the full pathname prevents infinite recursion
    # for drive/UNC paths containing magic characters (e.g. r'\\?\C:').
    if head != pathname and has_magic(head):
        parents = iglob(head)
    else:
        parents = [head]

    # A wildcard basename needs a directory listing; a literal one only
    # needs an existence check.
    list_matches = glob1 if has_magic(tail) else glob0

    for parent in parents:
        for entry in list_matches(parent, tail):
            yield os.path.join(parent, entry)
52
53# These 2 helper functions non-recursively glob inside a literal directory.
54# They return a list of basenames. `glob1` accepts a pattern while `glob0`
55# takes a literal basename (so it only has to check for its existence).
Guido van Rossum65a96201991-01-01 18:17:49 +000056
def glob1(dirname, pattern):
    """Return the basenames inside `dirname` that match `pattern`.

    A false `dirname` (None or empty) means the current directory, spelled
    as bytes when the pattern is bytes and as str otherwise.  If the
    directory cannot be listed, an empty list is returned.  Names starting
    with a dot are dropped unless the pattern itself starts with a dot.
    """
    if not dirname:
        here = os.curdir
        dirname = bytes(here, 'ASCII') if isinstance(pattern, bytes) else here

    try:
        entries = os.listdir(dirname)
    except OSError:
        # Unreadable, missing or non-directory path: nothing can match.
        return []

    if _ishidden(pattern):
        # The pattern explicitly asks for dot-files, so keep everything.
        candidates = entries
    else:
        candidates = [entry for entry in entries if not _ishidden(entry)]
    return fnmatch.filter(candidates, pattern)
Guido van Rossum65a96201991-01-01 18:17:49 +000070
def glob0(dirname, basename):
    """Return `[basename]` if that literal name exists in `dirname`, else [].

    `os.path.split()` produces an empty basename for paths that end with a
    directory separator, so a pattern such as 'q*x/' must match
    directories only: in that case the check is whether `dirname` itself
    is a directory.  Otherwise the joined path merely has to exist
    (lexists() also accepts broken symlinks).
    """
    if basename:
        found = os.path.lexists(os.path.join(dirname, basename))
    else:
        found = os.path.isdir(dirname)
    return [basename] if found else []
81
Guido van Rossumc2ef5c21992-01-12 23:32:11 +000082
# Compiled once at import time: a pattern is "magic" when it contains any
# of the wildcard characters '*', '?' or '['.  One regex per string type,
# because a str pattern cannot search bytes and vice versa.
magic_check = re.compile('[*?[]')
magic_check_bytes = re.compile(b'[*?[]')


def has_magic(s):
    """Return True if `s` contains a wildcard character ('*', '?' or '[').

    `s` may be str or bytes; the regex of the matching type is used.
    """
    checker = magic_check_bytes if isinstance(s, bytes) else magic_check
    return checker.search(s) is not None
Hynek Schlawacke26568f2012-12-27 10:10:11 +010092
def _ishidden(path):
    """Return True if `path` (str or bytes) starts with a dot.

    Indexing a str yields a one-character str, while indexing bytes
    yields an int, so the first element is compared against both '.' and
    the integer value of b'.'.

    An empty name is reported as not hidden; indexing it would raise
    IndexError.
    """
    if not path:
        return False
    return path[0] in ('.', b'.'[0])