blob: f16e8e16e420295f201fa59d37f88e00b038c022 [file] [log] [blame]
"""Filename globbing utility."""
Guido van Rossum65a96201991-01-01 18:17:49 +00002
Guido van Rossumbba77af1992-01-12 23:26:24 +00003import os
Guido van Rossum9694fca1997-10-22 21:00:49 +00004import re
Guido van Rossumd8faa362007-04-27 19:54:29 +00005import fnmatch
Guido van Rossum65a96201991-01-01 18:17:49 +00006
Johannes Gijsbers836f5432005-01-08 13:13:19 +00007__all__ = ["glob", "iglob"]
Guido van Rossumbba77af1992-01-12 23:26:24 +00008
def glob(pathname):
    """Collect every path that matches the pattern `pathname` into a list.

    `pathname` may use simple shell-style wildcards, in the manner of the
    fnmatch module.  This is the eager counterpart of `iglob`: the
    iterator it produces is fully consumed before returning.

    """
    matches = list(iglob(pathname))
    return matches
16
def iglob(pathname):
    """Lazily yield each path that matches the pattern `pathname`.

    `pathname` may use simple shell-style wildcards, in the manner of the
    fnmatch module.  A pattern without any wildcard is yielded as-is when
    `os.path.lexists` reports that it exists, and nothing is yielded
    otherwise.

    """
    if not has_magic(pathname):
        # Literal path: a single existence check is all that is needed.
        if os.path.lexists(pathname):
            yield pathname
        return

    head, tail = os.path.split(pathname)
    if not head:
        # Bare pattern with no directory part: glob1 picks the current
        # directory itself, and the basenames are yielded unjoined.
        for match in glob1(None, tail):
            yield match
        return

    # `os.path.split()` returns the argument itself as the directory part
    # if it is a drive or UNC path.  The `head != pathname` test prevents
    # an infinite recursion when such a path contains magic characters
    # (i.e. r'\\?\C:').
    parents = iglob(head) if head != pathname and has_magic(head) else [head]
    # Only a wildcard basename needs a directory listing; a literal one
    # just has to be checked for existence.
    match_in_dir = glob1 if has_magic(tail) else glob0
    for parent in parents:
        for match in match_in_dir(parent, tail):
            yield os.path.join(parent, match)
46
# These two helper functions glob non-recursively inside a literal directory.
# Both return a list of basenames.  `glob1` accepts a pattern, while `glob0`
# takes a literal basename (so it only has to check for its existence).
Guido van Rossum65a96201991-01-01 18:17:49 +000050
def glob1(dirname, pattern):
    """Return the basenames inside `dirname` that match `pattern`.

    A false `dirname` (None or empty) means the current directory,
    expressed as bytes when `pattern` is bytes and as str otherwise.  If
    the directory cannot be listed, the result is an empty list.  Names
    starting with a dot are dropped unless `pattern` starts with a dot
    too.

    """
    if not dirname:
        as_bytes = isinstance(pattern, bytes)
        dirname = bytes(os.curdir, 'ASCII') if as_bytes else os.curdir
    try:
        entries = os.listdir(dirname)
    except os.error:
        return []
    if _ishidden(pattern):
        candidates = entries
    else:
        candidates = [entry for entry in entries if not _ishidden(entry)]
    return fnmatch.filter(candidates, pattern)
Guido van Rossum65a96201991-01-01 18:17:49 +000064
def glob0(dirname, basename):
    """Return `[basename]` if it exists inside `dirname`, else `[]`.

    `basename` is taken literally (no wildcard expansion).  A non-empty
    `basename` is looked up with `os.path.lexists` on the joined path; an
    empty one matches only when `dirname` is a directory.

    """
    if basename:
        found = os.path.lexists(os.path.join(dirname, basename))
    else:
        # `os.path.split()` returns an empty basename for paths ending
        # with a directory separator.  'q*x/' should match only
        # directories.
        found = os.path.isdir(dirname)
    return [basename] if found else []
75
Guido van Rossumc2ef5c21992-01-12 23:32:11 +000076
# Any one of the wildcard characters `*`, `?` or `[`, in a str flavour and
# a bytes flavour so that either kind of path can be searched.
magic_check = re.compile('[*?[]')
magic_check_bytes = re.compile(b'[*?[]')

def has_magic(s):
    """Return True if `s` contains at least one of `*`, `?` or `[`.

    `s` may be str or bytes; the compiled pattern of the matching type is
    chosen accordingly.

    """
    checker = magic_check_bytes if isinstance(s, bytes) else magic_check
    return checker.search(s) is not None
Hynek Schlawacke26568f2012-12-27 10:10:11 +010086
def _ishidden(path):
    """Return True if `path` (str or bytes) starts with a dot.

    An empty `path` is reported as not hidden rather than raising
    IndexError.

    """
    if not path:
        return False
    # Indexing yields a one-character str for text and an int for bytes,
    # so a single membership test covers both types.
    return path[0] in ('.', b'.'[0])