blob: d6ddaadc90de33d4c855ff132e5009cdf96fca3c [file] [log] [blame]
Guido van Rossumab096c91997-04-02 05:47:11 +00001"""Filename globbing utility."""
Guido van Rossum65a96201991-01-01 18:17:49 +00002
Georg Brandl71ff6462007-03-07 08:31:51 +00003import sys
Guido van Rossumbba77af1992-01-12 23:26:24 +00004import os
Guido van Rossum9694fca1997-10-22 21:00:49 +00005import re
Georg Brandl71ff6462007-03-07 08:31:51 +00006import fnmatch
Guido van Rossum65a96201991-01-01 18:17:49 +00007
Martin v. Löwised11a5d2012-05-20 10:42:17 +02008try:
9 _unicode = unicode
10except NameError:
11 # If Python is built without Unicode support, the unicode type
12 # will not exist. Fake one.
13 class _unicode(object):
14 pass
15
Johannes Gijsbers836f5432005-01-08 13:13:19 +000016__all__ = ["glob", "iglob"]
Guido van Rossumbba77af1992-01-12 23:26:24 +000017
Guido van Rossum65a96201991-01-01 18:17:49 +000018def glob(pathname):
Tim Peters07e99cb2001-01-14 23:47:14 +000019 """Return a list of paths matching a pathname pattern.
Guido van Rossumab096c91997-04-02 05:47:11 +000020
Tim Peters07e99cb2001-01-14 23:47:14 +000021 The pattern may contain simple shell-style wildcards a la fnmatch.
Guido van Rossumab096c91997-04-02 05:47:11 +000022
Tim Peters07e99cb2001-01-14 23:47:14 +000023 """
Johannes Gijsbers836f5432005-01-08 13:13:19 +000024 return list(iglob(pathname))
25
26def iglob(pathname):
Georg Brandl3ade7612009-04-01 17:46:01 +000027 """Return an iterator which yields the paths matching a pathname pattern.
Johannes Gijsbers836f5432005-01-08 13:13:19 +000028
29 The pattern may contain simple shell-style wildcards a la fnmatch.
30
31 """
Tim Peters07e99cb2001-01-14 23:47:14 +000032 if not has_magic(pathname):
Johannes Gijsbersae882f72004-08-30 10:19:56 +000033 if os.path.lexists(pathname):
Johannes Gijsbers836f5432005-01-08 13:13:19 +000034 yield pathname
35 return
Tim Peters07e99cb2001-01-14 23:47:14 +000036 dirname, basename = os.path.split(pathname)
Martin v. Löwisb5d4d2a2001-06-06 06:24:38 +000037 if not dirname:
Johannes Gijsbers836f5432005-01-08 13:13:19 +000038 for name in glob1(os.curdir, basename):
39 yield name
40 return
41 if has_magic(dirname):
42 dirs = iglob(dirname)
Tim Peters07e99cb2001-01-14 23:47:14 +000043 else:
Johannes Gijsbers836f5432005-01-08 13:13:19 +000044 dirs = [dirname]
45 if has_magic(basename):
46 glob_in_dir = glob1
Tim Peters07e99cb2001-01-14 23:47:14 +000047 else:
Johannes Gijsbers836f5432005-01-08 13:13:19 +000048 glob_in_dir = glob0
49 for dirname in dirs:
50 for name in glob_in_dir(dirname, basename):
51 yield os.path.join(dirname, name)
52
53# These 2 helper functions non-recursively glob inside a literal directory.
54# They return a list of basenames. `glob1` accepts a pattern while `glob0`
55# takes a literal basename (so it only has to check for its existence).
Guido van Rossum65a96201991-01-01 18:17:49 +000056
57def glob1(dirname, pattern):
Johannes Gijsbers836f5432005-01-08 13:13:19 +000058 if not dirname:
59 dirname = os.curdir
Martin v. Löwised11a5d2012-05-20 10:42:17 +020060 if isinstance(pattern, _unicode) and not isinstance(dirname, unicode):
Georg Brandlb54a8092007-03-20 23:05:14 +000061 dirname = unicode(dirname, sys.getfilesystemencoding() or
62 sys.getdefaultencoding())
Tim Peters07e99cb2001-01-14 23:47:14 +000063 try:
64 names = os.listdir(dirname)
65 except os.error:
66 return []
Georg Brandl71ff6462007-03-07 08:31:51 +000067 if pattern[0] != '.':
68 names = filter(lambda x: x[0] != '.', names)
69 return fnmatch.filter(names, pattern)
Guido van Rossum65a96201991-01-01 18:17:49 +000070
Johannes Gijsbers836f5432005-01-08 13:13:19 +000071def glob0(dirname, basename):
72 if basename == '':
73 # `os.path.split()` returns an empty basename for paths ending with a
74 # directory separator. 'q*x/' should match only directories.
Neal Norwitza31bf182006-04-09 03:35:43 +000075 if os.path.isdir(dirname):
Johannes Gijsbers836f5432005-01-08 13:13:19 +000076 return [basename]
77 else:
78 if os.path.lexists(os.path.join(dirname, basename)):
79 return [basename]
80 return []
81
Guido van Rossumc2ef5c21992-01-12 23:32:11 +000082
Guido van Rossum9694fca1997-10-22 21:00:49 +000083magic_check = re.compile('[*?[]')
Guido van Rossumc2ef5c21992-01-12 23:32:11 +000084
Guido van Rossum65a96201991-01-01 18:17:49 +000085def has_magic(s):
Tim Peters07e99cb2001-01-14 23:47:14 +000086 return magic_check.search(s) is not None