blob: 0aee60561faa7edea4343aae1cb657dc3736fe0b [file] [log] [blame]
Guido van Rossumab096c91997-04-02 05:47:11 +00001"""Filename globbing utility."""
Guido van Rossum65a96201991-01-01 18:17:49 +00002
Georg Brandl71ff6462007-03-07 08:31:51 +00003import sys
Guido van Rossumbba77af1992-01-12 23:26:24 +00004import os
Guido van Rossum9694fca1997-10-22 21:00:49 +00005import re
Georg Brandl71ff6462007-03-07 08:31:51 +00006import fnmatch
Guido van Rossum65a96201991-01-01 18:17:49 +00007
Martin v. Löwised11a5d2012-05-20 10:42:17 +02008try:
9 _unicode = unicode
10except NameError:
11 # If Python is built without Unicode support, the unicode type
12 # will not exist. Fake one.
13 class _unicode(object):
14 pass
15
Johannes Gijsbers836f5432005-01-08 13:13:19 +000016__all__ = ["glob", "iglob"]
Guido van Rossumbba77af1992-01-12 23:26:24 +000017
Guido van Rossum65a96201991-01-01 18:17:49 +000018def glob(pathname):
Tim Peters07e99cb2001-01-14 23:47:14 +000019 """Return a list of paths matching a pathname pattern.
Guido van Rossumab096c91997-04-02 05:47:11 +000020
Tim Peters07e99cb2001-01-14 23:47:14 +000021 The pattern may contain simple shell-style wildcards a la fnmatch.
Guido van Rossumab096c91997-04-02 05:47:11 +000022
Tim Peters07e99cb2001-01-14 23:47:14 +000023 """
Johannes Gijsbers836f5432005-01-08 13:13:19 +000024 return list(iglob(pathname))
25
26def iglob(pathname):
Georg Brandl3ade7612009-04-01 17:46:01 +000027 """Return an iterator which yields the paths matching a pathname pattern.
Johannes Gijsbers836f5432005-01-08 13:13:19 +000028
29 The pattern may contain simple shell-style wildcards a la fnmatch.
30
31 """
Tim Peters07e99cb2001-01-14 23:47:14 +000032 if not has_magic(pathname):
Johannes Gijsbersae882f72004-08-30 10:19:56 +000033 if os.path.lexists(pathname):
Johannes Gijsbers836f5432005-01-08 13:13:19 +000034 yield pathname
35 return
Tim Peters07e99cb2001-01-14 23:47:14 +000036 dirname, basename = os.path.split(pathname)
Martin v. Löwisb5d4d2a2001-06-06 06:24:38 +000037 if not dirname:
Johannes Gijsbers836f5432005-01-08 13:13:19 +000038 for name in glob1(os.curdir, basename):
39 yield name
40 return
Antoine Pitrou124ee8b2012-12-16 13:55:47 +010041 # `os.path.split()` returns the argument itself as a dirname if it is a
42 # drive or UNC path. Prevent an infinite recursion if a drive or UNC path
43 # contains magic characters (i.e. r'\\?\C:').
44 if dirname != pathname and has_magic(dirname):
Johannes Gijsbers836f5432005-01-08 13:13:19 +000045 dirs = iglob(dirname)
Tim Peters07e99cb2001-01-14 23:47:14 +000046 else:
Johannes Gijsbers836f5432005-01-08 13:13:19 +000047 dirs = [dirname]
48 if has_magic(basename):
49 glob_in_dir = glob1
Tim Peters07e99cb2001-01-14 23:47:14 +000050 else:
Johannes Gijsbers836f5432005-01-08 13:13:19 +000051 glob_in_dir = glob0
52 for dirname in dirs:
53 for name in glob_in_dir(dirname, basename):
54 yield os.path.join(dirname, name)
55
56# These 2 helper functions non-recursively glob inside a literal directory.
57# They return a list of basenames. `glob1` accepts a pattern while `glob0`
58# takes a literal basename (so it only has to check for its existence).
Guido van Rossum65a96201991-01-01 18:17:49 +000059
60def glob1(dirname, pattern):
Johannes Gijsbers836f5432005-01-08 13:13:19 +000061 if not dirname:
62 dirname = os.curdir
Martin v. Löwised11a5d2012-05-20 10:42:17 +020063 if isinstance(pattern, _unicode) and not isinstance(dirname, unicode):
Georg Brandlb54a8092007-03-20 23:05:14 +000064 dirname = unicode(dirname, sys.getfilesystemencoding() or
65 sys.getdefaultencoding())
Tim Peters07e99cb2001-01-14 23:47:14 +000066 try:
67 names = os.listdir(dirname)
68 except os.error:
69 return []
Georg Brandl71ff6462007-03-07 08:31:51 +000070 if pattern[0] != '.':
71 names = filter(lambda x: x[0] != '.', names)
72 return fnmatch.filter(names, pattern)
Guido van Rossum65a96201991-01-01 18:17:49 +000073
Johannes Gijsbers836f5432005-01-08 13:13:19 +000074def glob0(dirname, basename):
75 if basename == '':
76 # `os.path.split()` returns an empty basename for paths ending with a
77 # directory separator. 'q*x/' should match only directories.
Neal Norwitza31bf182006-04-09 03:35:43 +000078 if os.path.isdir(dirname):
Johannes Gijsbers836f5432005-01-08 13:13:19 +000079 return [basename]
80 else:
81 if os.path.lexists(os.path.join(dirname, basename)):
82 return [basename]
83 return []
84
Guido van Rossumc2ef5c21992-01-12 23:32:11 +000085
Guido van Rossum9694fca1997-10-22 21:00:49 +000086magic_check = re.compile('[*?[]')
Guido van Rossumc2ef5c21992-01-12 23:32:11 +000087
Guido van Rossum65a96201991-01-01 18:17:49 +000088def has_magic(s):
Tim Peters07e99cb2001-01-14 23:47:14 +000089 return magic_check.search(s) is not None