blob: 10320a74d94249c0112a813ae59364294e08d2f8 [file] [log] [blame]
Guido van Rossum75dc4961998-03-05 03:42:00 +00001"""Find modules used by a script, using introspection."""
Thomas Heller919000e2002-11-25 20:21:59 +00002
Guido van Rossum75dc4961998-03-05 03:42:00 +00003import dis
Eric Snow32439d62015-05-02 19:15:18 -06004import importlib._bootstrap_external
Brett Cannon73b969e2012-12-22 19:34:21 -05005import importlib.machinery
Guido van Rossum75dc4961998-03-05 03:42:00 +00006import marshal
7import os
Guido van Rossum75dc4961998-03-05 03:42:00 +00008import sys
Christian Heimes45f9af32007-11-27 21:50:00 +00009import types
Brett Cannone4f41de2013-06-16 13:13:40 -040010import warnings
11with warnings.catch_warnings():
Brett Cannon213b4052015-10-30 14:41:06 -070012 warnings.simplefilter('ignore', DeprecationWarning)
Brett Cannone4f41de2013-06-16 13:13:40 -040013 import imp
Guido van Rossum75dc4961998-03-05 03:42:00 +000014
# Opcode numbers the bytecode scanner looks for, resolved once at import time.
LOAD_CONST, IMPORT_NAME, STORE_NAME, STORE_GLOBAL = (
    dis.opmap[opname]
    for opname in ('LOAD_CONST', 'IMPORT_NAME', 'STORE_NAME', 'STORE_GLOBAL')
)
# Opcodes that scan_opcodes() reports as "store" events.
STORE_OPS = (STORE_NAME, STORE_GLOBAL)
# Argument-prefix opcode; scan_opcodes() filters it out of the stream.
EXTENDED_ARG = dis.EXTENDED_ARG
Guido van Rossum75dc4961998-03-05 03:42:00 +000021
# Modulefinder does a good job at simulating Python's import machinery, but
# it cannot handle __path__ modifications packages make at runtime.  Therefore
# there is a mechanism whereby you can register extra paths in this map for a
# package, and it will be honored.
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +000026
# Note this is a mapping of package names to lists of paths.
packagePathMap = {}


# A Public interface
def AddPackagePath(packagename, path):
    """Register *path* as an additional search path for *packagename*.

    Paths accumulate in registration order; load_package() appends them to
    the package's ``__path__``.
    """
    if packagename not in packagePathMap:
        packagePathMap[packagename] = []
    packagePathMap[packagename].append(path)
Guido van Rossum75dc4961998-03-05 03:42:00 +000033
# Maps the name a package is found under to the name it should be recorded as.
replacePackageMap = {}


# This ReplacePackage mechanism allows modulefinder to work around
# situations in which a package injects itself under the name
# of another package into sys.modules at runtime by calling
# ReplacePackage("real_package_name", "faked_package_name")
# before running ModuleFinder.
def ReplacePackage(oldname, newname):
    """Record that package *oldname* should be registered as *newname*.

    A later registration for the same *oldname* overwrites the earlier one.
    """
    replacePackageMap[oldname] = newname
44
45
class Module:
    """Lightweight record describing one module or package seen by the finder."""

    def __init__(self, name, file=None, path=None):
        """Store the module's name, file and (for packages) search path."""
        self.__name__ = name
        self.__file__ = file
        self.__path__ = path
        self.__code__ = None
        # The set of global names that are assigned to in the module.
        # This includes those names imported through starimports of
        # Python modules.  (A dict is used as the set; values are ignored.)
        self.globalnames = {}
        # The set of starimports this module did that could not be
        # resolved, ie. a starimport from a non-Python module.
        self.starimports = {}

    def __repr__(self):
        """Return ``Module(name[, file][, path])``, omitting fields that are None."""
        shown = [repr(self.__name__)]
        for optional in (self.__file__, self.__path__):
            if optional is not None:
                shown.append(repr(optional))
        return "Module(" + ", ".join(shown) + ")"
Guido van Rossum75dc4961998-03-05 03:42:00 +000069
Guido van Rossum75dc4961998-03-05 03:42:00 +000070class ModuleFinder:
71
Just van Rossume29310a2002-12-31 16:33:00 +000072 def __init__(self, path=None, debug=0, excludes=[], replace_paths=[]):
Guido van Rossum912a14c1998-03-05 04:56:37 +000073 if path is None:
74 path = sys.path
75 self.path = path
76 self.modules = {}
77 self.badmodules = {}
78 self.debug = debug
79 self.indent = 0
Guido van Rossum78fc3631998-03-20 17:37:24 +000080 self.excludes = excludes
Guido van Rossum6b767ac2001-03-20 20:43:34 +000081 self.replace_paths = replace_paths
82 self.processed_paths = [] # Used in debugging only
Guido van Rossum75dc4961998-03-05 03:42:00 +000083
84 def msg(self, level, str, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +000085 if level <= self.debug:
86 for i in range(self.indent):
Guido van Rossumbe19ed72007-02-09 05:37:30 +000087 print(" ", end=' ')
88 print(str, end=' ')
Guido van Rossum912a14c1998-03-05 04:56:37 +000089 for arg in args:
Guido van Rossumbe19ed72007-02-09 05:37:30 +000090 print(repr(arg), end=' ')
91 print()
Guido van Rossum75dc4961998-03-05 03:42:00 +000092
93 def msgin(self, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +000094 level = args[0]
95 if level <= self.debug:
96 self.indent = self.indent + 1
Guido van Rossum68468eb2003-02-27 20:14:51 +000097 self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +000098
99 def msgout(self, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000100 level = args[0]
101 if level <= self.debug:
102 self.indent = self.indent - 1
Guido van Rossum68468eb2003-02-27 20:14:51 +0000103 self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000104
105 def run_script(self, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000106 self.msg(2, "run_script", pathname)
Éric Araujo1e3a68d2011-07-28 23:35:29 +0200107 with open(pathname) as fp:
Brett Cannon028011f2010-10-30 00:26:48 +0000108 stuff = ("", "r", imp.PY_SOURCE)
109 self.load_module('__main__', fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000110
111 def load_file(self, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000112 dir, name = os.path.split(pathname)
113 name, ext = os.path.splitext(name)
Éric Araujo1e3a68d2011-07-28 23:35:29 +0200114 with open(pathname) as fp:
Brett Cannon028011f2010-10-30 00:26:48 +0000115 stuff = (ext, "r", imp.PY_SOURCE)
116 self.load_module(name, fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000117
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000118 def import_hook(self, name, caller=None, fromlist=None, level=-1):
119 self.msg(3, "import_hook", name, caller, fromlist, level)
120 parent = self.determine_parent(caller, level=level)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000121 q, tail = self.find_head_package(parent, name)
122 m = self.load_tail(q, tail)
123 if not fromlist:
124 return q
125 if m.__path__:
126 self.ensure_fromlist(m, fromlist)
Thomas Heller318b7b92002-11-26 08:06:50 +0000127 return None
Guido van Rossum75dc4961998-03-05 03:42:00 +0000128
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000129 def determine_parent(self, caller, level=-1):
130 self.msgin(4, "determine_parent", caller, level)
131 if not caller or level == 0:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000132 self.msgout(4, "determine_parent -> None")
133 return None
134 pname = caller.__name__
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000135 if level >= 1: # relative import
136 if caller.__path__:
137 level -= 1
138 if level == 0:
139 parent = self.modules[pname]
140 assert parent is caller
141 self.msgout(4, "determine_parent ->", parent)
142 return parent
143 if pname.count(".") < level:
Collin Winterce36ad82007-08-30 01:19:48 +0000144 raise ImportError("relative importpath too deep")
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000145 pname = ".".join(pname.split(".")[:-level])
146 parent = self.modules[pname]
147 self.msgout(4, "determine_parent ->", parent)
148 return parent
Guido van Rossum912a14c1998-03-05 04:56:37 +0000149 if caller.__path__:
150 parent = self.modules[pname]
151 assert caller is parent
152 self.msgout(4, "determine_parent ->", parent)
153 return parent
154 if '.' in pname:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000155 i = pname.rfind('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000156 pname = pname[:i]
157 parent = self.modules[pname]
158 assert parent.__name__ == pname
159 self.msgout(4, "determine_parent ->", parent)
160 return parent
161 self.msgout(4, "determine_parent -> None")
162 return None
Guido van Rossum75dc4961998-03-05 03:42:00 +0000163
164 def find_head_package(self, parent, name):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000165 self.msgin(4, "find_head_package", parent, name)
166 if '.' in name:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000167 i = name.find('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000168 head = name[:i]
169 tail = name[i+1:]
170 else:
171 head = name
172 tail = ""
173 if parent:
174 qname = "%s.%s" % (parent.__name__, head)
175 else:
176 qname = head
177 q = self.import_module(head, qname, parent)
178 if q:
179 self.msgout(4, "find_head_package ->", (q, tail))
180 return q, tail
181 if parent:
182 qname = head
183 parent = None
184 q = self.import_module(head, qname, parent)
185 if q:
186 self.msgout(4, "find_head_package ->", (q, tail))
187 return q, tail
188 self.msgout(4, "raise ImportError: No module named", qname)
Collin Winterce36ad82007-08-30 01:19:48 +0000189 raise ImportError("No module named " + qname)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000190
191 def load_tail(self, q, tail):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000192 self.msgin(4, "load_tail", q, tail)
193 m = q
194 while tail:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000195 i = tail.find('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000196 if i < 0: i = len(tail)
197 head, tail = tail[:i], tail[i+1:]
198 mname = "%s.%s" % (m.__name__, head)
199 m = self.import_module(head, mname, m)
200 if not m:
201 self.msgout(4, "raise ImportError: No module named", mname)
Collin Winterce36ad82007-08-30 01:19:48 +0000202 raise ImportError("No module named " + mname)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000203 self.msgout(4, "load_tail ->", m)
204 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000205
206 def ensure_fromlist(self, m, fromlist, recursive=0):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000207 self.msg(4, "ensure_fromlist", m, fromlist, recursive)
208 for sub in fromlist:
209 if sub == "*":
210 if not recursive:
211 all = self.find_all_submodules(m)
212 if all:
213 self.ensure_fromlist(m, all, 1)
214 elif not hasattr(m, sub):
215 subname = "%s.%s" % (m.__name__, sub)
216 submod = self.import_module(sub, subname, m)
217 if not submod:
Collin Winterce36ad82007-08-30 01:19:48 +0000218 raise ImportError("No module named " + subname)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000219
220 def find_all_submodules(self, m):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000221 if not m.__path__:
222 return
223 modules = {}
Brett Cannonf299abd2015-04-13 14:21:02 -0400224 # 'suffixes' used to be a list hardcoded to [".py", ".pyc"].
Thomas Helleraaf1c8d2003-11-14 10:28:42 +0000225 # But we must also collect Python extension modules - although
226 # we cannot separate normal dlls from Python extensions.
227 suffixes = []
Brett Cannoncb66eb02012-05-11 12:58:42 -0400228 suffixes += importlib.machinery.EXTENSION_SUFFIXES[:]
229 suffixes += importlib.machinery.SOURCE_SUFFIXES[:]
230 suffixes += importlib.machinery.BYTECODE_SUFFIXES[:]
Guido van Rossum912a14c1998-03-05 04:56:37 +0000231 for dir in m.__path__:
232 try:
233 names = os.listdir(dir)
Andrew Svetlovad28c7f2012-12-18 22:02:39 +0200234 except OSError:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000235 self.msg(2, "can't list directory", dir)
236 continue
237 for name in names:
238 mod = None
239 for suff in suffixes:
240 n = len(suff)
241 if name[-n:] == suff:
242 mod = name[:-n]
243 break
244 if mod and mod != "__init__":
245 modules[mod] = mod
246 return modules.keys()
Guido van Rossum75dc4961998-03-05 03:42:00 +0000247
248 def import_module(self, partname, fqname, parent):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000249 self.msgin(3, "import_module", partname, fqname, parent)
250 try:
251 m = self.modules[fqname]
252 except KeyError:
253 pass
254 else:
255 self.msgout(3, "import_module ->", m)
256 return m
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000257 if fqname in self.badmodules:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000258 self.msgout(3, "import_module -> None")
259 return None
Thomas Heller2e7c8322004-05-11 15:10:59 +0000260 if parent and parent.__path__ is None:
261 self.msgout(3, "import_module -> None")
262 return None
Guido van Rossum912a14c1998-03-05 04:56:37 +0000263 try:
264 fp, pathname, stuff = self.find_module(partname,
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000265 parent and parent.__path__, parent)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000266 except ImportError:
267 self.msgout(3, "import_module ->", None)
268 return None
269 try:
270 m = self.load_module(fqname, fp, pathname, stuff)
271 finally:
Éric Araujo1e3a68d2011-07-28 23:35:29 +0200272 if fp:
273 fp.close()
Guido van Rossum912a14c1998-03-05 04:56:37 +0000274 if parent:
275 setattr(parent, partname, m)
276 self.msgout(3, "import_module ->", m)
277 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000278
Guido van Rossum1bc535d2007-05-15 18:46:22 +0000279 def load_module(self, fqname, fp, pathname, file_info):
280 suffix, mode, type = file_info
Guido van Rossum912a14c1998-03-05 04:56:37 +0000281 self.msgin(2, "load_module", fqname, fp and "fp", pathname)
282 if type == imp.PKG_DIRECTORY:
283 m = self.load_package(fqname, pathname)
284 self.msgout(2, "load_module ->", m)
285 return m
286 if type == imp.PY_SOURCE:
Guido van Rossum78fc3631998-03-20 17:37:24 +0000287 co = compile(fp.read()+'\n', pathname, 'exec')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000288 elif type == imp.PY_COMPILED:
Brett Cannon0f384782014-02-28 10:50:34 -0500289 try:
Benjamin Peterson42aa93b2017-12-09 10:26:52 -0800290 data = fp.read()
291 importlib._bootstrap_external._classify_pyc(data, fqname, {})
Brett Cannon0f384782014-02-28 10:50:34 -0500292 except ImportError as exc:
293 self.msgout(2, "raise ImportError: " + str(exc), pathname)
294 raise
Benjamin Peterson42aa93b2017-12-09 10:26:52 -0800295 co = marshal.loads(memoryview(data)[16:])
Guido van Rossum912a14c1998-03-05 04:56:37 +0000296 else:
297 co = None
298 m = self.add_module(fqname)
Guido van Rossumab045f91998-03-06 19:55:10 +0000299 m.__file__ = pathname
Guido van Rossum912a14c1998-03-05 04:56:37 +0000300 if co:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000301 if self.replace_paths:
302 co = self.replace_paths_in_code(co)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000303 m.__code__ = co
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000304 self.scan_code(co, m)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000305 self.msgout(2, "load_module ->", m)
306 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000307
Just van Rossume29310a2002-12-31 16:33:00 +0000308 def _add_badmodule(self, name, caller):
309 if name not in self.badmodules:
310 self.badmodules[name] = {}
Benjamin Petersonc0747cf2008-11-03 20:31:38 +0000311 if caller:
312 self.badmodules[name][caller.__name__] = 1
313 else:
314 self.badmodules[name]["-"] = 1
Just van Rossume29310a2002-12-31 16:33:00 +0000315
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000316 def _safe_import_hook(self, name, caller, fromlist, level=-1):
Just van Rossume29310a2002-12-31 16:33:00 +0000317 # wrapper for self.import_hook() that won't raise ImportError
318 if name in self.badmodules:
319 self._add_badmodule(name, caller)
320 return
321 try:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000322 self.import_hook(name, caller, level=level)
Guido van Rossumb940e112007-01-10 16:19:56 +0000323 except ImportError as msg:
Just van Rossume29310a2002-12-31 16:33:00 +0000324 self.msg(2, "ImportError:", str(msg))
325 self._add_badmodule(name, caller)
326 else:
327 if fromlist:
328 for sub in fromlist:
329 if sub in self.badmodules:
330 self._add_badmodule(sub, caller)
331 continue
332 try:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000333 self.import_hook(name, caller, [sub], level=level)
Guido van Rossumb940e112007-01-10 16:19:56 +0000334 except ImportError as msg:
Just van Rossume29310a2002-12-31 16:33:00 +0000335 self.msg(2, "ImportError:", str(msg))
336 fullname = name + "." + sub
337 self._add_badmodule(fullname, caller)
338
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300339 def scan_opcodes(self, co):
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000340 # Scan the code, and yield 'interesting' opcode combinations
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000341 code = co.co_code
342 names = co.co_names
343 consts = co.co_consts
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300344 opargs = [(op, arg) for _, op, arg in dis._unpack_opargs(code)
345 if op != EXTENDED_ARG]
346 for i, (op, oparg) in enumerate(opargs):
347 if op in STORE_OPS:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000348 yield "store", (names[oparg],)
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000349 continue
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300350 if (op == IMPORT_NAME and i >= 2
351 and opargs[i-1][0] == opargs[i-2][0] == LOAD_CONST):
352 level = consts[opargs[i-2][1]]
353 fromlist = consts[opargs[i-1][1]]
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000354 if level == 0: # absolute import
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300355 yield "absolute_import", (fromlist, names[oparg])
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000356 else: # relative import
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300357 yield "relative_import", (level, fromlist, names[oparg])
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000358 continue
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000359
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000360 def scan_code(self, co, m):
361 code = co.co_code
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300362 scanner = self.scan_opcodes
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000363 for what, args in scanner(co):
364 if what == "store":
365 name, = args
366 m.globalnames[name] = 1
367 elif what == "absolute_import":
368 fromlist, name = args
Just van Rossume29310a2002-12-31 16:33:00 +0000369 have_star = 0
370 if fromlist is not None:
371 if "*" in fromlist:
372 have_star = 1
373 fromlist = [f for f in fromlist if f != "*"]
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000374 self._safe_import_hook(name, m, fromlist, level=0)
Just van Rossume29310a2002-12-31 16:33:00 +0000375 if have_star:
376 # We've encountered an "import *". If it is a Python module,
377 # the code has already been parsed and we can suck out the
378 # global names.
379 mm = None
380 if m.__path__:
381 # At this point we don't know whether 'name' is a
382 # submodule of 'm' or a global module. Let's just try
383 # the full name first.
384 mm = self.modules.get(m.__name__ + "." + name)
385 if mm is None:
386 mm = self.modules.get(name)
387 if mm is not None:
388 m.globalnames.update(mm.globalnames)
389 m.starimports.update(mm.starimports)
390 if mm.__code__ is None:
391 m.starimports[name] = 1
392 else:
393 m.starimports[name] = 1
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000394 elif what == "relative_import":
395 level, fromlist, name = args
396 if name:
397 self._safe_import_hook(name, m, fromlist, level=level)
398 else:
399 parent = self.determine_parent(m, level=level)
400 self._safe_import_hook(parent.__name__, None, fromlist, level=0)
401 else:
402 # We don't expect anything else from the generator.
403 raise RuntimeError(what)
404
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000405 for c in co.co_consts:
406 if isinstance(c, type(co)):
407 self.scan_code(c, m)
408
Guido van Rossum75dc4961998-03-05 03:42:00 +0000409 def load_package(self, fqname, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000410 self.msgin(2, "load_package", fqname, pathname)
Thomas Hellerc7aaf952002-11-14 18:45:11 +0000411 newname = replacePackageMap.get(fqname)
412 if newname:
413 fqname = newname
Guido van Rossum912a14c1998-03-05 04:56:37 +0000414 m = self.add_module(fqname)
415 m.__file__ = pathname
416 m.__path__ = [pathname]
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +0000417
Guido van Rossume7e632a1998-09-14 16:02:28 +0000418 # As per comment at top of file, simulate runtime __path__ additions.
419 m.__path__ = m.__path__ + packagePathMap.get(fqname, [])
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +0000420
Guido van Rossum912a14c1998-03-05 04:56:37 +0000421 fp, buf, stuff = self.find_module("__init__", m.__path__)
Brett Cannon028011f2010-10-30 00:26:48 +0000422 try:
423 self.load_module(fqname, fp, buf, stuff)
424 self.msgout(2, "load_package ->", m)
425 return m
426 finally:
427 if fp:
428 fp.close()
Guido van Rossum75dc4961998-03-05 03:42:00 +0000429
430 def add_module(self, fqname):
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000431 if fqname in self.modules:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000432 return self.modules[fqname]
433 self.modules[fqname] = m = Module(fqname)
434 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000435
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000436 def find_module(self, name, path, parent=None):
437 if parent is not None:
Thomas Heller2e7c8322004-05-11 15:10:59 +0000438 # assert path is not None
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000439 fullname = parent.__name__+'.'+name
Guido van Rossum03f7f082001-10-18 19:15:32 +0000440 else:
441 fullname = name
442 if fullname in self.excludes:
443 self.msgout(3, "find_module -> Excluded", fullname)
Collin Winterce36ad82007-08-30 01:19:48 +0000444 raise ImportError(name)
Guido van Rossum78fc3631998-03-20 17:37:24 +0000445
Guido van Rossum912a14c1998-03-05 04:56:37 +0000446 if path is None:
447 if name in sys.builtin_module_names:
448 return (None, None, ("", "", imp.C_BUILTIN))
Guido van Rossum78fc3631998-03-20 17:37:24 +0000449
Guido van Rossum912a14c1998-03-05 04:56:37 +0000450 path = self.path
451 return imp.find_module(name, path)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000452
453 def report(self):
Just van Rossume29310a2002-12-31 16:33:00 +0000454 """Print a report to stdout, listing the found modules with their
455 paths, as well as modules that are missing, or seem to be missing.
456 """
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000457 print()
458 print(" %-25s %s" % ("Name", "File"))
459 print(" %-25s %s" % ("----", "----"))
Guido van Rossum912a14c1998-03-05 04:56:37 +0000460 # Print modules found
Guido van Rossumd59cde82007-06-12 00:25:08 +0000461 keys = sorted(self.modules.keys())
Guido van Rossum912a14c1998-03-05 04:56:37 +0000462 for key in keys:
463 m = self.modules[key]
464 if m.__path__:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000465 print("P", end=' ')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000466 else:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000467 print("m", end=' ')
468 print("%-25s" % key, m.__file__ or "")
Guido van Rossum75dc4961998-03-05 03:42:00 +0000469
Guido van Rossum912a14c1998-03-05 04:56:37 +0000470 # Print missing modules
Just van Rossume29310a2002-12-31 16:33:00 +0000471 missing, maybe = self.any_missing_maybe()
472 if missing:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000473 print()
474 print("Missing modules:")
Just van Rossume29310a2002-12-31 16:33:00 +0000475 for name in missing:
Guido van Rossumd59cde82007-06-12 00:25:08 +0000476 mods = sorted(self.badmodules[name].keys())
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000477 print("?", name, "imported from", ', '.join(mods))
Just van Rossume29310a2002-12-31 16:33:00 +0000478 # Print modules that may be missing, but then again, maybe not...
479 if maybe:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000480 print()
Ezio Melotti30b9d5d2013-08-17 15:50:46 +0300481 print("Submodules that appear to be missing, but could also be", end=' ')
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000482 print("global names in the parent package:")
Just van Rossume29310a2002-12-31 16:33:00 +0000483 for name in maybe:
Guido van Rossumd59cde82007-06-12 00:25:08 +0000484 mods = sorted(self.badmodules[name].keys())
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000485 print("?", name, "imported from", ', '.join(mods))
Guido van Rossum75dc4961998-03-05 03:42:00 +0000486
Guido van Rossum03f7f082001-10-18 19:15:32 +0000487 def any_missing(self):
Just van Rossume29310a2002-12-31 16:33:00 +0000488 """Return a list of modules that appear to be missing. Use
489 any_missing_maybe() if you want to know which modules are
490 certain to be missing, and which *may* be missing.
491 """
492 missing, maybe = self.any_missing_maybe()
493 return missing + maybe
494
495 def any_missing_maybe(self):
496 """Return two lists, one with modules that are certainly missing
497 and one with modules that *may* be missing. The latter names could
498 either be submodules *or* just global names in the package.
499
500 The reason it can't always be determined is that it's impossible to
501 tell which names are imported when "from module import *" is done
502 with an extension module, short of actually importing it.
503 """
Guido van Rossum03f7f082001-10-18 19:15:32 +0000504 missing = []
Just van Rossume29310a2002-12-31 16:33:00 +0000505 maybe = []
506 for name in self.badmodules:
507 if name in self.excludes:
508 continue
509 i = name.rfind(".")
510 if i < 0:
511 missing.append(name)
512 continue
513 subname = name[i+1:]
514 pkgname = name[:i]
515 pkg = self.modules.get(pkgname)
516 if pkg is not None:
517 if pkgname in self.badmodules[name]:
518 # The package tried to import this module itself and
519 # failed. It's definitely missing.
520 missing.append(name)
521 elif subname in pkg.globalnames:
522 # It's a global in the package: definitely not missing.
523 pass
524 elif pkg.starimports:
525 # It could be missing, but the package did an "import *"
526 # from a non-Python module, so we simply can't be sure.
527 maybe.append(name)
528 else:
529 # It's not a global in the package, the package didn't
530 # do funny star imports, it's very likely to be missing.
531 # The symbol could be inserted into the package from the
532 # outside, but since that's not good style we simply list
533 # it missing.
534 missing.append(name)
535 else:
536 missing.append(name)
537 missing.sort()
538 maybe.sort()
539 return missing, maybe
Guido van Rossum03f7f082001-10-18 19:15:32 +0000540
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000541 def replace_paths_in_code(self, co):
542 new_filename = original_filename = os.path.normpath(co.co_filename)
Just van Rossume29310a2002-12-31 16:33:00 +0000543 for f, r in self.replace_paths:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000544 if original_filename.startswith(f):
Just van Rossume29310a2002-12-31 16:33:00 +0000545 new_filename = r + original_filename[len(f):]
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000546 break
547
548 if self.debug and original_filename not in self.processed_paths:
Just van Rossume29310a2002-12-31 16:33:00 +0000549 if new_filename != original_filename:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000550 self.msgout(2, "co_filename %r changed to %r" \
551 % (original_filename,new_filename,))
552 else:
553 self.msgout(2, "co_filename %r remains unchanged" \
554 % (original_filename,))
555 self.processed_paths.append(original_filename)
556
557 consts = list(co.co_consts)
558 for i in range(len(consts)):
559 if isinstance(consts[i], type(co)):
560 consts[i] = self.replace_paths_in_code(consts[i])
561
Berker Peksag0a0d1da2014-07-07 14:58:12 +0300562 return types.CodeType(co.co_argcount, co.co_kwonlyargcount,
563 co.co_nlocals, co.co_stacksize, co.co_flags,
564 co.co_code, tuple(consts), co.co_names,
565 co.co_varnames, new_filename, co.co_name,
566 co.co_firstlineno, co.co_lnotab, co.co_freevars,
567 co.co_cellvars)
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000568
Guido van Rossum75dc4961998-03-05 03:42:00 +0000569
570def test():
571 # Parse command line
572 import getopt
573 try:
Guido van Rossumbaf06031998-08-25 14:06:55 +0000574 opts, args = getopt.getopt(sys.argv[1:], "dmp:qx:")
Guido van Rossumb940e112007-01-10 16:19:56 +0000575 except getopt.error as msg:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000576 print(msg)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000577 return
Guido van Rossum75dc4961998-03-05 03:42:00 +0000578
579 # Process options
580 debug = 1
581 domods = 0
582 addpath = []
Guido van Rossumbaf06031998-08-25 14:06:55 +0000583 exclude = []
Guido van Rossum75dc4961998-03-05 03:42:00 +0000584 for o, a in opts:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000585 if o == '-d':
586 debug = debug + 1
587 if o == '-m':
588 domods = 1
589 if o == '-p':
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000590 addpath = addpath + a.split(os.pathsep)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000591 if o == '-q':
592 debug = 0
Guido van Rossumbaf06031998-08-25 14:06:55 +0000593 if o == '-x':
594 exclude.append(a)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000595
596 # Provide default arguments
597 if not args:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000598 script = "hello.py"
Guido van Rossum75dc4961998-03-05 03:42:00 +0000599 else:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000600 script = args[0]
Guido van Rossum75dc4961998-03-05 03:42:00 +0000601
602 # Set the path based on sys.path and the script directory
603 path = sys.path[:]
604 path[0] = os.path.dirname(script)
605 path = addpath + path
606 if debug > 1:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000607 print("path:")
Guido van Rossum912a14c1998-03-05 04:56:37 +0000608 for item in path:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000609 print(" ", repr(item))
Guido van Rossum75dc4961998-03-05 03:42:00 +0000610
611 # Create the module finder and turn its crank
Guido van Rossumbaf06031998-08-25 14:06:55 +0000612 mf = ModuleFinder(path, debug, exclude)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000613 for arg in args[1:]:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000614 if arg == '-m':
615 domods = 1
616 continue
617 if domods:
618 if arg[-2:] == '.*':
619 mf.import_hook(arg[:-2], None, ["*"])
620 else:
621 mf.import_hook(arg)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000622 else:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000623 mf.load_file(arg)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000624 mf.run_script(script)
625 mf.report()
Just van Rossume29310a2002-12-31 16:33:00 +0000626 return mf # for -i debugging
Guido van Rossum75dc4961998-03-05 03:42:00 +0000627
628
# Script entry point.  The finder is bound to a module-level name so it can
# be inspected afterwards when run with "python -i".
if __name__ == '__main__':
    try:
        mf = test()
    except KeyboardInterrupt:
        # Exit quietly on Ctrl-C instead of dumping a traceback.
        print("\n[interrupted]")