blob: 84ddbdb6ee3df2107b4399ae519e3a7e806b6c00 [file] [log] [blame]
Guido van Rossum75dc4961998-03-05 03:42:00 +00001"""Find modules used by a script, using introspection."""
Thomas Heller919000e2002-11-25 20:21:59 +00002
Guido van Rossum75dc4961998-03-05 03:42:00 +00003import dis
Eric Snow32439d62015-05-02 19:15:18 -06004import importlib._bootstrap_external
Brett Cannon73b969e2012-12-22 19:34:21 -05005import importlib.machinery
Guido van Rossum75dc4961998-03-05 03:42:00 +00006import marshal
7import os
Barryd42e5822020-04-14 20:16:06 +01008import io
Guido van Rossum75dc4961998-03-05 03:42:00 +00009import sys
Christian Heimes45f9af32007-11-27 21:50:00 +000010import types
Brett Cannone4f41de2013-06-16 13:13:40 -040011import warnings
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070012
Guido van Rossum75dc4961998-03-05 03:42:00 +000013
# Opcode numbers the bytecode scanner looks for.
LOAD_CONST, IMPORT_NAME, STORE_NAME, STORE_GLOBAL = (
    dis.opmap[opname]
    for opname in ("LOAD_CONST", "IMPORT_NAME", "STORE_NAME", "STORE_GLOBAL")
)
# The two opcodes treated as "a global name is assigned here".
STORE_OPS = (STORE_NAME, STORE_GLOBAL)
EXTENDED_ARG = dis.EXTENDED_ARG
Guido van Rossum75dc4961998-03-05 03:42:00 +000020
# Old imp constants:
#
# Module "kind" codes.  Each one travels as the second item of the
# (suffix, kind) tuple that _find_module() builds and that
# ModuleFinder.load_module() unpacks.

_SEARCH_ERROR = 0  # loader type not recognised by _find_module()
_PY_SOURCE = 1  # SourceFileLoader: compiled from source and scanned
_PY_COMPILED = 2  # SourcelessFileLoader: unmarshalled bytecode, scanned
_C_EXTENSION = 3  # ExtensionFileLoader: recorded, no code to scan
_PKG_DIRECTORY = 5  # package: handed to ModuleFinder.load_package()
_C_BUILTIN = 6  # BuiltinImporter, or a name in sys.builtin_module_names
_PY_FROZEN = 7  # FrozenImporter
30
# Modulefinder does a good job at simulating Python's import machinery, but
# it cannot handle __path__ modifications packages make at runtime.
# Therefore there is a mechanism whereby you can register extra paths in
# this map for a package, and they will be honored.
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +000035
# Note this is a mapping to lists of paths.
packagePathMap = {}


# A Public interface
def AddPackagePath(packagename, path):
    """Register *path* as an extra search directory for *packagename*.

    The path is appended to the list stored for that package in
    packagePathMap; the list is created on first use.
    """
    try:
        registered = packagePathMap[packagename]
    except KeyError:
        registered = packagePathMap[packagename] = []
    registered.append(path)
Guido van Rossum75dc4961998-03-05 03:42:00 +000042
replacePackageMap = {}

# The ReplacePackage mechanism lets modulefinder work around situations in
# which a package injects itself into sys.modules at runtime under the name
# of another package.  To use it, call
#     ReplacePackage("real_package_name", "faked_package_name")
# before running ModuleFinder.


def ReplacePackage(oldname, newname):
    """Record in replacePackageMap that *oldname* maps to *newname*."""
    replacePackageMap.update({oldname: newname})
53
54
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070055def _find_module(name, path=None):
56 """An importlib reimplementation of imp.find_module (for our purposes)."""
57
58 # It's necessary to clear the caches for our Finder first, in case any
59 # modules are being added/deleted/modified at runtime. In particular,
60 # test_modulefinder.py changes file tree contents in a cache-breaking way:
61
62 importlib.machinery.PathFinder.invalidate_caches()
63
64 spec = importlib.machinery.PathFinder.find_spec(name, path)
65
66 if spec is None:
67 raise ImportError("No module named {name!r}".format(name=name), name=name)
68
69 # Some special cases:
70
71 if spec.loader is importlib.machinery.BuiltinImporter:
Barryd42e5822020-04-14 20:16:06 +010072 return None, None, ("", _C_BUILTIN)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070073
74 if spec.loader is importlib.machinery.FrozenImporter:
Barryd42e5822020-04-14 20:16:06 +010075 return None, None, ("", _PY_FROZEN)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070076
77 file_path = spec.origin
78
79 if spec.loader.is_package(name):
Barryd42e5822020-04-14 20:16:06 +010080 return None, os.path.dirname(file_path), ("", _PKG_DIRECTORY)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070081
82 if isinstance(spec.loader, importlib.machinery.SourceFileLoader):
83 kind = _PY_SOURCE
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070084
85 elif isinstance(spec.loader, importlib.machinery.ExtensionFileLoader):
86 kind = _C_EXTENSION
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070087
88 elif isinstance(spec.loader, importlib.machinery.SourcelessFileLoader):
89 kind = _PY_COMPILED
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070090
91 else: # Should never happen.
Barryd42e5822020-04-14 20:16:06 +010092 return None, None, ("", _SEARCH_ERROR)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070093
Barryd42e5822020-04-14 20:16:06 +010094 file = io.open_code(file_path)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070095 suffix = os.path.splitext(file_path)[-1]
96
Barryd42e5822020-04-14 20:16:06 +010097 return file, file_path, (suffix, kind)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -070098
99
class Module:
    """Record describing one module found by ModuleFinder."""

    def __init__(self, name, file=None, path=None):
        self.__name__ = name
        self.__file__ = file
        self.__path__ = path
        self.__code__ = None
        # Names assigned at global scope in the module, including names
        # that arrived through star-imports of Python modules.  A dict is
        # used as a set here.
        self.globalnames = {}
        # Star-imports this module performed that could not be resolved,
        # i.e. star-imports from a non-Python module.  Also a dict-as-set.
        self.starimports = {}

    def __repr__(self):
        # The file and path are only shown when they have been set.
        shown = [self.__name__]
        shown.extend(
            attr for attr in (self.__file__, self.__path__) if attr is not None
        )
        return "Module(%s)" % ", ".join(map(repr, shown))
Guido van Rossum75dc4961998-03-05 03:42:00 +0000123
Guido van Rossum75dc4961998-03-05 03:42:00 +0000124class ModuleFinder:
125
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700126 def __init__(self, path=None, debug=0, excludes=None, replace_paths=None):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000127 if path is None:
128 path = sys.path
129 self.path = path
130 self.modules = {}
131 self.badmodules = {}
132 self.debug = debug
133 self.indent = 0
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700134 self.excludes = excludes if excludes is not None else []
135 self.replace_paths = replace_paths if replace_paths is not None else []
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000136 self.processed_paths = [] # Used in debugging only
Guido van Rossum75dc4961998-03-05 03:42:00 +0000137
138 def msg(self, level, str, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000139 if level <= self.debug:
140 for i in range(self.indent):
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000141 print(" ", end=' ')
142 print(str, end=' ')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000143 for arg in args:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000144 print(repr(arg), end=' ')
145 print()
Guido van Rossum75dc4961998-03-05 03:42:00 +0000146
147 def msgin(self, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000148 level = args[0]
149 if level <= self.debug:
150 self.indent = self.indent + 1
Guido van Rossum68468eb2003-02-27 20:14:51 +0000151 self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000152
153 def msgout(self, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000154 level = args[0]
155 if level <= self.debug:
156 self.indent = self.indent - 1
Guido van Rossum68468eb2003-02-27 20:14:51 +0000157 self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000158
159 def run_script(self, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000160 self.msg(2, "run_script", pathname)
Barryd42e5822020-04-14 20:16:06 +0100161 with io.open_code(pathname) as fp:
162 stuff = ("", _PY_SOURCE)
Brett Cannon028011f2010-10-30 00:26:48 +0000163 self.load_module('__main__', fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000164
165 def load_file(self, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000166 dir, name = os.path.split(pathname)
167 name, ext = os.path.splitext(name)
Barryd42e5822020-04-14 20:16:06 +0100168 with io.open_code(pathname) as fp:
169 stuff = (ext, _PY_SOURCE)
Brett Cannon028011f2010-10-30 00:26:48 +0000170 self.load_module(name, fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000171
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000172 def import_hook(self, name, caller=None, fromlist=None, level=-1):
173 self.msg(3, "import_hook", name, caller, fromlist, level)
174 parent = self.determine_parent(caller, level=level)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000175 q, tail = self.find_head_package(parent, name)
176 m = self.load_tail(q, tail)
177 if not fromlist:
178 return q
179 if m.__path__:
180 self.ensure_fromlist(m, fromlist)
Thomas Heller318b7b92002-11-26 08:06:50 +0000181 return None
Guido van Rossum75dc4961998-03-05 03:42:00 +0000182
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000183 def determine_parent(self, caller, level=-1):
184 self.msgin(4, "determine_parent", caller, level)
185 if not caller or level == 0:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000186 self.msgout(4, "determine_parent -> None")
187 return None
188 pname = caller.__name__
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000189 if level >= 1: # relative import
190 if caller.__path__:
191 level -= 1
192 if level == 0:
193 parent = self.modules[pname]
194 assert parent is caller
195 self.msgout(4, "determine_parent ->", parent)
196 return parent
197 if pname.count(".") < level:
Collin Winterce36ad82007-08-30 01:19:48 +0000198 raise ImportError("relative importpath too deep")
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000199 pname = ".".join(pname.split(".")[:-level])
200 parent = self.modules[pname]
201 self.msgout(4, "determine_parent ->", parent)
202 return parent
Guido van Rossum912a14c1998-03-05 04:56:37 +0000203 if caller.__path__:
204 parent = self.modules[pname]
205 assert caller is parent
206 self.msgout(4, "determine_parent ->", parent)
207 return parent
208 if '.' in pname:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000209 i = pname.rfind('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000210 pname = pname[:i]
211 parent = self.modules[pname]
212 assert parent.__name__ == pname
213 self.msgout(4, "determine_parent ->", parent)
214 return parent
215 self.msgout(4, "determine_parent -> None")
216 return None
Guido van Rossum75dc4961998-03-05 03:42:00 +0000217
218 def find_head_package(self, parent, name):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000219 self.msgin(4, "find_head_package", parent, name)
220 if '.' in name:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000221 i = name.find('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000222 head = name[:i]
223 tail = name[i+1:]
224 else:
225 head = name
226 tail = ""
227 if parent:
228 qname = "%s.%s" % (parent.__name__, head)
229 else:
230 qname = head
231 q = self.import_module(head, qname, parent)
232 if q:
233 self.msgout(4, "find_head_package ->", (q, tail))
234 return q, tail
235 if parent:
236 qname = head
237 parent = None
238 q = self.import_module(head, qname, parent)
239 if q:
240 self.msgout(4, "find_head_package ->", (q, tail))
241 return q, tail
242 self.msgout(4, "raise ImportError: No module named", qname)
Collin Winterce36ad82007-08-30 01:19:48 +0000243 raise ImportError("No module named " + qname)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000244
245 def load_tail(self, q, tail):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000246 self.msgin(4, "load_tail", q, tail)
247 m = q
248 while tail:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000249 i = tail.find('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000250 if i < 0: i = len(tail)
251 head, tail = tail[:i], tail[i+1:]
252 mname = "%s.%s" % (m.__name__, head)
253 m = self.import_module(head, mname, m)
254 if not m:
255 self.msgout(4, "raise ImportError: No module named", mname)
Collin Winterce36ad82007-08-30 01:19:48 +0000256 raise ImportError("No module named " + mname)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000257 self.msgout(4, "load_tail ->", m)
258 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000259
260 def ensure_fromlist(self, m, fromlist, recursive=0):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000261 self.msg(4, "ensure_fromlist", m, fromlist, recursive)
262 for sub in fromlist:
263 if sub == "*":
264 if not recursive:
265 all = self.find_all_submodules(m)
266 if all:
267 self.ensure_fromlist(m, all, 1)
268 elif not hasattr(m, sub):
269 subname = "%s.%s" % (m.__name__, sub)
270 submod = self.import_module(sub, subname, m)
271 if not submod:
Collin Winterce36ad82007-08-30 01:19:48 +0000272 raise ImportError("No module named " + subname)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000273
274 def find_all_submodules(self, m):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000275 if not m.__path__:
276 return
277 modules = {}
Brett Cannonf299abd2015-04-13 14:21:02 -0400278 # 'suffixes' used to be a list hardcoded to [".py", ".pyc"].
Thomas Helleraaf1c8d2003-11-14 10:28:42 +0000279 # But we must also collect Python extension modules - although
280 # we cannot separate normal dlls from Python extensions.
281 suffixes = []
Brett Cannoncb66eb02012-05-11 12:58:42 -0400282 suffixes += importlib.machinery.EXTENSION_SUFFIXES[:]
283 suffixes += importlib.machinery.SOURCE_SUFFIXES[:]
284 suffixes += importlib.machinery.BYTECODE_SUFFIXES[:]
Guido van Rossum912a14c1998-03-05 04:56:37 +0000285 for dir in m.__path__:
286 try:
287 names = os.listdir(dir)
Andrew Svetlovad28c7f2012-12-18 22:02:39 +0200288 except OSError:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000289 self.msg(2, "can't list directory", dir)
290 continue
291 for name in names:
292 mod = None
293 for suff in suffixes:
294 n = len(suff)
295 if name[-n:] == suff:
296 mod = name[:-n]
297 break
298 if mod and mod != "__init__":
299 modules[mod] = mod
300 return modules.keys()
Guido van Rossum75dc4961998-03-05 03:42:00 +0000301
302 def import_module(self, partname, fqname, parent):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000303 self.msgin(3, "import_module", partname, fqname, parent)
304 try:
305 m = self.modules[fqname]
306 except KeyError:
307 pass
308 else:
309 self.msgout(3, "import_module ->", m)
310 return m
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000311 if fqname in self.badmodules:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000312 self.msgout(3, "import_module -> None")
313 return None
Thomas Heller2e7c8322004-05-11 15:10:59 +0000314 if parent and parent.__path__ is None:
315 self.msgout(3, "import_module -> None")
316 return None
Guido van Rossum912a14c1998-03-05 04:56:37 +0000317 try:
318 fp, pathname, stuff = self.find_module(partname,
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000319 parent and parent.__path__, parent)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000320 except ImportError:
321 self.msgout(3, "import_module ->", None)
322 return None
323 try:
324 m = self.load_module(fqname, fp, pathname, stuff)
325 finally:
Éric Araujo1e3a68d2011-07-28 23:35:29 +0200326 if fp:
327 fp.close()
Guido van Rossum912a14c1998-03-05 04:56:37 +0000328 if parent:
329 setattr(parent, partname, m)
330 self.msgout(3, "import_module ->", m)
331 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000332
Guido van Rossum1bc535d2007-05-15 18:46:22 +0000333 def load_module(self, fqname, fp, pathname, file_info):
Barryd42e5822020-04-14 20:16:06 +0100334 suffix, type = file_info
Guido van Rossum912a14c1998-03-05 04:56:37 +0000335 self.msgin(2, "load_module", fqname, fp and "fp", pathname)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700336 if type == _PKG_DIRECTORY:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000337 m = self.load_package(fqname, pathname)
338 self.msgout(2, "load_module ->", m)
339 return m
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700340 if type == _PY_SOURCE:
Barryd42e5822020-04-14 20:16:06 +0100341 co = compile(fp.read()+b'\n', pathname, 'exec')
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700342 elif type == _PY_COMPILED:
Brett Cannon0f384782014-02-28 10:50:34 -0500343 try:
Benjamin Peterson42aa93b2017-12-09 10:26:52 -0800344 data = fp.read()
345 importlib._bootstrap_external._classify_pyc(data, fqname, {})
Brett Cannon0f384782014-02-28 10:50:34 -0500346 except ImportError as exc:
347 self.msgout(2, "raise ImportError: " + str(exc), pathname)
348 raise
Benjamin Peterson42aa93b2017-12-09 10:26:52 -0800349 co = marshal.loads(memoryview(data)[16:])
Guido van Rossum912a14c1998-03-05 04:56:37 +0000350 else:
351 co = None
352 m = self.add_module(fqname)
Guido van Rossumab045f91998-03-06 19:55:10 +0000353 m.__file__ = pathname
Guido van Rossum912a14c1998-03-05 04:56:37 +0000354 if co:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000355 if self.replace_paths:
356 co = self.replace_paths_in_code(co)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000357 m.__code__ = co
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000358 self.scan_code(co, m)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000359 self.msgout(2, "load_module ->", m)
360 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000361
Just van Rossume29310a2002-12-31 16:33:00 +0000362 def _add_badmodule(self, name, caller):
363 if name not in self.badmodules:
364 self.badmodules[name] = {}
Benjamin Petersonc0747cf2008-11-03 20:31:38 +0000365 if caller:
366 self.badmodules[name][caller.__name__] = 1
367 else:
368 self.badmodules[name]["-"] = 1
Just van Rossume29310a2002-12-31 16:33:00 +0000369
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000370 def _safe_import_hook(self, name, caller, fromlist, level=-1):
Just van Rossume29310a2002-12-31 16:33:00 +0000371 # wrapper for self.import_hook() that won't raise ImportError
372 if name in self.badmodules:
373 self._add_badmodule(name, caller)
374 return
375 try:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000376 self.import_hook(name, caller, level=level)
Guido van Rossumb940e112007-01-10 16:19:56 +0000377 except ImportError as msg:
Just van Rossume29310a2002-12-31 16:33:00 +0000378 self.msg(2, "ImportError:", str(msg))
379 self._add_badmodule(name, caller)
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700380 except SyntaxError as msg:
381 self.msg(2, "SyntaxError:", str(msg))
382 self._add_badmodule(name, caller)
Just van Rossume29310a2002-12-31 16:33:00 +0000383 else:
384 if fromlist:
385 for sub in fromlist:
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700386 fullname = name + "." + sub
387 if fullname in self.badmodules:
388 self._add_badmodule(fullname, caller)
Just van Rossume29310a2002-12-31 16:33:00 +0000389 continue
390 try:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000391 self.import_hook(name, caller, [sub], level=level)
Guido van Rossumb940e112007-01-10 16:19:56 +0000392 except ImportError as msg:
Just van Rossume29310a2002-12-31 16:33:00 +0000393 self.msg(2, "ImportError:", str(msg))
Just van Rossume29310a2002-12-31 16:33:00 +0000394 self._add_badmodule(fullname, caller)
395
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300396 def scan_opcodes(self, co):
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000397 # Scan the code, and yield 'interesting' opcode combinations
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000398 code = co.co_code
399 names = co.co_names
400 consts = co.co_consts
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300401 opargs = [(op, arg) for _, op, arg in dis._unpack_opargs(code)
402 if op != EXTENDED_ARG]
403 for i, (op, oparg) in enumerate(opargs):
404 if op in STORE_OPS:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000405 yield "store", (names[oparg],)
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000406 continue
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300407 if (op == IMPORT_NAME and i >= 2
408 and opargs[i-1][0] == opargs[i-2][0] == LOAD_CONST):
409 level = consts[opargs[i-2][1]]
410 fromlist = consts[opargs[i-1][1]]
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000411 if level == 0: # absolute import
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300412 yield "absolute_import", (fromlist, names[oparg])
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000413 else: # relative import
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300414 yield "relative_import", (level, fromlist, names[oparg])
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000415 continue
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000416
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000417 def scan_code(self, co, m):
418 code = co.co_code
Serhiy Storchaka02d9f5e2016-05-08 23:43:50 +0300419 scanner = self.scan_opcodes
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000420 for what, args in scanner(co):
421 if what == "store":
422 name, = args
423 m.globalnames[name] = 1
424 elif what == "absolute_import":
425 fromlist, name = args
Just van Rossume29310a2002-12-31 16:33:00 +0000426 have_star = 0
427 if fromlist is not None:
428 if "*" in fromlist:
429 have_star = 1
430 fromlist = [f for f in fromlist if f != "*"]
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000431 self._safe_import_hook(name, m, fromlist, level=0)
Just van Rossume29310a2002-12-31 16:33:00 +0000432 if have_star:
433 # We've encountered an "import *". If it is a Python module,
434 # the code has already been parsed and we can suck out the
435 # global names.
436 mm = None
437 if m.__path__:
438 # At this point we don't know whether 'name' is a
439 # submodule of 'm' or a global module. Let's just try
440 # the full name first.
441 mm = self.modules.get(m.__name__ + "." + name)
442 if mm is None:
443 mm = self.modules.get(name)
444 if mm is not None:
445 m.globalnames.update(mm.globalnames)
446 m.starimports.update(mm.starimports)
447 if mm.__code__ is None:
448 m.starimports[name] = 1
449 else:
450 m.starimports[name] = 1
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000451 elif what == "relative_import":
452 level, fromlist, name = args
453 if name:
454 self._safe_import_hook(name, m, fromlist, level=level)
455 else:
456 parent = self.determine_parent(m, level=level)
457 self._safe_import_hook(parent.__name__, None, fromlist, level=0)
458 else:
459 # We don't expect anything else from the generator.
460 raise RuntimeError(what)
461
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000462 for c in co.co_consts:
463 if isinstance(c, type(co)):
464 self.scan_code(c, m)
465
Guido van Rossum75dc4961998-03-05 03:42:00 +0000466 def load_package(self, fqname, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000467 self.msgin(2, "load_package", fqname, pathname)
Thomas Hellerc7aaf952002-11-14 18:45:11 +0000468 newname = replacePackageMap.get(fqname)
469 if newname:
470 fqname = newname
Guido van Rossum912a14c1998-03-05 04:56:37 +0000471 m = self.add_module(fqname)
472 m.__file__ = pathname
473 m.__path__ = [pathname]
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +0000474
Guido van Rossume7e632a1998-09-14 16:02:28 +0000475 # As per comment at top of file, simulate runtime __path__ additions.
476 m.__path__ = m.__path__ + packagePathMap.get(fqname, [])
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +0000477
Guido van Rossum912a14c1998-03-05 04:56:37 +0000478 fp, buf, stuff = self.find_module("__init__", m.__path__)
Brett Cannon028011f2010-10-30 00:26:48 +0000479 try:
480 self.load_module(fqname, fp, buf, stuff)
481 self.msgout(2, "load_package ->", m)
482 return m
483 finally:
484 if fp:
485 fp.close()
Guido van Rossum75dc4961998-03-05 03:42:00 +0000486
487 def add_module(self, fqname):
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000488 if fqname in self.modules:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000489 return self.modules[fqname]
490 self.modules[fqname] = m = Module(fqname)
491 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000492
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000493 def find_module(self, name, path, parent=None):
494 if parent is not None:
Thomas Heller2e7c8322004-05-11 15:10:59 +0000495 # assert path is not None
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000496 fullname = parent.__name__+'.'+name
Guido van Rossum03f7f082001-10-18 19:15:32 +0000497 else:
498 fullname = name
499 if fullname in self.excludes:
500 self.msgout(3, "find_module -> Excluded", fullname)
Collin Winterce36ad82007-08-30 01:19:48 +0000501 raise ImportError(name)
Guido van Rossum78fc3631998-03-20 17:37:24 +0000502
Guido van Rossum912a14c1998-03-05 04:56:37 +0000503 if path is None:
504 if name in sys.builtin_module_names:
Barryd42e5822020-04-14 20:16:06 +0100505 return (None, None, ("", _C_BUILTIN))
Guido van Rossum78fc3631998-03-20 17:37:24 +0000506
Guido van Rossum912a14c1998-03-05 04:56:37 +0000507 path = self.path
Brandt Bucher9d7b2c02019-04-07 01:00:41 -0700508
509 return _find_module(name, path)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000510
511 def report(self):
Just van Rossume29310a2002-12-31 16:33:00 +0000512 """Print a report to stdout, listing the found modules with their
513 paths, as well as modules that are missing, or seem to be missing.
514 """
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000515 print()
516 print(" %-25s %s" % ("Name", "File"))
517 print(" %-25s %s" % ("----", "----"))
Guido van Rossum912a14c1998-03-05 04:56:37 +0000518 # Print modules found
Guido van Rossumd59cde82007-06-12 00:25:08 +0000519 keys = sorted(self.modules.keys())
Guido van Rossum912a14c1998-03-05 04:56:37 +0000520 for key in keys:
521 m = self.modules[key]
522 if m.__path__:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000523 print("P", end=' ')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000524 else:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000525 print("m", end=' ')
526 print("%-25s" % key, m.__file__ or "")
Guido van Rossum75dc4961998-03-05 03:42:00 +0000527
Guido van Rossum912a14c1998-03-05 04:56:37 +0000528 # Print missing modules
Just van Rossume29310a2002-12-31 16:33:00 +0000529 missing, maybe = self.any_missing_maybe()
530 if missing:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000531 print()
532 print("Missing modules:")
Just van Rossume29310a2002-12-31 16:33:00 +0000533 for name in missing:
Guido van Rossumd59cde82007-06-12 00:25:08 +0000534 mods = sorted(self.badmodules[name].keys())
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000535 print("?", name, "imported from", ', '.join(mods))
Just van Rossume29310a2002-12-31 16:33:00 +0000536 # Print modules that may be missing, but then again, maybe not...
537 if maybe:
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000538 print()
Ezio Melotti30b9d5d2013-08-17 15:50:46 +0300539 print("Submodules that appear to be missing, but could also be", end=' ')
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000540 print("global names in the parent package:")
Just van Rossume29310a2002-12-31 16:33:00 +0000541 for name in maybe:
Guido van Rossumd59cde82007-06-12 00:25:08 +0000542 mods = sorted(self.badmodules[name].keys())
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000543 print("?", name, "imported from", ', '.join(mods))
Guido van Rossum75dc4961998-03-05 03:42:00 +0000544
Guido van Rossum03f7f082001-10-18 19:15:32 +0000545 def any_missing(self):
Just van Rossume29310a2002-12-31 16:33:00 +0000546 """Return a list of modules that appear to be missing. Use
547 any_missing_maybe() if you want to know which modules are
548 certain to be missing, and which *may* be missing.
549 """
550 missing, maybe = self.any_missing_maybe()
551 return missing + maybe
552
553 def any_missing_maybe(self):
554 """Return two lists, one with modules that are certainly missing
555 and one with modules that *may* be missing. The latter names could
556 either be submodules *or* just global names in the package.
557
558 The reason it can't always be determined is that it's impossible to
559 tell which names are imported when "from module import *" is done
560 with an extension module, short of actually importing it.
561 """
Guido van Rossum03f7f082001-10-18 19:15:32 +0000562 missing = []
Just van Rossume29310a2002-12-31 16:33:00 +0000563 maybe = []
564 for name in self.badmodules:
565 if name in self.excludes:
566 continue
567 i = name.rfind(".")
568 if i < 0:
569 missing.append(name)
570 continue
571 subname = name[i+1:]
572 pkgname = name[:i]
573 pkg = self.modules.get(pkgname)
574 if pkg is not None:
575 if pkgname in self.badmodules[name]:
576 # The package tried to import this module itself and
577 # failed. It's definitely missing.
578 missing.append(name)
579 elif subname in pkg.globalnames:
580 # It's a global in the package: definitely not missing.
581 pass
582 elif pkg.starimports:
583 # It could be missing, but the package did an "import *"
584 # from a non-Python module, so we simply can't be sure.
585 maybe.append(name)
586 else:
587 # It's not a global in the package, the package didn't
588 # do funny star imports, it's very likely to be missing.
589 # The symbol could be inserted into the package from the
590 # outside, but since that's not good style we simply list
591 # it missing.
592 missing.append(name)
593 else:
594 missing.append(name)
595 missing.sort()
596 maybe.sort()
597 return missing, maybe
Guido van Rossum03f7f082001-10-18 19:15:32 +0000598
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000599 def replace_paths_in_code(self, co):
600 new_filename = original_filename = os.path.normpath(co.co_filename)
Just van Rossume29310a2002-12-31 16:33:00 +0000601 for f, r in self.replace_paths:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000602 if original_filename.startswith(f):
Just van Rossume29310a2002-12-31 16:33:00 +0000603 new_filename = r + original_filename[len(f):]
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000604 break
605
606 if self.debug and original_filename not in self.processed_paths:
Just van Rossume29310a2002-12-31 16:33:00 +0000607 if new_filename != original_filename:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000608 self.msgout(2, "co_filename %r changed to %r" \
609 % (original_filename,new_filename,))
610 else:
611 self.msgout(2, "co_filename %r remains unchanged" \
612 % (original_filename,))
613 self.processed_paths.append(original_filename)
614
615 consts = list(co.co_consts)
616 for i in range(len(consts)):
617 if isinstance(consts[i], type(co)):
618 consts[i] = self.replace_paths_in_code(consts[i])
619
Victor Stinnera9f05d62019-05-24 23:57:23 +0200620 return co.replace(co_consts=tuple(consts), co_filename=new_filename)
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000621
Guido van Rossum75dc4961998-03-05 03:42:00 +0000622
def test():
    """Command-line driver: analyse a script and print the report.

    Options: -d raises the debug level, -q silences it, -m treats the
    following arguments as module names, -p adds os.pathsep-separated
    search directories, -x excludes a module.  The first positional
    argument is the script (default "hello.py"); the remaining ones are
    extra files or modules to load.  Returns the ModuleFinder, or None when
    the options cannot be parsed.
    """
    # Parse command line
    import getopt
    try:
        opts, args = getopt.getopt(sys.argv[1:], "dmp:qx:")
    except getopt.error as msg:
        print(msg)
        return

    # Process options
    debug = 1
    domods = 0
    addpath = []
    exclude = []
    for opt, value in opts:
        if opt == '-d':
            debug += 1
        elif opt == '-m':
            domods = 1
        elif opt == '-p':
            addpath.extend(value.split(os.pathsep))
        elif opt == '-q':
            debug = 0
        elif opt == '-x':
            exclude.append(value)

    # Provide default arguments
    script = args[0] if args else "hello.py"

    # Set the path based on sys.path and the script directory
    path = sys.path[:]
    path[0] = os.path.dirname(script)
    path = addpath + path
    if debug > 1:
        print("path:")
        for item in path:
            print(" ", repr(item))

    # Create the module finder and turn its crank
    mf = ModuleFinder(path, debug, exclude)
    for arg in args[1:]:
        if arg == '-m':
            domods = 1
        elif not domods:
            mf.load_file(arg)
        elif arg.endswith('.*'):
            mf.import_hook(arg[:-2], None, ["*"])
        else:
            mf.import_hook(arg)
    mf.run_script(script)
    mf.report()
    return mf  # for -i debugging
Guido van Rossum75dc4961998-03-05 03:42:00 +0000680
681
if __name__ == '__main__':
    # Keep the finder returned by test() bound at module level so it can be
    # inspected after the run (test() returns it "for -i debugging").
    # An interrupt prints a short notice instead of a traceback.
    try:
        mf = test()
    except KeyboardInterrupt:
        print("\n[interrupted]")