blob: 989172aa8f6861080c6b0dd4075c49803e8ce9d6 [file] [log] [blame]
Guido van Rossum75dc4961998-03-05 03:42:00 +00001"""Find modules used by a script, using introspection."""
Just van Rossuma920a882003-07-18 15:31:40 +00002# This module should be kept compatible with Python 2.2, see PEP 291.
Thomas Heller919000e2002-11-25 20:21:59 +00003
Guido van Rossumfc2a0a82006-10-27 23:06:01 +00004from __future__ import generators
Guido van Rossum75dc4961998-03-05 03:42:00 +00005import dis
6import imp
7import marshal
8import os
Guido van Rossum75dc4961998-03-05 03:42:00 +00009import sys
Christian Heimes45f9af32007-11-27 21:50:00 +000010import types
Guido van Rossumfc2a0a82006-10-27 23:06:01 +000011import struct
Guido van Rossum75dc4961998-03-05 03:42:00 +000012
# Mode used to open Python source files.  Python 3 text mode already
# translates universal newlines, so plain "r" behaves like the legacy "U"
# flag; "U" itself is rejected by open() on recent Python versions.
READ_MODE = "r"
18
# Opcodes of interest, each stored as a length-1 bytes object so that it can
# be compared directly against one-byte pieces of a code object's co_code.
LOAD_CONST = bytes([dis.opmap['LOAD_CONST']])
IMPORT_NAME = bytes([dis.opmap['IMPORT_NAME']])
STORE_NAME = bytes([dis.opmap['STORE_NAME']])
STORE_GLOBAL = bytes([dis.opmap['STORE_GLOBAL']])
# Opcodes that bind a name at module level.
STORE_OPS = [STORE_NAME, STORE_GLOBAL]
# Opcodes at or above this value carry an argument.
HAVE_ARGUMENT = bytes([dis.HAVE_ARGUMENT])
Guido van Rossum75dc4961998-03-05 03:42:00 +000026
# Modulefinder does a good job of simulating Python's import machinery, but
# it cannot handle __path__ modifications that packages make at runtime.
# Therefore there is a mechanism whereby you can register extra paths in this
# map for a package, and they will be honored.
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +000031
# Note that this maps a package name to a list of extra paths.
packagePathMap = {}

# A Public interface
def AddPackagePath(packagename, path):
    """Register *path* as an additional search path for *packagename*.

    Paths accumulate in packagePathMap in the order they are added.
    """
    packagePathMap.setdefault(packagename, []).append(path)
Guido van Rossum75dc4961998-03-05 03:42:00 +000040
# Maps the real name of a package to the name it should be recorded under.
replacePackageMap = {}


def ReplacePackage(oldname, newname):
    """Record that package *oldname* should be registered as *newname*.

    This mechanism allows modulefinder to work around the way the _xmlplus
    package injects itself under the name "xml" into sys.modules at runtime:
    call ReplacePackage("_xmlplus", "xml") before running ModuleFinder.
    """
    replacePackageMap[oldname] = newname
50
51
class Module:
    """Lightweight record describing one module found by ModuleFinder."""

    def __init__(self, name, file=None, path=None):
        """Create a record for module *name* with optional file and path."""
        self.__name__ = name
        self.__file__ = file
        self.__path__ = path
        self.__code__ = None
        # Global names assigned to in the module, including names imported
        # through star-imports of Python modules.  Used as a set.
        self.globalnames = {}
        # Star-imports this module performed that could not be resolved,
        # i.e. a star-import from a non-Python module.  Used as a set.
        self.starimports = {}

    def __repr__(self):
        """Return "Module(name[, file][, path])", omitting None fields."""
        shown = [self.__name__]
        for optional in (self.__file__, self.__path__):
            if optional is not None:
                shown.append(optional)
        return "Module(" + ", ".join([repr(item) for item in shown]) + ")"
Guido van Rossum75dc4961998-03-05 03:42:00 +000075
Guido van Rossum75dc4961998-03-05 03:42:00 +000076class ModuleFinder:
77
Just van Rossume29310a2002-12-31 16:33:00 +000078 def __init__(self, path=None, debug=0, excludes=[], replace_paths=[]):
Guido van Rossum912a14c1998-03-05 04:56:37 +000079 if path is None:
80 path = sys.path
81 self.path = path
82 self.modules = {}
83 self.badmodules = {}
84 self.debug = debug
85 self.indent = 0
Guido van Rossum78fc3631998-03-20 17:37:24 +000086 self.excludes = excludes
Guido van Rossum6b767ac2001-03-20 20:43:34 +000087 self.replace_paths = replace_paths
88 self.processed_paths = [] # Used in debugging only
Guido van Rossum75dc4961998-03-05 03:42:00 +000089
def msg(self, level, str, *args):
    """Print a debug line if *level* does not exceed self.debug.

    The line consists of one indentation marker per self.indent level, the
    text *str*, and the repr() of every extra argument; each piece is
    followed by a single space.
    """
    if level > self.debug:
        return
    pieces = [" "] * self.indent
    pieces.append(str)
    pieces.extend(repr(arg) for arg in args)
    # Every piece is followed by one space, then the line is terminated.
    print(*pieces, end=" \n")
Guido van Rossum75dc4961998-03-05 03:42:00 +000098
def msgin(self, *args):
    """Increase the indentation by one level, then emit the message.

    args[0] is the debug level; nothing happens when it exceeds self.debug.
    All arguments are forwarded unchanged to msg().
    """
    if args[0] > self.debug:
        return
    self.indent += 1
    self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000104
def msgout(self, *args):
    """Decrease the indentation by one level, then emit the message.

    args[0] is the debug level; nothing happens when it exceeds self.debug.
    All arguments are forwarded unchanged to msg().
    """
    if args[0] > self.debug:
        return
    self.indent -= 1
    self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000110
def run_script(self, pathname):
    """Load the Python source file *pathname* as the module '__main__'.

    The file is opened with READ_MODE and handed to load_module(); it is
    closed again when loading finishes, whether or not loading succeeded.
    """
    self.msg(2, "run_script", pathname)
    stuff = ("", "r", imp.PY_SOURCE)
    with open(pathname, READ_MODE) as fp:
        self.load_module('__main__', fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000116
def load_file(self, pathname):
    """Load the Python source file *pathname* as a module.

    The module name is the file's base name without its extension.  The
    file is opened with READ_MODE and closed again when loading finishes,
    whether or not loading succeeded.
    """
    dir, name = os.path.split(pathname)
    name, ext = os.path.splitext(name)
    stuff = (ext, "r", imp.PY_SOURCE)
    with open(pathname, READ_MODE) as fp:
        self.load_module(name, fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000123
def import_hook(self, name, caller=None, fromlist=None, level=-1):
    """Simulate importing the (possibly dotted) module *name*.

    caller   -- module performing the import, or None.
    fromlist -- names requested by a "from ... import" statement, if any.
    level    -- relative-import level passed on to determine_parent().

    Returns the head package when *fromlist* is empty, otherwise None.
    ImportError raised by the helper methods propagates to the caller.
    """
    self.msg(3, "import_hook", name, caller, fromlist, level)
    parent = self.determine_parent(caller, level=level)
    head_pkg, remainder = self.find_head_package(parent, name)
    leaf = self.load_tail(head_pkg, remainder)
    if not fromlist:
        return head_pkg
    # Only packages can supply submodules for the names in fromlist.
    if leaf.__path__:
        self.ensure_fromlist(leaf, fromlist)
    return None
Guido van Rossum75dc4961998-03-05 03:42:00 +0000134
def determine_parent(self, caller, level=-1):
    """Return the package that imports made by *caller* are relative to.

    Returns None when there is no caller, when *level* is 0 (absolute
    import), or when the caller is a top-level non-package module imported
    with a negative level.  For level >= 1 the result is the package found
    by walking up that many levels from the caller (a package counts as its
    own first level); ImportError is raised when the walk would leave the
    top-level package.
    """
    self.msgin(4, "determine_parent", caller, level)
    if not caller or level == 0:
        self.msgout(4, "determine_parent -> None")
        return None
    modname = caller.__name__
    if level >= 1:
        # Explicit relative import.
        if caller.__path__:
            # A package is its own innermost level.
            level -= 1
        if level == 0:
            found = self.modules[modname]
            assert found is caller
        else:
            if modname.count(".") < level:
                raise ImportError("relative importpath too deep")
            found = self.modules[".".join(modname.split(".")[:-level])]
    elif caller.__path__:
        # The caller is a package: it is its own parent.
        found = self.modules[modname]
        assert caller is found
    elif '.' in modname:
        # The caller is a submodule: its parent is the containing package.
        pkgname = modname.rpartition('.')[0]
        found = self.modules[pkgname]
        assert found.__name__ == pkgname
    else:
        self.msgout(4, "determine_parent -> None")
        return None
    self.msgout(4, "determine_parent ->", found)
    return found
Guido van Rossum75dc4961998-03-05 03:42:00 +0000169
def find_head_package(self, parent, name):
    """Import the first component of the dotted *name*.

    The component is first looked up relative to *parent* (when given) and
    then as a top-level module.  Returns (module, tail), where tail is the
    rest of *name* after the first dot ("" if there is none).  Raises
    ImportError when neither lookup succeeds.
    """
    self.msgin(4, "find_head_package", parent, name)
    head, _sep, tail = name.partition('.')
    if parent:
        qname = "%s.%s" % (parent.__name__, head)
    else:
        qname = head
    q = self.import_module(head, qname, parent)
    if not q and parent:
        # Not found inside the parent package: retry as a top-level module.
        qname = head
        q = self.import_module(head, qname, None)
    if q:
        self.msgout(4, "find_head_package ->", (q, tail))
        return q, tail
    self.msgout(4, "raise ImportError: No module named", qname)
    raise ImportError("No module named " + qname)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000196
def load_tail(self, q, tail):
    """Import each remaining dotted component of *tail* below module *q*.

    Returns the module for the last component (or *q* itself when *tail* is
    empty).  Raises ImportError as soon as one component cannot be imported.
    """
    self.msgin(4, "load_tail", q, tail)
    current = q
    while tail:
        # Peel off the next component; the rest stays in tail.
        head, _sep, tail = tail.partition('.')
        mname = "%s.%s" % (current.__name__, head)
        current = self.import_module(head, mname, current)
        if not current:
            self.msgout(4, "raise ImportError: No module named", mname)
            raise ImportError("No module named " + mname)
    self.msgout(4, "load_tail ->", current)
    return current
Guido van Rossum75dc4961998-03-05 03:42:00 +0000211
def ensure_fromlist(self, m, fromlist, recursive=0):
    """Import every name in *fromlist* that is not yet an attribute of *m*.

    A "*" entry expands to all submodules reported by
    find_all_submodules(); the expansion is done only once (*recursive* is
    set on the nested call).  Raises ImportError when a requested name
    cannot be imported as a submodule of *m*.
    """
    self.msg(4, "ensure_fromlist", m, fromlist, recursive)
    for sub in fromlist:
        if sub == "*":
            if recursive:
                continue
            submodules = self.find_all_submodules(m)
            if submodules:
                self.ensure_fromlist(m, submodules, 1)
            continue
        if hasattr(m, sub):
            continue
        subname = "%s.%s" % (m.__name__, sub)
        if not self.import_module(sub, subname, m):
            raise ImportError("No module named " + subname)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000225
def find_all_submodules(self, m):
    """Return the names of all potential submodules of package *m*.

    Every directory in m.__path__ is listed and each entry whose name ends
    with one of the suffixes from imp.get_suffixes() contributes its stem;
    "__init__" is skipped.  Returns None when *m* has no __path__,
    otherwise the keys view of the collected names.
    """
    if not m.__path__:
        return
    # 'suffixes' used to be a list hardcoded to [".py", ".pyc", ".pyo"].
    # But we must also collect Python extension modules - although
    # we cannot separate normal dlls from Python extensions.
    suffixes = [info[0] for info in imp.get_suffixes()]
    found = {}
    for directory in m.__path__:
        try:
            entries = os.listdir(directory)
        except os.error:
            self.msg(2, "can't list directory", directory)
            continue
        for entry in entries:
            for suffix in suffixes:
                width = len(suffix)
                if entry[-width:] == suffix:
                    # Only the first matching suffix is considered.
                    stem = entry[:-width]
                    if stem and stem != "__init__":
                        found[stem] = stem
                    break
    return found.keys()
Guido van Rossum75dc4961998-03-05 03:42:00 +0000252
def import_module(self, partname, fqname, parent):
    """Locate and load one module, returning its record or None.

    partname -- last component of the module name.
    fqname   -- fully qualified name, used as key in self.modules.
    parent   -- package record the module lives in, or None.

    A module already in self.modules is returned as is.  None is returned
    when the name is already known to be bad, when *parent* is not a
    package, or when find_module() raises ImportError.  On success the
    module is also set as attribute *partname* on *parent*.
    """
    self.msgin(3, "import_module", partname, fqname, parent)
    if fqname in self.modules:
        known = self.modules[fqname]
        self.msgout(3, "import_module ->", known)
        return known
    if fqname in self.badmodules or (parent and parent.__path__ is None):
        self.msgout(3, "import_module -> None")
        return None
    search_path = parent.__path__ if parent else parent
    try:
        fp, pathname, stuff = self.find_module(partname, search_path, parent)
    except ImportError:
        self.msgout(3, "import_module ->", None)
        return None
    try:
        loaded = self.load_module(fqname, fp, pathname, stuff)
    finally:
        # find_module() may return no file object (fp can be None).
        if fp:
            fp.close()
    if parent:
        setattr(parent, partname, loaded)
    self.msgout(3, "import_module ->", loaded)
    return loaded
Guido van Rossum75dc4961998-03-05 03:42:00 +0000282
def load_module(self, fqname, fp, pathname, file_info):
    """Create the record for module *fqname* and scan its code, if any.

    file_info is a (suffix, mode, type) triple.  Package directories are
    delegated to load_package(); source files are compiled, compiled files
    are unmarshalled after checking the magic number, and any other type is
    recorded without code.  Raises ImportError for a compiled file whose
    magic number does not match imp.get_magic().
    """
    suffix, mode, kind = file_info
    self.msgin(2, "load_module", fqname, fp and "fp", pathname)
    if kind == imp.PKG_DIRECTORY:
        package = self.load_package(fqname, pathname)
        self.msgout(2, "load_module ->", package)
        return package
    co = None
    if kind == imp.PY_SOURCE:
        co = compile(fp.read()+'\n', pathname, 'exec')
    elif kind == imp.PY_COMPILED:
        if fp.read(4) != imp.get_magic():
            self.msgout(2, "raise ImportError: Bad magic number", pathname)
            raise ImportError("Bad magic number in %s" % pathname)
        # Skip the next four header bytes (presumably the source
        # timestamp) so that the marshalled code object comes next.
        fp.read(4)
        co = marshal.load(fp)
    m = self.add_module(fqname)
    m.__file__ = pathname
    if co:
        if self.replace_paths:
            co = self.replace_paths_in_code(co)
        m.__code__ = co
        self.scan_code(co, m)
    self.msgout(2, "load_module ->", m)
    return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000309
Just van Rossume29310a2002-12-31 16:33:00 +0000310 def _add_badmodule(self, name, caller):
311 if name not in self.badmodules:
312 self.badmodules[name] = {}
Benjamin Petersonc0747cf2008-11-03 20:31:38 +0000313 if caller:
314 self.badmodules[name][caller.__name__] = 1
315 else:
316 self.badmodules[name]["-"] = 1
Just van Rossume29310a2002-12-31 16:33:00 +0000317
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000318 def _safe_import_hook(self, name, caller, fromlist, level=-1):
Just van Rossume29310a2002-12-31 16:33:00 +0000319 # wrapper for self.import_hook() that won't raise ImportError
320 if name in self.badmodules:
321 self._add_badmodule(name, caller)
322 return
323 try:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000324 self.import_hook(name, caller, level=level)
Guido van Rossumb940e112007-01-10 16:19:56 +0000325 except ImportError as msg:
Just van Rossume29310a2002-12-31 16:33:00 +0000326 self.msg(2, "ImportError:", str(msg))
327 self._add_badmodule(name, caller)
328 else:
329 if fromlist:
330 for sub in fromlist:
331 if sub in self.badmodules:
332 self._add_badmodule(sub, caller)
333 continue
334 try:
Guido van Rossumfc2a0a82006-10-27 23:06:01 +0000335 self.import_hook(name, caller, [sub], level=level)
Guido van Rossumb940e112007-01-10 16:19:56 +0000336 except ImportError as msg:
Just van Rossume29310a2002-12-31 16:33:00 +0000337 self.msg(2, "ImportError:", str(msg))
338 fullname = name + "." + sub
339 self._add_badmodule(fullname, caller)
340
def scan_opcodes(self, co,
                 unpack = struct.unpack):
    """Yield the 'interesting' opcode combinations found in *co*.

    Version for Python 2.4 and older.  Yields ("store", (name,)) for every
    STORE_NAME / STORE_GLOBAL and ("import", (fromlist, name)) for every
    LOAD_CONST immediately followed by IMPORT_NAME.  Instructions with an
    argument are taken to be three bytes long (opcode plus a 16-bit
    little-endian operand).

    Indexing a bytes object yields an int, so the current opcode is
    re-wrapped as a length-1 bytes object before it is compared with the
    module's bytes-valued opcode constants, as scan_opcodes_25() does.  The
    look-ahead uses a slice so that a LOAD_CONST at the very end of the
    code cannot raise IndexError.
    """
    code = co.co_code
    names = co.co_names
    consts = co.co_consts
    while code:
        c = bytes([code[0]])
        if c in STORE_OPS:
            oparg, = unpack('<H', code[1:3])
            yield "store", (names[oparg],)
            code = code[3:]
            continue
        if c == LOAD_CONST and code[3:4] == IMPORT_NAME:
            oparg_1, oparg_2 = unpack('<xHxH', code[:6])
            yield "import", (consts[oparg_1], names[oparg_2])
            code = code[6:]
            continue
        if c >= HAVE_ARGUMENT:
            code = code[3:]
        else:
            code = code[1:]
364
def scan_opcodes_25(self, co,
                    unpack = struct.unpack):
    """Yield the 'interesting' opcode combinations found in *co*.

    Python 2.5 version (has absolute and relative imports).  Yields
    ("store", (name,)) for every STORE_NAME / STORE_GLOBAL, and for every
    LOAD_CONST, LOAD_CONST, IMPORT_NAME sequence either
    ("absolute_import", (fromlist, name)) when the level constant is 0 or
    ("relative_import", (level, fromlist, name)) otherwise.  Instructions
    with an argument are taken to be three bytes long (opcode plus a 16-bit
    little-endian operand).
    """
    bytecode = co.co_code
    names = co.co_names
    consts = co.co_consts
    import_pattern = LOAD_CONST + LOAD_CONST + IMPORT_NAME
    while bytecode:
        opcode = bytecode[:1]
        if opcode in STORE_OPS:
            (name_index,) = unpack('<H', bytecode[1:3])
            yield "store", (names[name_index],)
            step = 3
        elif bytecode[:9:3] == import_pattern:
            # Every third byte is an opcode; the pad bytes in the format
            # skip them so that only the three operands are unpacked.
            level_index, fromlist_index, name_index = unpack('<xHxHxH', bytecode[:9])
            level = consts[level_index]
            if level == 0: # absolute import
                yield "absolute_import", (consts[fromlist_index], names[name_index])
            else: # relative import
                yield "relative_import", (level, consts[fromlist_index], names[name_index])
            step = 9
        elif opcode >= HAVE_ARGUMENT:
            step = 3
        else:
            step = 1
        bytecode = bytecode[step:]
393
def scan_code(self, co, m):
    """Record the stores and imports performed by code object *co* in *m*.

    Stored names are added to m.globalnames and every import is followed
    through _safe_import_hook().  For "from x import *" the global names of
    a scanned Python module are copied into *m*; otherwise the star-import
    is noted in m.starimports.  Code objects nested in co.co_consts are
    scanned recursively.  Raises RuntimeError for an unknown scanner event.
    """
    if sys.version_info >= (2, 5):
        scanner = self.scan_opcodes_25
    else:
        scanner = self.scan_opcodes
    for what, args in scanner(co):
        if what == "store":
            (name,) = args
            m.globalnames[name] = 1
        elif what == "absolute_import":
            fromlist, name = args
            have_star = fromlist is not None and "*" in fromlist
            if fromlist is not None:
                fromlist = [f for f in fromlist if f != "*"]
            self._safe_import_hook(name, m, fromlist, level=0)
            if not have_star:
                continue
            # We've encountered an "import *". If it is a Python module,
            # the code has already been parsed and we can suck out the
            # global names.
            target = None
            if m.__path__:
                # At this point we don't know whether 'name' is a
                # submodule of 'm' or a global module. Let's just try
                # the full name first.
                target = self.modules.get(m.__name__ + "." + name)
            if target is None:
                target = self.modules.get(name)
            if target is not None:
                m.globalnames.update(target.globalnames)
                m.starimports.update(target.starimports)
            if target is None or target.__code__ is None:
                # Unknown or non-Python module: its names can't be listed.
                m.starimports[name] = 1
        elif what == "relative_import":
            level, fromlist, name = args
            if name:
                self._safe_import_hook(name, m, fromlist, level=level)
            else:
                # "from . import x": import from the parent package itself.
                parent = self.determine_parent(m, level=level)
                self._safe_import_hook(parent.__name__, None, fromlist, level=0)
        else:
            # We don't expect anything else from the generator.
            raise RuntimeError(what)

    code_type = type(co)
    for const in co.co_consts:
        if isinstance(const, code_type):
            self.scan_code(const, m)
445
def load_package(self, fqname, pathname):
    """Create the record for package *fqname* located at *pathname*.

    The name is first translated through replacePackageMap.  The package's
    __path__ is *pathname* followed by any extra directories registered in
    packagePathMap.  The package's "__init__" module is then located and
    loaded under the package name; its file object, if any, is closed even
    when loading fails.
    """
    self.msgin(2, "load_package", fqname, pathname)
    newname = replacePackageMap.get(fqname)
    if newname:
        fqname = newname
    m = self.add_module(fqname)
    m.__file__ = pathname
    m.__path__ = [pathname]

    # As per comment at top of file, simulate runtime __path__ additions.
    m.__path__ = m.__path__ + packagePathMap.get(fqname, [])

    fp, buf, stuff = self.find_module("__init__", m.__path__)
    try:
        self.load_module(fqname, fp, buf, stuff)
    finally:
        # find_module() may return no file object (fp can be None).
        if fp:
            fp.close()
    self.msgout(2, "load_package ->", m)
    return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000462
def add_module(self, fqname):
    """Return the record for *fqname*, creating and registering it if new."""
    try:
        return self.modules[fqname]
    except KeyError:
        record = Module(fqname)
        self.modules[fqname] = record
        return record
Guido van Rossum75dc4961998-03-05 03:42:00 +0000468
def find_module(self, name, path, parent=None):
    """Locate module *name* and return (file, pathname, description).

    Raises ImportError when the fully qualified name (prefixed with the
    parent's name, if a parent is given) is listed in self.excludes.  When
    *path* is None, built-in modules are reported without a file and all
    other modules are searched for on self.path.  The actual search is
    done by imp.find_module().
    """
    # assert path is not None whenever a parent is given
    fullname = name if parent is None else parent.__name__+'.'+name
    if fullname in self.excludes:
        self.msgout(3, "find_module -> Excluded", fullname)
        raise ImportError(name)

    if path is None:
        if name in sys.builtin_module_names:
            return (None, None, ("", "", imp.C_BUILTIN))
        path = self.path
    return imp.find_module(name, path)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000485
def report(self):
    """Print a report to stdout, listing the found modules with their
    paths, as well as modules that are missing, or seem to be missing.
    """
    print()
    print(" %-25s %s" % ("Name", "File"))
    print(" %-25s %s" % ("----", "----"))
    # Print modules found
    for key in sorted(self.modules.keys()):
        m = self.modules[key]
        # "P" marks a package (non-empty __path__), "m" any other module.
        if m.__path__:
            print("P", end=' ')
        else:
            print("m", end=' ')
        print("%-25s" % key, m.__file__ or "")

    # Print missing modules
    missing, maybe = self.any_missing_maybe()
    if missing:
        print()
        print("Missing modules:")
        for name in missing:
            mods = sorted(self.badmodules[name].keys())
            print("?", name, "imported from", ', '.join(mods))
    # Print modules that may be missing, but then again, maybe not...
    if maybe:
        print()
        print("Submodules that appear to be missing, but could also be", end=' ')
        print("global names in the parent package:")
        for name in maybe:
            mods = sorted(self.badmodules[name].keys())
            print("?", name, "imported from", ', '.join(mods))
Guido van Rossum75dc4961998-03-05 03:42:00 +0000519
def any_missing(self):
    """Return a list of modules that appear to be missing. Use
    any_missing_maybe() if you want to know which modules are
    certain to be missing, and which *may* be missing.
    """
    certain, possible = self.any_missing_maybe()
    return certain + possible
527
def any_missing_maybe(self):
    """Return two lists, one with modules that are certainly missing
    and one with modules that *may* be missing. The latter names could
    either be submodules *or* just global names in the package.

    The reason it can't always be determined is that it's impossible to
    tell which names are imported when "from module import *" is done
    with an extension module, short of actually importing it.

    Names listed in self.excludes are left out; both lists are sorted.
    """
    missing = []
    maybe = []
    for name in self.badmodules:
        if name in self.excludes:
            continue
        pkgname, dot, subname = name.rpartition(".")
        if not dot:
            # A top-level module that could not be found.
            missing.append(name)
            continue
        pkg = self.modules.get(pkgname)
        if pkg is None or pkgname in self.badmodules[name]:
            # Either the package itself is unknown, or the package tried
            # to import this module itself and failed: definitely missing.
            missing.append(name)
        elif subname in pkg.globalnames:
            # It's a global in the package: definitely not missing.
            continue
        elif pkg.starimports:
            # It could be missing, but the package did an "import *"
            # from a non-Python module, so we simply can't be sure.
            maybe.append(name)
        else:
            # It's not a global in the package, the package didn't
            # do funny star imports, it's very likely to be missing.
            # The symbol could be inserted into the package from the
            # outside, but since that's not good style we simply list
            # it missing.
            missing.append(name)
    return sorted(missing), sorted(maybe)
Guido van Rossum03f7f082001-10-18 19:15:32 +0000573
def replace_paths_in_code(self, co):
    """Return a copy of code object *co* with its co_filename rewritten.

    The normalized file name is matched against the (old_prefix,
    new_prefix) pairs in self.replace_paths; the first matching prefix is
    replaced.  Code objects nested in co.co_consts are rewritten
    recursively.  When debugging is enabled, each original file name is
    reported once and remembered in self.processed_paths.

    The copy is made with the code object's own replace() method when it
    has one.  Otherwise the constructor is called with the keyword-only
    argument count included, which the positional signature requires
    directly after the argument count.
    """
    new_filename = original_filename = os.path.normpath(co.co_filename)
    for f, r in self.replace_paths:
        if original_filename.startswith(f):
            new_filename = r + original_filename[len(f):]
            break

    if self.debug and original_filename not in self.processed_paths:
        if new_filename != original_filename:
            self.msgout(2, "co_filename %r changed to %r" \
                           % (original_filename,new_filename,))
        else:
            self.msgout(2, "co_filename %r remains unchanged" \
                           % (original_filename,))
        self.processed_paths.append(original_filename)

    code_type = type(co)
    consts = tuple([
        self.replace_paths_in_code(const) if isinstance(const, code_type) else const
        for const in co.co_consts
    ])

    if hasattr(co, "replace"):
        return co.replace(co_consts=consts, co_filename=new_filename)
    return types.CodeType(co.co_argcount, co.co_kwonlyargcount,
                          co.co_nlocals, co.co_stacksize,
                          co.co_flags, co.co_code, consts, co.co_names,
                          co.co_varnames, new_filename, co.co_name,
                          co.co_firstlineno, co.co_lnotab,
                          co.co_freevars, co.co_cellvars)
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000600
Guido van Rossum75dc4961998-03-05 03:42:00 +0000601
def test():
    """Command-line driver: analyse a script and print the report.

    Options: -d raises the debug level, -q silences it, -m makes the
    remaining arguments module names instead of file names, -p adds
    directories (separated by os.pathsep) to the front of the search path
    and -x excludes a module.  The first positional argument is the script
    (default "hello.py").  Returns the ModuleFinder, or None when the
    command line could not be parsed.
    """
    # Parse command line
    import getopt
    try:
        opts, args = getopt.getopt(sys.argv[1:], "dmp:qx:")
    except getopt.error as msg:
        print(msg)
        return

    # Process options
    debug = 1
    domods = 0
    addpath = []
    exclude = []
    for flag, value in opts:
        if flag == '-d':
            debug += 1
        elif flag == '-m':
            domods = 1
        elif flag == '-p':
            addpath.extend(value.split(os.pathsep))
        elif flag == '-q':
            debug = 0
        elif flag == '-x':
            exclude.append(value)

    # Provide default arguments
    script = args[0] if args else "hello.py"

    # Set the path based on sys.path and the script directory
    path = sys.path[:]
    path[0] = os.path.dirname(script)
    path = addpath + path
    if debug > 1:
        print("path:")
        for item in path:
            print(" ", repr(item))

    # Create the module finder and turn its crank
    mf = ModuleFinder(path, debug, exclude)
    for arg in args[1:]:
        if arg == '-m':
            # Everything after a literal -m is a module name.
            domods = 1
        elif not domods:
            mf.load_file(arg)
        elif arg[-2:] == '.*':
            mf.import_hook(arg[:-2], None, ["*"])
        else:
            mf.import_hook(arg)
    mf.run_script(script)
    mf.report()
    return mf  # for -i debugging
Guido van Rossum75dc4961998-03-05 03:42:00 +0000659
660
if __name__ == '__main__':
    # Run the command-line driver.  The finder it returns stays bound to
    # ``mf`` so that it can be inspected afterwards (e.g. with python -i).
    try:
        mf = test()
    except KeyboardInterrupt:
        # Report the interruption with a short note.
        print("\n[interrupt]")
Guido van Rossumbe19ed72007-02-09 05:37:30 +0000665 print("\n[interrupt]")