blob: 2ffd44854b4c4ca2cd4cadf197dc4370051e5950 [file] [log] [blame]
Guido van Rossum75dc4961998-03-05 03:42:00 +00001"""Find modules used by a script, using introspection."""
Just van Rossuma920a882003-07-18 15:31:40 +00002# This module should be kept compatible with Python 2.2, see PEP 291.
Thomas Heller919000e2002-11-25 20:21:59 +00003
Thomas Heller112d1a62006-10-27 19:05:53 +00004from __future__ import generators
Guido van Rossum75dc4961998-03-05 03:42:00 +00005import dis
6import imp
7import marshal
8import os
Guido van Rossum75dc4961998-03-05 03:42:00 +00009import sys
Christian Heimesc756d002007-11-27 21:34:01 +000010import types
Thomas Heller112d1a62006-10-27 19:05:53 +000011import struct
Guido van Rossum75dc4961998-03-05 03:42:00 +000012
# Mode used when opening Python source files.  Start from plain "r"
# (Python < 2.3) and switch to "U" (universal line endings) when the
# interpreter's file objects expose a "newlines" attribute.
READ_MODE = "r"
if hasattr(sys.__stdout__, "newlines"):
    READ_MODE = "U"
18
# Numeric opcodes the bytecode scanners look for, resolved once from dis.
(LOAD_CONST, IMPORT_NAME,
 STORE_NAME, STORE_GLOBAL) = map(
    dis.opmap.__getitem__,
    ('LOAD_CONST', 'IMPORT_NAME', 'STORE_NAME', 'STORE_GLOBAL'))
# Opcodes that bind a name at module/global level.
STORE_OPS = (STORE_NAME, STORE_GLOBAL)
# Opcodes numbered at or above this value carry an argument.
HAVE_ARGUMENT = dis.HAVE_ARGUMENT
# Prefix opcode whose argument supplies the high bits of the next argument.
EXTENDED_ARG = dis.EXTENDED_ARG
26
27def _unpack_opargs(code):
28 # enumerate() is not an option, since we sometimes process
29 # multiple elements on a single pass through the loop
30 extended_arg = 0
31 n = len(code)
32 i = 0
33 while i < n:
34 op = ord(code[i])
35 offset = i
36 i = i+1
37 arg = None
38 if op >= HAVE_ARGUMENT:
39 arg = ord(code[i]) + ord(code[i+1])*256 + extended_arg
40 extended_arg = 0
41 i = i+2
42 if op == EXTENDED_ARG:
43 extended_arg = arg*65536
44 yield (offset, op, arg)
Guido van Rossum75dc4961998-03-05 03:42:00 +000045
# Modulefinder does a good job at simulating Python's import mechanism, but
# it cannot handle __path__ modifications packages make at runtime.
# Therefore there is a mechanism whereby you can register extra paths in
# this map for a package, and they will be honored.
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +000050
# Note that this is a mapping of package names to lists of paths.
packagePathMap = {}

# A Public interface
def AddPackagePath(packagename, path):
    """Register *path* as an extra directory for package *packagename*.

    Paths accumulate in packagePathMap[packagename] in the order added.
    """
    packagePathMap.setdefault(packagename, []).append(path)
Guido van Rossum75dc4961998-03-05 03:42:00 +000059
replacePackageMap = {}

# This ReplacePackage mechanism allows modulefinder to work around the
# way the _xmlplus package injects itself under the name "xml" into
# sys.modules at runtime by calling ReplacePackage("_xmlplus", "xml")
# before running ModuleFinder.

def ReplacePackage(oldname, newname):
    """Record that package *oldname* should be registered as *newname*.

    A later call with the same *oldname* overwrites the earlier entry.
    """
    replacePackageMap.update({oldname: newname})
69
70
class Module:
    """Plain record describing one module: name, file, path and code."""

    def __init__(self, name, file=None, path=None):
        self.__name__ = name
        self.__file__ = file
        self.__path__ = path
        self.__code__ = None
        # The set of global names that are assigned to in the module.
        # This includes those names imported through starimports of
        # Python modules.
        self.globalnames = {}
        # The set of starimports this module did that could not be
        # resolved, ie. a starimport from a non-Python module.
        self.starimports = {}

    def __repr__(self):
        # The name is always shown; file and path only when they are set.
        shown = [repr(self.__name__)]
        for optional in (self.__file__, self.__path__):
            if optional is not None:
                shown.append(repr(optional))
        return "Module(%s)" % ", ".join(shown)
Guido van Rossum75dc4961998-03-05 03:42:00 +000094
Guido van Rossum75dc4961998-03-05 03:42:00 +000095class ModuleFinder:
96
Just van Rossume29310a2002-12-31 16:33:00 +000097 def __init__(self, path=None, debug=0, excludes=[], replace_paths=[]):
Guido van Rossum912a14c1998-03-05 04:56:37 +000098 if path is None:
99 path = sys.path
100 self.path = path
101 self.modules = {}
102 self.badmodules = {}
103 self.debug = debug
104 self.indent = 0
Guido van Rossum78fc3631998-03-20 17:37:24 +0000105 self.excludes = excludes
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000106 self.replace_paths = replace_paths
107 self.processed_paths = [] # Used in debugging only
Guido van Rossum75dc4961998-03-05 03:42:00 +0000108
109 def msg(self, level, str, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000110 if level <= self.debug:
111 for i in range(self.indent):
112 print " ",
113 print str,
114 for arg in args:
115 print repr(arg),
116 print
Guido van Rossum75dc4961998-03-05 03:42:00 +0000117
118 def msgin(self, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000119 level = args[0]
120 if level <= self.debug:
121 self.indent = self.indent + 1
Guido van Rossum68468eb2003-02-27 20:14:51 +0000122 self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000123
124 def msgout(self, *args):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000125 level = args[0]
126 if level <= self.debug:
127 self.indent = self.indent - 1
Guido van Rossum68468eb2003-02-27 20:14:51 +0000128 self.msg(*args)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000129
130 def run_script(self, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000131 self.msg(2, "run_script", pathname)
Benjamin Petersonca1fb3e2015-03-10 19:06:18 -0500132 with open(pathname, READ_MODE) as fp:
133 stuff = ("", "r", imp.PY_SOURCE)
134 self.load_module('__main__', fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000135
136 def load_file(self, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000137 dir, name = os.path.split(pathname)
138 name, ext = os.path.splitext(name)
Benjamin Petersonca1fb3e2015-03-10 19:06:18 -0500139 with open(pathname, READ_MODE) as fp:
140 stuff = (ext, "r", imp.PY_SOURCE)
141 self.load_module(name, fp, pathname, stuff)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000142
Thomas Heller112d1a62006-10-27 19:05:53 +0000143 def import_hook(self, name, caller=None, fromlist=None, level=-1):
144 self.msg(3, "import_hook", name, caller, fromlist, level)
145 parent = self.determine_parent(caller, level=level)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000146 q, tail = self.find_head_package(parent, name)
147 m = self.load_tail(q, tail)
148 if not fromlist:
149 return q
150 if m.__path__:
151 self.ensure_fromlist(m, fromlist)
Thomas Heller318b7b92002-11-26 08:06:50 +0000152 return None
Guido van Rossum75dc4961998-03-05 03:42:00 +0000153
Thomas Heller112d1a62006-10-27 19:05:53 +0000154 def determine_parent(self, caller, level=-1):
155 self.msgin(4, "determine_parent", caller, level)
156 if not caller or level == 0:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000157 self.msgout(4, "determine_parent -> None")
158 return None
159 pname = caller.__name__
Thomas Heller112d1a62006-10-27 19:05:53 +0000160 if level >= 1: # relative import
161 if caller.__path__:
162 level -= 1
163 if level == 0:
164 parent = self.modules[pname]
165 assert parent is caller
166 self.msgout(4, "determine_parent ->", parent)
167 return parent
168 if pname.count(".") < level:
169 raise ImportError, "relative importpath too deep"
170 pname = ".".join(pname.split(".")[:-level])
171 parent = self.modules[pname]
172 self.msgout(4, "determine_parent ->", parent)
173 return parent
Guido van Rossum912a14c1998-03-05 04:56:37 +0000174 if caller.__path__:
175 parent = self.modules[pname]
176 assert caller is parent
177 self.msgout(4, "determine_parent ->", parent)
178 return parent
179 if '.' in pname:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000180 i = pname.rfind('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000181 pname = pname[:i]
182 parent = self.modules[pname]
183 assert parent.__name__ == pname
184 self.msgout(4, "determine_parent ->", parent)
185 return parent
186 self.msgout(4, "determine_parent -> None")
187 return None
Guido van Rossum75dc4961998-03-05 03:42:00 +0000188
189 def find_head_package(self, parent, name):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000190 self.msgin(4, "find_head_package", parent, name)
191 if '.' in name:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000192 i = name.find('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000193 head = name[:i]
194 tail = name[i+1:]
195 else:
196 head = name
197 tail = ""
198 if parent:
199 qname = "%s.%s" % (parent.__name__, head)
200 else:
201 qname = head
202 q = self.import_module(head, qname, parent)
203 if q:
204 self.msgout(4, "find_head_package ->", (q, tail))
205 return q, tail
206 if parent:
207 qname = head
208 parent = None
209 q = self.import_module(head, qname, parent)
210 if q:
211 self.msgout(4, "find_head_package ->", (q, tail))
212 return q, tail
213 self.msgout(4, "raise ImportError: No module named", qname)
214 raise ImportError, "No module named " + qname
Guido van Rossum75dc4961998-03-05 03:42:00 +0000215
216 def load_tail(self, q, tail):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000217 self.msgin(4, "load_tail", q, tail)
218 m = q
219 while tail:
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000220 i = tail.find('.')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000221 if i < 0: i = len(tail)
222 head, tail = tail[:i], tail[i+1:]
223 mname = "%s.%s" % (m.__name__, head)
224 m = self.import_module(head, mname, m)
225 if not m:
226 self.msgout(4, "raise ImportError: No module named", mname)
227 raise ImportError, "No module named " + mname
228 self.msgout(4, "load_tail ->", m)
229 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000230
231 def ensure_fromlist(self, m, fromlist, recursive=0):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000232 self.msg(4, "ensure_fromlist", m, fromlist, recursive)
233 for sub in fromlist:
234 if sub == "*":
235 if not recursive:
236 all = self.find_all_submodules(m)
237 if all:
238 self.ensure_fromlist(m, all, 1)
239 elif not hasattr(m, sub):
240 subname = "%s.%s" % (m.__name__, sub)
241 submod = self.import_module(sub, subname, m)
242 if not submod:
243 raise ImportError, "No module named " + subname
Guido van Rossum75dc4961998-03-05 03:42:00 +0000244
245 def find_all_submodules(self, m):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000246 if not m.__path__:
247 return
248 modules = {}
Thomas Helleraaf1c8d2003-11-14 10:28:42 +0000249 # 'suffixes' used to be a list hardcoded to [".py", ".pyc", ".pyo"].
250 # But we must also collect Python extension modules - although
251 # we cannot separate normal dlls from Python extensions.
252 suffixes = []
253 for triple in imp.get_suffixes():
254 suffixes.append(triple[0])
Guido van Rossum912a14c1998-03-05 04:56:37 +0000255 for dir in m.__path__:
256 try:
257 names = os.listdir(dir)
258 except os.error:
259 self.msg(2, "can't list directory", dir)
260 continue
261 for name in names:
262 mod = None
263 for suff in suffixes:
264 n = len(suff)
265 if name[-n:] == suff:
266 mod = name[:-n]
267 break
268 if mod and mod != "__init__":
269 modules[mod] = mod
270 return modules.keys()
Guido van Rossum75dc4961998-03-05 03:42:00 +0000271
272 def import_module(self, partname, fqname, parent):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000273 self.msgin(3, "import_module", partname, fqname, parent)
274 try:
275 m = self.modules[fqname]
276 except KeyError:
277 pass
278 else:
279 self.msgout(3, "import_module ->", m)
280 return m
Brett Cannon9bd059f2008-08-04 00:27:29 +0000281 if fqname in self.badmodules:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000282 self.msgout(3, "import_module -> None")
283 return None
Thomas Heller2e7c8322004-05-11 15:10:59 +0000284 if parent and parent.__path__ is None:
285 self.msgout(3, "import_module -> None")
286 return None
Guido van Rossum912a14c1998-03-05 04:56:37 +0000287 try:
288 fp, pathname, stuff = self.find_module(partname,
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000289 parent and parent.__path__, parent)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000290 except ImportError:
291 self.msgout(3, "import_module ->", None)
292 return None
293 try:
294 m = self.load_module(fqname, fp, pathname, stuff)
295 finally:
296 if fp: fp.close()
297 if parent:
298 setattr(parent, partname, m)
299 self.msgout(3, "import_module ->", m)
300 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000301
Brett Cannon9bd059f2008-08-04 00:27:29 +0000302 def load_module(self, fqname, fp, pathname, file_info):
303 suffix, mode, type = file_info
Guido van Rossum912a14c1998-03-05 04:56:37 +0000304 self.msgin(2, "load_module", fqname, fp and "fp", pathname)
305 if type == imp.PKG_DIRECTORY:
306 m = self.load_package(fqname, pathname)
307 self.msgout(2, "load_module ->", m)
308 return m
309 if type == imp.PY_SOURCE:
Guido van Rossum78fc3631998-03-20 17:37:24 +0000310 co = compile(fp.read()+'\n', pathname, 'exec')
Guido van Rossum912a14c1998-03-05 04:56:37 +0000311 elif type == imp.PY_COMPILED:
312 if fp.read(4) != imp.get_magic():
313 self.msgout(2, "raise ImportError: Bad magic number", pathname)
Guido van Rossumce33eb32000-05-02 13:49:13 +0000314 raise ImportError, "Bad magic number in %s" % pathname
Guido van Rossum912a14c1998-03-05 04:56:37 +0000315 fp.read(4)
316 co = marshal.load(fp)
317 else:
318 co = None
319 m = self.add_module(fqname)
Guido van Rossumab045f91998-03-06 19:55:10 +0000320 m.__file__ = pathname
Guido van Rossum912a14c1998-03-05 04:56:37 +0000321 if co:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000322 if self.replace_paths:
323 co = self.replace_paths_in_code(co)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000324 m.__code__ = co
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000325 self.scan_code(co, m)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000326 self.msgout(2, "load_module ->", m)
327 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000328
Just van Rossume29310a2002-12-31 16:33:00 +0000329 def _add_badmodule(self, name, caller):
330 if name not in self.badmodules:
331 self.badmodules[name] = {}
Thomas Heller1fac5a42008-10-30 20:18:13 +0000332 if caller:
333 self.badmodules[name][caller.__name__] = 1
334 else:
335 self.badmodules[name]["-"] = 1
Just van Rossume29310a2002-12-31 16:33:00 +0000336
Thomas Heller112d1a62006-10-27 19:05:53 +0000337 def _safe_import_hook(self, name, caller, fromlist, level=-1):
Just van Rossume29310a2002-12-31 16:33:00 +0000338 # wrapper for self.import_hook() that won't raise ImportError
339 if name in self.badmodules:
340 self._add_badmodule(name, caller)
341 return
342 try:
Thomas Heller112d1a62006-10-27 19:05:53 +0000343 self.import_hook(name, caller, level=level)
Just van Rossume29310a2002-12-31 16:33:00 +0000344 except ImportError, msg:
345 self.msg(2, "ImportError:", str(msg))
346 self._add_badmodule(name, caller)
347 else:
348 if fromlist:
349 for sub in fromlist:
350 if sub in self.badmodules:
351 self._add_badmodule(sub, caller)
352 continue
353 try:
Thomas Heller112d1a62006-10-27 19:05:53 +0000354 self.import_hook(name, caller, [sub], level=level)
Just van Rossume29310a2002-12-31 16:33:00 +0000355 except ImportError, msg:
356 self.msg(2, "ImportError:", str(msg))
357 fullname = name + "." + sub
358 self._add_badmodule(fullname, caller)
359
Thomas Heller112d1a62006-10-27 19:05:53 +0000360 def scan_opcodes(self, co,
361 unpack = struct.unpack):
362 # Scan the code, and yield 'interesting' opcode combinations
363 # Version for Python 2.4 and older
364 code = co.co_code
365 names = co.co_names
366 consts = co.co_consts
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300367 opargs = [(op, arg) for _, op, arg in _unpack_opargs(code)
368 if op != EXTENDED_ARG]
369 for i, (op, oparg) in enumerate(opargs):
Thomas Heller112d1a62006-10-27 19:05:53 +0000370 if c in STORE_OPS:
Thomas Heller112d1a62006-10-27 19:05:53 +0000371 yield "store", (names[oparg],)
Thomas Heller112d1a62006-10-27 19:05:53 +0000372 continue
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300373 if (op == IMPORT_NAME and i >= 1
374 and opargs[i-1][0] == LOAD_CONST):
375 fromlist = consts[opargs[i-1][1]]
376 yield "import", (fromlist, names[oparg])
Thomas Heller112d1a62006-10-27 19:05:53 +0000377 continue
Thomas Heller112d1a62006-10-27 19:05:53 +0000378
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300379 def scan_opcodes_25(self, co):
Thomas Heller112d1a62006-10-27 19:05:53 +0000380 # Scan the code, and yield 'interesting' opcode combinations
Thomas Heller112d1a62006-10-27 19:05:53 +0000381 code = co.co_code
382 names = co.co_names
383 consts = co.co_consts
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300384 opargs = [(op, arg) for _, op, arg in _unpack_opargs(code)
385 if op != EXTENDED_ARG]
386 for i, (op, oparg) in enumerate(opargs):
387 if op in STORE_OPS:
Thomas Heller112d1a62006-10-27 19:05:53 +0000388 yield "store", (names[oparg],)
Thomas Heller112d1a62006-10-27 19:05:53 +0000389 continue
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300390 if (op == IMPORT_NAME and i >= 2
391 and opargs[i-1][0] == opargs[i-2][0] == LOAD_CONST):
392 level = consts[opargs[i-2][1]]
393 fromlist = consts[opargs[i-1][1]]
Thomas Heller112d1a62006-10-27 19:05:53 +0000394 if level == -1: # normal import
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300395 yield "import", (fromlist, names[oparg])
Thomas Heller112d1a62006-10-27 19:05:53 +0000396 elif level == 0: # absolute import
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300397 yield "absolute_import", (fromlist, names[oparg])
Thomas Heller112d1a62006-10-27 19:05:53 +0000398 else: # relative import
Serhiy Storchaka3111c942016-05-09 00:02:06 +0300399 yield "relative_import", (level, fromlist, names[oparg])
Thomas Heller112d1a62006-10-27 19:05:53 +0000400 continue
Thomas Heller112d1a62006-10-27 19:05:53 +0000401
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000402 def scan_code(self, co, m):
403 code = co.co_code
Thomas Heller112d1a62006-10-27 19:05:53 +0000404 if sys.version_info >= (2, 5):
405 scanner = self.scan_opcodes_25
406 else:
407 scanner = self.scan_opcodes
408 for what, args in scanner(co):
409 if what == "store":
410 name, = args
411 m.globalnames[name] = 1
412 elif what in ("import", "absolute_import"):
413 fromlist, name = args
Just van Rossume29310a2002-12-31 16:33:00 +0000414 have_star = 0
415 if fromlist is not None:
416 if "*" in fromlist:
417 have_star = 1
418 fromlist = [f for f in fromlist if f != "*"]
Thomas Heller112d1a62006-10-27 19:05:53 +0000419 if what == "absolute_import": level = 0
420 else: level = -1
421 self._safe_import_hook(name, m, fromlist, level=level)
Just van Rossume29310a2002-12-31 16:33:00 +0000422 if have_star:
423 # We've encountered an "import *". If it is a Python module,
424 # the code has already been parsed and we can suck out the
425 # global names.
426 mm = None
427 if m.__path__:
428 # At this point we don't know whether 'name' is a
429 # submodule of 'm' or a global module. Let's just try
430 # the full name first.
431 mm = self.modules.get(m.__name__ + "." + name)
432 if mm is None:
433 mm = self.modules.get(name)
434 if mm is not None:
435 m.globalnames.update(mm.globalnames)
436 m.starimports.update(mm.starimports)
437 if mm.__code__ is None:
438 m.starimports[name] = 1
439 else:
440 m.starimports[name] = 1
Thomas Heller112d1a62006-10-27 19:05:53 +0000441 elif what == "relative_import":
442 level, fromlist, name = args
443 if name:
444 self._safe_import_hook(name, m, fromlist, level=level)
445 else:
446 parent = self.determine_parent(m, level=level)
447 self._safe_import_hook(parent.__name__, None, fromlist, level=0)
448 else:
449 # We don't expect anything else from the generator.
450 raise RuntimeError(what)
451
Guido van Rossum3c51cf21998-03-05 05:15:07 +0000452 for c in co.co_consts:
453 if isinstance(c, type(co)):
454 self.scan_code(c, m)
455
Guido van Rossum75dc4961998-03-05 03:42:00 +0000456 def load_package(self, fqname, pathname):
Guido van Rossum912a14c1998-03-05 04:56:37 +0000457 self.msgin(2, "load_package", fqname, pathname)
Thomas Hellerc7aaf952002-11-14 18:45:11 +0000458 newname = replacePackageMap.get(fqname)
459 if newname:
460 fqname = newname
Guido van Rossum912a14c1998-03-05 04:56:37 +0000461 m = self.add_module(fqname)
462 m.__file__ = pathname
463 m.__path__ = [pathname]
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +0000464
Guido van Rossume7e632a1998-09-14 16:02:28 +0000465 # As per comment at top of file, simulate runtime __path__ additions.
466 m.__path__ = m.__path__ + packagePathMap.get(fqname, [])
Guido van Rossumf1b5a0e1998-05-18 20:21:56 +0000467
Guido van Rossum912a14c1998-03-05 04:56:37 +0000468 fp, buf, stuff = self.find_module("__init__", m.__path__)
469 self.load_module(fqname, fp, buf, stuff)
470 self.msgout(2, "load_package ->", m)
Benjamin Petersonca1fb3e2015-03-10 19:06:18 -0500471 if fp:
472 fp.close()
Guido van Rossum912a14c1998-03-05 04:56:37 +0000473 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000474
475 def add_module(self, fqname):
Brett Cannon9bd059f2008-08-04 00:27:29 +0000476 if fqname in self.modules:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000477 return self.modules[fqname]
478 self.modules[fqname] = m = Module(fqname)
479 return m
Guido van Rossum75dc4961998-03-05 03:42:00 +0000480
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000481 def find_module(self, name, path, parent=None):
482 if parent is not None:
Thomas Heller2e7c8322004-05-11 15:10:59 +0000483 # assert path is not None
Just van Rossumf0dfbaf2003-03-05 17:23:48 +0000484 fullname = parent.__name__+'.'+name
Guido van Rossum03f7f082001-10-18 19:15:32 +0000485 else:
486 fullname = name
487 if fullname in self.excludes:
488 self.msgout(3, "find_module -> Excluded", fullname)
Guido van Rossum78fc3631998-03-20 17:37:24 +0000489 raise ImportError, name
490
Guido van Rossum912a14c1998-03-05 04:56:37 +0000491 if path is None:
492 if name in sys.builtin_module_names:
493 return (None, None, ("", "", imp.C_BUILTIN))
Guido van Rossum78fc3631998-03-20 17:37:24 +0000494
Guido van Rossum912a14c1998-03-05 04:56:37 +0000495 path = self.path
496 return imp.find_module(name, path)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000497
498 def report(self):
Just van Rossume29310a2002-12-31 16:33:00 +0000499 """Print a report to stdout, listing the found modules with their
500 paths, as well as modules that are missing, or seem to be missing.
501 """
Guido van Rossum912a14c1998-03-05 04:56:37 +0000502 print
503 print " %-25s %s" % ("Name", "File")
504 print " %-25s %s" % ("----", "----")
505 # Print modules found
506 keys = self.modules.keys()
507 keys.sort()
508 for key in keys:
509 m = self.modules[key]
510 if m.__path__:
511 print "P",
512 else:
513 print "m",
514 print "%-25s" % key, m.__file__ or ""
Guido van Rossum75dc4961998-03-05 03:42:00 +0000515
Guido van Rossum912a14c1998-03-05 04:56:37 +0000516 # Print missing modules
Just van Rossume29310a2002-12-31 16:33:00 +0000517 missing, maybe = self.any_missing_maybe()
518 if missing:
519 print
520 print "Missing modules:"
521 for name in missing:
522 mods = self.badmodules[name].keys()
Guido van Rossum38b92eb1998-12-15 15:35:23 +0000523 mods.sort()
Just van Rossume29310a2002-12-31 16:33:00 +0000524 print "?", name, "imported from", ', '.join(mods)
525 # Print modules that may be missing, but then again, maybe not...
526 if maybe:
527 print
Ezio Melottif5469cf2013-08-17 15:43:51 +0300528 print "Submodules that appear to be missing, but could also be",
Just van Rossume29310a2002-12-31 16:33:00 +0000529 print "global names in the parent package:"
530 for name in maybe:
531 mods = self.badmodules[name].keys()
532 mods.sort()
533 print "?", name, "imported from", ', '.join(mods)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000534
Guido van Rossum03f7f082001-10-18 19:15:32 +0000535 def any_missing(self):
Just van Rossume29310a2002-12-31 16:33:00 +0000536 """Return a list of modules that appear to be missing. Use
537 any_missing_maybe() if you want to know which modules are
538 certain to be missing, and which *may* be missing.
539 """
540 missing, maybe = self.any_missing_maybe()
541 return missing + maybe
542
543 def any_missing_maybe(self):
544 """Return two lists, one with modules that are certainly missing
545 and one with modules that *may* be missing. The latter names could
546 either be submodules *or* just global names in the package.
547
548 The reason it can't always be determined is that it's impossible to
549 tell which names are imported when "from module import *" is done
550 with an extension module, short of actually importing it.
551 """
Guido van Rossum03f7f082001-10-18 19:15:32 +0000552 missing = []
Just van Rossume29310a2002-12-31 16:33:00 +0000553 maybe = []
554 for name in self.badmodules:
555 if name in self.excludes:
556 continue
557 i = name.rfind(".")
558 if i < 0:
559 missing.append(name)
560 continue
561 subname = name[i+1:]
562 pkgname = name[:i]
563 pkg = self.modules.get(pkgname)
564 if pkg is not None:
565 if pkgname in self.badmodules[name]:
566 # The package tried to import this module itself and
567 # failed. It's definitely missing.
568 missing.append(name)
569 elif subname in pkg.globalnames:
570 # It's a global in the package: definitely not missing.
571 pass
572 elif pkg.starimports:
573 # It could be missing, but the package did an "import *"
574 # from a non-Python module, so we simply can't be sure.
575 maybe.append(name)
576 else:
577 # It's not a global in the package, the package didn't
578 # do funny star imports, it's very likely to be missing.
579 # The symbol could be inserted into the package from the
580 # outside, but since that's not good style we simply list
581 # it missing.
582 missing.append(name)
583 else:
584 missing.append(name)
585 missing.sort()
586 maybe.sort()
587 return missing, maybe
Guido van Rossum03f7f082001-10-18 19:15:32 +0000588
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000589 def replace_paths_in_code(self, co):
590 new_filename = original_filename = os.path.normpath(co.co_filename)
Just van Rossume29310a2002-12-31 16:33:00 +0000591 for f, r in self.replace_paths:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000592 if original_filename.startswith(f):
Just van Rossume29310a2002-12-31 16:33:00 +0000593 new_filename = r + original_filename[len(f):]
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000594 break
595
596 if self.debug and original_filename not in self.processed_paths:
Just van Rossume29310a2002-12-31 16:33:00 +0000597 if new_filename != original_filename:
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000598 self.msgout(2, "co_filename %r changed to %r" \
599 % (original_filename,new_filename,))
600 else:
601 self.msgout(2, "co_filename %r remains unchanged" \
602 % (original_filename,))
603 self.processed_paths.append(original_filename)
604
605 consts = list(co.co_consts)
606 for i in range(len(consts)):
607 if isinstance(consts[i], type(co)):
608 consts[i] = self.replace_paths_in_code(consts[i])
609
Christian Heimesc756d002007-11-27 21:34:01 +0000610 return types.CodeType(co.co_argcount, co.co_nlocals, co.co_stacksize,
Tim Peters2c60f7a2003-01-29 03:49:43 +0000611 co.co_flags, co.co_code, tuple(consts), co.co_names,
612 co.co_varnames, new_filename, co.co_name,
Neal Norwitz82c72312002-11-12 23:09:12 +0000613 co.co_firstlineno, co.co_lnotab,
614 co.co_freevars, co.co_cellvars)
Guido van Rossum6b767ac2001-03-20 20:43:34 +0000615
Guido van Rossum75dc4961998-03-05 03:42:00 +0000616
617def test():
618 # Parse command line
619 import getopt
620 try:
Guido van Rossumbaf06031998-08-25 14:06:55 +0000621 opts, args = getopt.getopt(sys.argv[1:], "dmp:qx:")
Guido van Rossum75dc4961998-03-05 03:42:00 +0000622 except getopt.error, msg:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000623 print msg
624 return
Guido van Rossum75dc4961998-03-05 03:42:00 +0000625
626 # Process options
627 debug = 1
628 domods = 0
629 addpath = []
Guido van Rossumbaf06031998-08-25 14:06:55 +0000630 exclude = []
Guido van Rossum75dc4961998-03-05 03:42:00 +0000631 for o, a in opts:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000632 if o == '-d':
633 debug = debug + 1
634 if o == '-m':
635 domods = 1
636 if o == '-p':
Walter Dörwaldaaab30e2002-09-11 20:36:02 +0000637 addpath = addpath + a.split(os.pathsep)
Guido van Rossum912a14c1998-03-05 04:56:37 +0000638 if o == '-q':
639 debug = 0
Guido van Rossumbaf06031998-08-25 14:06:55 +0000640 if o == '-x':
641 exclude.append(a)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000642
643 # Provide default arguments
644 if not args:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000645 script = "hello.py"
Guido van Rossum75dc4961998-03-05 03:42:00 +0000646 else:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000647 script = args[0]
Guido van Rossum75dc4961998-03-05 03:42:00 +0000648
649 # Set the path based on sys.path and the script directory
650 path = sys.path[:]
651 path[0] = os.path.dirname(script)
652 path = addpath + path
653 if debug > 1:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000654 print "path:"
655 for item in path:
Walter Dörwald70a6b492004-02-12 17:35:32 +0000656 print " ", repr(item)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000657
658 # Create the module finder and turn its crank
Guido van Rossumbaf06031998-08-25 14:06:55 +0000659 mf = ModuleFinder(path, debug, exclude)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000660 for arg in args[1:]:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000661 if arg == '-m':
662 domods = 1
663 continue
664 if domods:
665 if arg[-2:] == '.*':
666 mf.import_hook(arg[:-2], None, ["*"])
667 else:
668 mf.import_hook(arg)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000669 else:
Guido van Rossum912a14c1998-03-05 04:56:37 +0000670 mf.load_file(arg)
Guido van Rossum75dc4961998-03-05 03:42:00 +0000671 mf.run_script(script)
672 mf.report()
Just van Rossume29310a2002-12-31 16:33:00 +0000673 return mf # for -i debugging
Guido van Rossum75dc4961998-03-05 03:42:00 +0000674
675
if __name__ == '__main__':
    # Run the command-line driver.  The finder stays bound to the global
    # `mf` so it can be inspected afterwards (e.g. under "python -i").
    try:
        mf = test()
    except KeyboardInterrupt:
        print "\n[interrupt]"
Guido van Rossum912a14c1998-03-05 04:56:37 +0000680 print "\n[interrupt]"