Guido van Rossum | a4deda0 | 2002-12-23 16:30:00 +0000 | [diff] [blame] | 1 | """Utilities to support packages.""" |
| 2 | |
Phillip J. Eby | ab1d245 | 2006-04-17 20:17:25 +0000 | [diff] [blame] | 3 | # NOTE: This module must remain compatible with Python 2.3, as it is shared |
| 4 | # by setuptools for distribution with Python 2.3 and up. |
| 5 | |
Guido van Rossum | a4deda0 | 2002-12-23 16:30:00 +0000 | [diff] [blame] | 6 | import os |
| 7 | import sys |
Phillip J. Eby | ab1d245 | 2006-04-17 20:17:25 +0000 | [diff] [blame] | 8 | import imp |
| 9 | import os.path |
| 10 | from types import ModuleType |
| 11 | |
| 12 | __all__ = [ |
| 13 | 'get_importer', 'iter_importers', 'get_loader', 'find_loader', |
Éric Araujo | ea088c5 | 2011-05-25 18:11:24 +0200 | [diff] [blame] | 14 | 'walk_packages', 'iter_modules', 'get_data', |
Phillip J. Eby | ab1d245 | 2006-04-17 20:17:25 +0000 | [diff] [blame] | 15 | 'ImpImporter', 'ImpLoader', 'read_code', 'extend_path', |
| 16 | ] |
| 17 | |
def read_code(stream):
    """Load a code object from an open compiled-bytecode stream.

    The first four bytes read from 'stream' are compared with
    imp.get_magic().  On a mismatch None is returned.  Otherwise the next
    four bytes (the timestamp) are discarded and the result of
    marshal.load() on the rest of the stream is returned.
    """
    # This helper is needed in order for the PEP 302 emulation to
    # correctly handle compiled files
    import marshal

    if stream.read(4) == imp.get_magic():
        stream.read(4)  # Skip timestamp
        return marshal.load(stream)
    return None
| 29 | |
| 30 | |
def simplegeneric(func):
    """Make a trivial single-dispatch generic function

    The returned wrapper looks at the class of its first positional
    argument and walks that class's MRO; the first class that has a
    registered implementation handles the call.  If no class in the MRO
    is registered, 'func' itself is called.

    Implementations are added with wrapper.register(typ, func), or with
    wrapper.register(typ) used as a one-argument decorator.
    """
    implementations = {}

    def wrapper(*args, **kw):
        subject = args[0]
        try:
            klass = subject.__class__
        except AttributeError:
            klass = type(subject)
        try:
            lineage = klass.__mro__
        except AttributeError:
            # No __mro__ on this class: derive one from a throwaway
            # subclass that also inherits from object, then drop that
            # subclass from the front of the result.
            try:
                class _Probe(klass, object):
                    pass
                lineage = _Probe.__mro__[1:]
            except TypeError:
                lineage = (object,)  # must be an ExtensionClass or some such  :(
        for candidate in lineage:
            if candidate in implementations:
                return implementations[candidate](*args, **kw)
        # Nothing registered anywhere along the MRO: use the default.
        return func(*args, **kw)

    def register(typ, func=None):
        if func is not None:
            implementations[typ] = func
            return func
        # Decorator form: hand back a callable that completes the
        # registration once it receives the implementation.
        return lambda f: register(typ, f)

    try:
        wrapper.__name__ = func.__name__
    except (TypeError, AttributeError):
        pass    # Python 2.3 doesn't allow functions to be renamed

    # The wrapper adopts func's attribute dictionary (the very same dict
    # object), so 'register' assigned below is stored in that shared dict.
    wrapper.__dict__ = func.__dict__
    wrapper.__doc__ = func.__doc__
    wrapper.register = register
    return wrapper
Phillip J. Eby | ceb3087 | 2006-04-18 00:59:55 +0000 | [diff] [blame] | 69 | |
| 70 | |
def walk_packages(path=None, prefix='', onerror=None):
    """Yields (importer, name, ispkg) for all modules recursively
    on path, or, if path is None, all accessible modules.

    The first item of each tuple is the importer object that
    iter_modules() reported the module under.

    'path' should be either None or a list of paths to look for
    modules in.

    'prefix' is a string to output on the front of every module name
    on output.

    Note that this function must import all *packages* (NOT all
    modules!) on the given path, in order to access the __path__
    attribute to find submodules.

    'onerror' is a function which gets called with one argument (the
    name of the package which was being imported) if any exception
    occurs while trying to import a package.  If no onerror function is
    supplied, ImportErrors are caught and ignored, while all other
    exceptions are propagated, terminating the search.

    Examples:

    # list all modules python can access
    walk_packages()

    # list all submodules of ctypes
    walk_packages(ctypes.__path__, ctypes.__name__+'.')
    """

    # Path entries already descended into by this call.  Each recursive
    # call below starts with its own empty record.
    visited = {}

    for importer, name, ispkg in iter_modules(path, prefix):
        yield importer, name, ispkg

        if not ispkg:
            continue

        try:
            __import__(name)
        except ImportError:
            if onerror is not None:
                onerror(name)
        except Exception:
            if onerror is None:
                raise
            onerror(name)
        else:
            pkg_path = getattr(sys.modules[name], '__path__', None) or []

            # don't traverse path items we've seen before
            unvisited = []
            for entry in pkg_path:
                if entry not in visited:
                    visited[entry] = True
                    unvisited.append(entry)

            for item in walk_packages(unvisited, name + '.', onerror):
                yield item
| 127 | |
| 128 | |
def iter_modules(path=None, prefix=''):
    """Yields (importer, name, ispkg) for all submodules on path,
    or, if path is None, all top-level modules on sys.path.

    'path' should be either None or a list of paths to look for
    modules in.

    'prefix' is a string to output on the front of every module name
    on output.

    A given name is yielded at most once: the first importer that
    reports it wins.
    """

    if path is not None:
        importers = map(get_importer, path)
    else:
        importers = iter_importers()

    emitted = {}
    for importer in importers:
        for name, ispkg in iter_importer_modules(importer, prefix):
            if name in emitted:
                continue
            emitted[name] = 1
            yield importer, name, ispkg
| 151 | |
| 152 | |
# Decorator form left as a comment; simplegeneric is applied by explicit
# assignment below (presumably because decorator syntax is not available
# on Python 2.3, which this module must support).
#@simplegeneric
def iter_importer_modules(importer, prefix=''):
    """Return the (name, ispkg) pairs offered by 'importer'.

    Default implementation: delegate to the importer's own
    iter_modules(prefix) method when it has one, otherwise report
    nothing.  Importer types without such a method can be supported by
    registering a replacement via iter_importer_modules.register().
    """
    if hasattr(importer, 'iter_modules'):
        return importer.iter_modules(prefix)
    return []

iter_importer_modules = simplegeneric(iter_importer_modules)
| 160 | |
| 161 | |
class ImpImporter:
    """PEP 302 Importer that wraps Python's "classic" import algorithm

    ImpImporter(dirname) produces a PEP 302 importer that searches that
    directory.  ImpImporter(None) produces a PEP 302 importer that searches
    the current sys.path, plus any modules that are frozen or built-in.

    Note that ImpImporter does not currently support being used by placement
    on sys.meta_path.
    """

    def __init__(self, path=None):
        self.path = path

    def find_module(self, fullname, path=None):
        """Return an ImpLoader for 'fullname', or None if it is not found.

        Only the last dotted component of 'fullname' is looked up, via
        imp.find_module().  An importer created without a directory
        returns None for any dotted name.
        """
        # Note: we ignore 'path' argument since it is only used via meta_path
        leaf = fullname.split(".")[-1]
        if self.path is None:
            if leaf != fullname:
                return None
            search = None
        else:
            search = [os.path.realpath(self.path)]
        try:
            found = imp.find_module(leaf, search)
        except ImportError:
            return None
        fileobj, pathname, description = found
        return ImpLoader(fullname, fileobj, pathname, description)

    def iter_modules(self, prefix=''):
        """Yield (prefix + name, ispkg) for modules directly in self.path.

        Nothing is yielded when self.path is None or is not a directory.
        A sub-directory counts as a package only if its name contains no
        '.' and it holds an '__init__' module file.
        """
        if self.path is None or not os.path.isdir(self.path):
            return

        reported = {}
        import inspect
        try:
            entries = os.listdir(self.path)
        except OSError:
            # ignore unreadable directories like import does
            entries = []
        entries.sort()  # handle packages before same-named modules

        for entry in entries:
            modname = inspect.getmodulename(entry)
            if modname == '__init__' or modname in reported:
                continue

            candidate = os.path.join(self.path, entry)
            ispkg = False

            if not modname and os.path.isdir(candidate) and '.' not in entry:
                modname = entry
                try:
                    children = os.listdir(candidate)
                except OSError:
                    # ignore unreadable directories like import does
                    children = []
                for child in children:
                    if inspect.getmodulename(child) == '__init__':
                        ispkg = True
                        break
                else:
                    continue    # not a package

            if modname and '.' not in modname:
                reported[modname] = 1
                yield prefix + modname, ispkg
| 230 | |
Phillip J. Eby | ab1d245 | 2006-04-17 20:17:25 +0000 | [diff] [blame] | 231 | |
class ImpLoader:
    """PEP 302 Loader that wraps Python's "classic" import algorithm

    The constructor stores the module's full name together with an open
    file (or None), a filename and a description tuple 'etc'; etc[2] is
    compared against the imp module-type constants (imp.PY_SOURCE,
    imp.PY_COMPILED, imp.C_EXTENSION, imp.PKG_DIRECTORY).  ImpImporter
    builds instances from the result of imp.find_module().

    Code objects and source text are cached on the instance once read.
    """
    code = source = None

    def __init__(self, fullname, file, filename, etc):
        self.file = file
        self.filename = filename
        self.fullname = fullname
        self.etc = etc

    def load_module(self, fullname):
        """Load and return the module through imp.load_module().

        The stored file is reopened first if it had been closed, and is
        closed again whether or not the load succeeds.
        """
        self._reopen()
        try:
            mod = imp.load_module(fullname, self.file, self.filename, self.etc)
        finally:
            if self.file:
                self.file.close()
        # Note: we don't set __loader__ because we want the module to look
        # normal; i.e. this is just a wrapper for standard import machinery
        return mod

    def get_data(self, pathname):
        """Return the contents of the file 'pathname', read in binary mode."""
        # Close the handle explicitly instead of relying on garbage
        # collection.  try/finally is used rather than 'with' because the
        # module must remain compatible with Python 2.3.
        f = open(pathname, "rb")
        try:
            return f.read()
        finally:
            f.close()

    def _reopen(self):
        """Reopen self.file if it exists but has been closed."""
        if self.file and self.file.closed:
            mod_type = self.etc[2]
            if mod_type == imp.PY_SOURCE:
                self.file = open(self.filename, 'rU')
            elif mod_type in (imp.PY_COMPILED, imp.C_EXTENSION):
                self.file = open(self.filename, 'rb')

    def _fix_name(self, fullname):
        """Return the module name this call applies to.

        None stands for the loader's own module name.  Any other name
        that differs from it raises ImportError.
        """
        if fullname is None:
            fullname = self.fullname
        elif fullname != self.fullname:
            raise ImportError("Loader for module %s cannot handle "
                              "module %s" % (self.fullname, fullname))
        return fullname

    def is_package(self, fullname):
        """Return True if the module is a package directory."""
        # Called only for its validation: raises ImportError on a
        # mismatched name.
        self._fix_name(fullname)
        return self.etc[2] == imp.PKG_DIRECTORY

    def get_code(self, fullname=None):
        """Return the module's code object, or None if none is available.

        Source modules are compiled from get_source(); compiled modules
        are read with read_code(); packages delegate to the loader of
        their '__init__' module.  The result is cached in self.code.
        """
        fullname = self._fix_name(fullname)
        if self.code is None:
            mod_type = self.etc[2]
            if mod_type == imp.PY_SOURCE:
                source = self.get_source(fullname)
                self.code = compile(source, self.filename, 'exec')
            elif mod_type == imp.PY_COMPILED:
                self._reopen()
                try:
                    self.code = read_code(self.file)
                finally:
                    self.file.close()
            elif mod_type == imp.PKG_DIRECTORY:
                self.code = self._get_delegate().get_code()
        return self.code

    def get_source(self, fullname=None):
        """Return the module's source text, or None if none is available.

        For a compiled module the source is looked for next to it, under
        the compiled file's name minus its last character.  Packages
        delegate to the loader of their '__init__' module.  The result
        is cached in self.source.
        """
        fullname = self._fix_name(fullname)
        if self.source is None:
            mod_type = self.etc[2]
            if mod_type == imp.PY_SOURCE:
                self._reopen()
                try:
                    self.source = self.file.read()
                finally:
                    self.file.close()
            elif mod_type == imp.PY_COMPILED:
                source_name = self.filename[:-1]
                if os.path.exists(source_name):
                    f = open(source_name, 'rU')
                    # Make sure the handle is released even if read() fails.
                    try:
                        self.source = f.read()
                    finally:
                        f.close()
            elif mod_type == imp.PKG_DIRECTORY:
                self.source = self._get_delegate().get_source()
        return self.source

    def _get_delegate(self):
        """Return the loader for the '__init__' module inside self.filename."""
        return ImpImporter(self.filename).find_module('__init__')

    def get_filename(self, fullname=None):
        """Return the file the module is loaded from, or None.

        Packages report the filename of their '__init__' module.  Source,
        compiled and C-extension modules report self.filename.  Any other
        module type yields None.
        """
        fullname = self._fix_name(fullname)
        mod_type = self.etc[2]
        if mod_type == imp.PKG_DIRECTORY:
            return self._get_delegate().get_filename()
        elif mod_type in (imp.PY_SOURCE, imp.PY_COMPILED, imp.C_EXTENSION):
            return self.filename
        return None
| 325 | |
| 326 | |
try:
    import zipimport
    from zipimport import zipimporter

    def iter_zipimport_modules(importer, prefix=''):
        """Yield (prefix + name, ispkg) for modules inside a zip importer.

        The archive's entries are taken from zipimport's directory cache
        and restricted to those under importer.prefix.  A directory that
        directly contains an '__init__.py*' entry is reported as a
        package; entries directly under the prefix are reported as plain
        modules.  Each name is yielded at most once.
        """
        # list() works whether keys are returned as a list or as a view.
        dirlist = list(zipimport._zip_directory_cache[importer.archive])
        dirlist.sort()
        _prefix = importer.prefix
        plen = len(_prefix)
        yielded = {}
        import inspect
        for fn in dirlist:
            if not fn.startswith(_prefix):
                continue

            parts = fn[plen:].split(os.sep)

            if len(parts) == 2 and parts[1].startswith('__init__.py'):
                if parts[0] not in yielded:
                    yielded[parts[0]] = 1
                    # Packages must carry the caller's prefix just like
                    # plain modules do; it used to be omitted here.
                    yield prefix + parts[0], True

            if len(parts) != 1:
                continue

            modname = inspect.getmodulename(parts[0])
            if modname == '__init__':
                continue

            if modname and '.' not in modname and modname not in yielded:
                yielded[modname] = 1
                yield prefix + modname, False

    iter_importer_modules.register(zipimporter, iter_zipimport_modules)

except ImportError:
    pass
| 364 | |
| 365 | |
def get_importer(path_item):
    """Retrieve a PEP 302 importer for the given path item

    sys.path_importer_cache is consulted first.  On a miss, each hook in
    sys.path_hooks is tried in order until one accepts the item (a hook
    declines by raising ImportError); the outcome, or None when every
    hook declined, is then stored in the cache.

    If there is no importer, a wrapper around the basic import
    machinery (an ImpImporter) is returned.  This wrapper is never
    inserted into the importer cache (None is inserted instead).

    The cache (or part of it) can be cleared manually if a
    rescan of sys.path_hooks is necessary.
    """
    cache = sys.path_importer_cache
    if path_item in cache:
        importer = cache[path_item]
    else:
        importer = None
        for path_hook in sys.path_hooks:
            try:
                importer = path_hook(path_item)
            except ImportError:
                continue
            break
        cache.setdefault(path_item, importer)

    if importer is None:
        # Fall back on the classic import machinery.
        try:
            importer = ImpImporter(path_item)
        except ImportError:
            importer = None
    return importer
| 398 | |
| 399 | |
def iter_importers(fullname=""):
    """Yield PEP 302 importers for the given module name

    If fullname contains a '.', the importers will be for the package
    containing fullname, otherwise they will be importers for sys.meta_path,
    sys.path, and Python's "classic" import machinery, in that order.  If
    the named module is in a package, that package is imported as a side
    effect of invoking this function.

    A name starting with '.' raises ImportError: relative module names
    are not supported.

    Non PEP 302 mechanisms (e.g. the Windows registry) used by the
    standard import machinery to find files in alternative locations
    are partially supported, but are searched AFTER sys.path.  Normally,
    these locations are searched BEFORE sys.path, preventing sys.path
    entries from shadowing them.

    For this to cause a visible difference in behaviour, there must
    be a module or package name that is accessible via both sys.path
    and one of the non PEP 302 file system mechanisms.  In this case,
    the emulation will find the former version, while the builtin
    import mechanism will find the latter.

    Items of the following types can be affected by this discrepancy:
        imp.C_EXTENSION, imp.PY_SOURCE, imp.PY_COMPILED, imp.PKG_DIRECTORY
    """
    if fullname.startswith('.'):
        raise ImportError("Relative module names not supported")

    toplevel = '.' not in fullname
    if toplevel:
        for importer in sys.meta_path:
            yield importer
        search_path = sys.path
    else:
        # Get the containing package's __path__
        pkg = fullname[:fullname.rindex('.')]
        if pkg not in sys.modules:
            __import__(pkg)
        search_path = getattr(sys.modules[pkg], '__path__', None) or []

    for item in search_path:
        yield get_importer(item)

    if toplevel:
        # Classic machinery goes last.
        yield ImpImporter()
| 440 | |
def get_loader(module_or_name):
    """Get a PEP 302 "loader" object for module_or_name

    The argument may be a module object or a module name.  A name found
    in sys.modules is replaced by the module stored there.  For a module
    object, its __loader__ attribute is returned when it is set to
    something other than None; in every other case the lookup is handed
    to find_loader() with the module's name.

    If the module or package is accessible via the normal import
    mechanism, a wrapper around the relevant part of that machinery
    is returned.  Returns None if the module cannot be found or imported.
    If the named module is not already imported, its containing package
    (if any) is imported, in order to establish the package __path__.

    This function uses iter_importers(), and is thus subject to the same
    limitations regarding platform-specific special import locations such
    as the Windows registry.
    """
    target = sys.modules.get(module_or_name, module_or_name)
    if not isinstance(target, ModuleType):
        return find_loader(target)
    loader = getattr(target, '__loader__', None)
    if loader is None:
        return find_loader(target.__name__)
    return loader
| 465 | |
def find_loader(fullname):
    """Find a PEP 302 "loader" object for fullname

    Every importer produced by iter_importers(fullname) is asked, in
    order, to find_module(fullname); the first result that is not None
    is returned.  If fullname contains dots, iter_importers() imports the
    containing package in order to search its __path__.

    Returns None if the module cannot be found.  This function uses
    iter_importers(), and is thus subject to the same limitations regarding
    platform-specific special import locations such as the Windows registry.
    """
    loader = None
    for importer in iter_importers(fullname):
        loader = importer.find_module(fullname)
        if loader is not None:
            break
    return loader
| 480 | |
Guido van Rossum | a4deda0 | 2002-12-23 16:30:00 +0000 | [diff] [blame] | 481 | |
def extend_path(path, name):
    """Extend a package's path.

    Intended use is to place the following code in a package's __init__.py:

        from pkgutil import extend_path
        __path__ = extend_path(__path__, __name__)

    This will add to the package's __path__ all subdirectories of
    directories on sys.path named after the package.  This is useful
    if one wants to distribute different parts of a single logical
    package as multiple directories.

    It also looks for *.pkg files, where * matches the name argument.
    This feature is similar to *.pth files (see site.py), except that
    it doesn't special-case lines starting with 'import'.  A *.pkg file
    is trusted at face value: every line that is neither empty nor a
    '#' comment is appended to the path as-is, regardless of whether it
    exists on the filesystem.  (This is a feature.)  If a *.pkg file
    cannot be opened, a message is written to sys.stderr and the file
    is skipped.

    If the input path is not a list (as is the case for frozen
    packages) it is returned unchanged.  The input path is not
    modified; an extended copy is returned.  Items are only appended
    to the copy at the end.

    It is assumed that sys.path is a sequence.  Items of sys.path that
    are not (unicode or 8-bit) strings referring to existing
    directories are ignored.  Unicode items of sys.path that cause
    errors when used as filenames may cause this function to raise an
    exception (in line with os.path.isdir() behavior).
    """

    if not isinstance(path, list):
        # This could happen e.g. when this is called from inside a
        # frozen package.  Return the path unchanged in that case.
        return path

    pname = os.path.join(*name.split('.'))  # Reconstitute as relative path
    # Just in case os.extsep != '.'
    sname = os.extsep.join(name.split('.'))
    sname_pkg = sname + os.extsep + "pkg"
    init_py = "__init__" + os.extsep + "py"

    path = path[:]  # Start with a copy of the existing path

    for entry in sys.path:
        if not isinstance(entry, basestring) or not os.path.isdir(entry):
            continue
        subdir = os.path.join(entry, pname)
        # XXX This may still add duplicate entries to path on
        # case-insensitive filesystems
        initfile = os.path.join(subdir, init_py)
        if subdir not in path and os.path.isfile(initfile):
            path.append(subdir)
        # XXX Is this the right thing for subpackages like zope.app?
        # It looks for a file named "zope.app.pkg"
        pkgfile = os.path.join(entry, sname_pkg)
        if os.path.isfile(pkgfile):
            try:
                f = open(pkgfile)
            except IOError:
                # sys.exc_info() is used instead of the "except X, name"
                # form so the syntax is accepted by old and new
                # interpreters alike.
                msg = sys.exc_info()[1]
                sys.stderr.write("Can't open %s: %s\n" %
                                 (pkgfile, msg))
            else:
                # Release the file even if reading it fails part-way.
                try:
                    for line in f:
                        line = line.rstrip('\n')
                        if not line or line.startswith('#'):
                            continue
                        path.append(line)  # Don't check for existence!
                finally:
                    f.close()

    return path
Nick Coghlan | 106fc48 | 2008-04-15 10:25:31 +0000 | [diff] [blame] | 555 | |
def get_data(package, resource):
    """Get a resource from a package.

    This is a wrapper round the PEP 302 loader get_data API.  The package
    argument should be the name of a package, in standard module format
    (foo.bar).  The resource argument should be in the form of a relative
    filename, using '/' as the path separator.  Callers are expected not
    to use the parent directory name '..' or a rooted name (starting with
    a '/'); this function does not check for either.

    The function returns a binary string, which is the contents of the
    specified resource.

    For packages located in the filesystem, which have already been imported,
    this is the rough equivalent of

        d = os.path.dirname(sys.modules[package].__file__)
        data = open(os.path.join(d, resource), 'rb').read()

    None is returned if no loader is found for the package, if the loader
    has no get_data() method, or if the package's module is missing or
    has no __file__ attribute.
    """

    loader = get_loader(package)
    if loader is None or not hasattr(loader, 'get_data'):
        return None

    # Use the already-imported module when there is one, otherwise load it.
    mod = sys.modules.get(package)
    if not mod:
        mod = loader.load_module(package)
    if mod is None or not hasattr(mod, '__file__'):
        return None

    # Modify the resource name to be compatible with the loader.get_data
    # signature - an os.path format "filename" starting with the dirname of
    # the package's __file__
    segments = resource.split('/')
    base = os.path.dirname(mod.__file__)
    return loader.get_data(os.path.join(base, *segments))