Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 1 | """runpy.py - locating and running Python code using the module namespace |
| 2 | |
| 3 | Provides support for locating and running Python scripts using the Python |
| 4 | module namespace instead of the native filesystem. |
| 5 | |
| 6 | This allows Python code to play nicely with non-filesystem based PEP 302 |
| 7 | importers when locating support scripts as well as when importing modules. |
| 8 | """ |
| 9 | # Written by Nick Coghlan <ncoghlan at gmail.com> |
| 10 | # to implement PEP 338 (Executing Modules as Scripts) |
| 11 | |
Brett Cannon | aa93642 | 2012-04-27 15:30:58 -0400 | [diff] [blame] | 12 | |
Brett Cannon | e0d88a1 | 2012-04-25 20:54:04 -0400 | [diff] [blame] | 13 | import os |
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 14 | import sys |
Nick Coghlan | be7e49f | 2012-07-20 23:40:09 +1000 | [diff] [blame] | 15 | import importlib.machinery # importlib first so we can test #15386 via -m |
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 16 | import imp |
Nick Coghlan | 85e729e | 2012-07-15 18:09:52 +1000 | [diff] [blame] | 17 | from pkgutil import read_code, get_loader, get_importer |
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 18 | |
# Names exported as the public API of this module.
__all__ = ["run_module", "run_path"]
| 22 | |
Nick Coghlan | 260bd3e | 2009-11-16 06:49:25 +0000 | [diff] [blame] | 23 | class _TempModule(object): |
| 24 | """Temporarily replace a module in sys.modules with an empty namespace""" |
| 25 | def __init__(self, mod_name): |
| 26 | self.mod_name = mod_name |
| 27 | self.module = imp.new_module(mod_name) |
| 28 | self._saved_module = [] |
| 29 | |
| 30 | def __enter__(self): |
| 31 | mod_name = self.mod_name |
| 32 | try: |
| 33 | self._saved_module.append(sys.modules[mod_name]) |
| 34 | except KeyError: |
| 35 | pass |
| 36 | sys.modules[mod_name] = self.module |
| 37 | return self |
| 38 | |
| 39 | def __exit__(self, *args): |
| 40 | if self._saved_module: |
| 41 | sys.modules[self.mod_name] = self._saved_module[0] |
| 42 | else: |
| 43 | del sys.modules[self.mod_name] |
| 44 | self._saved_module = [] |
| 45 | |
| 46 | class _ModifiedArgv0(object): |
| 47 | def __init__(self, value): |
| 48 | self.value = value |
| 49 | self._saved_value = self._sentinel = object() |
| 50 | |
| 51 | def __enter__(self): |
| 52 | if self._saved_value is not self._sentinel: |
| 53 | raise RuntimeError("Already preserving saved value") |
| 54 | self._saved_value = sys.argv[0] |
| 55 | sys.argv[0] = self.value |
| 56 | |
| 57 | def __exit__(self, *args): |
| 58 | self.value = self._sentinel |
| 59 | sys.argv[0] = self._saved_value |
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 60 | |
Thomas Wouters | ed03b41 | 2007-08-28 21:37:11 +0000 | [diff] [blame] | 61 | def _run_code(code, run_globals, init_globals=None, |
| 62 | mod_name=None, mod_fname=None, |
Christian Heimes | cbf3b5c | 2007-12-03 21:02:03 +0000 | [diff] [blame] | 63 | mod_loader=None, pkg_name=None): |
Benjamin Peterson | f6489f9 | 2009-11-25 17:46:26 +0000 | [diff] [blame] | 64 | """Helper to run code in nominated namespace""" |
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 65 | if init_globals is not None: |
| 66 | run_globals.update(init_globals) |
| 67 | run_globals.update(__name__ = mod_name, |
| 68 | __file__ = mod_fname, |
Barry Warsaw | 28a691b | 2010-04-17 00:19:56 +0000 | [diff] [blame] | 69 | __cached__ = None, |
Nick Coghlan | 761bb11 | 2012-07-14 23:59:22 +1000 | [diff] [blame] | 70 | __doc__ = None, |
Christian Heimes | cbf3b5c | 2007-12-03 21:02:03 +0000 | [diff] [blame] | 71 | __loader__ = mod_loader, |
| 72 | __package__ = pkg_name) |
Georg Brandl | 7cae87c | 2006-09-06 06:51:57 +0000 | [diff] [blame] | 73 | exec(code, run_globals) |
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 74 | return run_globals |
| 75 | |
def _run_module_code(code, init_globals=None,
                     mod_name=None, mod_fname=None,
                     mod_loader=None, pkg_name=None):
    """Run *code* in a fresh module namespace with sys temporarily altered.

    While the code runs, a temporary module is registered in sys.modules
    under *mod_name* and sys.argv[0] is set to *mod_fname*.  A copy of the
    resulting namespace is returned.
    """
    with _TempModule(mod_name) as scratch:
        with _ModifiedArgv0(mod_fname):
            namespace = scratch.module.__dict__
            _run_code(code, namespace, init_globals,
                      mod_name, mod_fname, mod_loader, pkg_name)
    # Hand back a copy: the temporary module's own globals may be
    # cleared once the temporary module goes away.
    return namespace.copy()
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 87 | |
| 88 | |
Thomas Wouters | 49fd7fa | 2006-04-21 10:40:58 +0000 | [diff] [blame] | 89 | # This helper is needed due to a missing component in the PEP 302 |
| 90 | # loader protocol (specifically, "get_filename" is non-standard) |
Nick Coghlan | f088e5e | 2008-12-14 11:50:48 +0000 | [diff] [blame] | 91 | # Since we can't introduce new features in maintenance releases, |
| 92 | # support was added to zipimporter under the name '_get_filename' |
Thomas Wouters | 49fd7fa | 2006-04-21 10:40:58 +0000 | [diff] [blame] | 93 | def _get_filename(loader, mod_name): |
Nick Coghlan | f088e5e | 2008-12-14 11:50:48 +0000 | [diff] [blame] | 94 | for attr in ("get_filename", "_get_filename"): |
| 95 | meth = getattr(loader, attr, None) |
| 96 | if meth is not None: |
Brett Cannon | e0d88a1 | 2012-04-25 20:54:04 -0400 | [diff] [blame] | 97 | return os.path.abspath(meth(mod_name)) |
Nick Coghlan | f088e5e | 2008-12-14 11:50:48 +0000 | [diff] [blame] | 98 | return None |
Thomas Wouters | 49fd7fa | 2006-04-21 10:40:58 +0000 | [diff] [blame] | 99 | |
Thomas Wouters | ed03b41 | 2007-08-28 21:37:11 +0000 | [diff] [blame] | 100 | # Helper to get the loader, code and filename for a module |
def _get_module_details(mod_name):
    """Locate *mod_name* and return ``(mod_name, loader, code, filename)``.

    When *mod_name* names a package, its ``__main__`` submodule is looked
    up instead, so the returned name may differ from the one passed in.
    Raises ImportError if no loader or code object can be found, or if the
    package cannot be executed.
    """
    loader = get_loader(mod_name)
    if loader is None:
        raise ImportError("No module named %s" % mod_name)

    if loader.is_package(mod_name):
        names_main = mod_name == "__main__" or mod_name.endswith(".__main__")
        if names_main:
            raise ImportError("Cannot use package as __main__ module")
        pkg_main_name = mod_name + ".__main__"
        try:
            # Packages are executed through their __main__ submodule.
            return _get_module_details(pkg_main_name)
        except ImportError as e:
            template = ("%s; %r is a package and cannot " +
                        "be directly executed")
            raise ImportError(template % (e, mod_name))

    code = loader.get_code(mod_name)
    if code is None:
        raise ImportError("No code object available for %s" % mod_name)
    return mod_name, loader, code, _get_filename(loader, mod_name)
Thomas Wouters | ed03b41 | 2007-08-28 21:37:11 +0000 | [diff] [blame] | 119 | |
Benjamin Peterson | f6489f9 | 2009-11-25 17:46:26 +0000 | [diff] [blame] | 120 | # XXX ncoghlan: Should this be documented and made public? |
# (Current thoughts: don't repeat the mistake that led to its
| 122 | # creation when run_module() no longer met the needs of |
| 123 | # mainmodule.c, but couldn't be changed because it was public) |
def _run_module_as_main(mod_name, alter_argv=True):
    """Runs the designated module in the __main__ namespace

       The code is executed directly in the globals of the existing
       __main__ module, so it has full access to that namespace.  Use
       run_module() instead when a fresh namespace is wanted.

       At the very least, these variables in __main__ will be overwritten:
           __name__
           __file__
           __cached__
           __doc__
           __loader__
           __package__

       If the module cannot be located, the interpreter exits via
       sys.exit() with a message prefixed by sys.executable.
    """
    try:
        if alter_argv or mod_name != "__main__":
            # i.e. -m switch
            details = _get_module_details(mod_name)
        else:
            # i.e. directory or zipfile execution
            details = _get_main_module_details()
    except ImportError as exc:
        # Try to provide a good error message
        # for directories, zip files and the -m switch
        if alter_argv:
            # For -m switch, just display the exception
            info = str(exc)
        else:
            # For directories/zipfiles, let the user
            # know what the code was looking for
            info = "can't find '__main__' module in %r" % sys.argv[0]
        sys.exit("%s: %s" % (sys.executable, info))
    mod_name, loader, code, fname = details
    pkg_name = mod_name.rpartition('.')[0]
    main_globals = sys.modules["__main__"].__dict__
    if alter_argv:
        sys.argv[0] = fname
    return _run_code(code, main_globals, None,
                     "__main__", fname, loader, pkg_name)
Thomas Wouters | ed03b41 | 2007-08-28 21:37:11 +0000 | [diff] [blame] | 161 | |
def run_module(mod_name, init_globals=None,
               run_name=None, alter_sys=False):
    """Execute a module's code without importing it

       mod_name is resolved through the import system (a package is run
       via its __main__ submodule).  init_globals, if given, pre-populates
       the namespace; run_name overrides the value used for __name__; and
       alter_sys requests that sys.argv[0] and sys.modules[run_name] be
       temporarily replaced while the code runs.

       Returns the resulting top level namespace dictionary
    """
    mod_name, loader, code, fname = _get_module_details(mod_name)
    if run_name is None:
        run_name = mod_name
    pkg_name, _, _ = mod_name.rpartition('.')
    if not alter_sys:
        # Leave the sys module alone
        return _run_code(code, {}, init_globals, run_name,
                         fname, loader, pkg_name)
    return _run_module_code(code, init_globals, run_name,
                            fname, loader, pkg_name)
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 179 | |
def _get_main_module_details():
    """Return the module details for the ``__main__`` found on sys.path.

    Gives a nicer error message when attempting to execute a zipfile or
    directory by invoking __main__.py.  The currently registered __main__
    module is taken out of sys.modules for the duration of the lookup, so
    that its preexisting __loader__ entry doesn't cause issues, and is
    always put back afterwards.
    """
    main_name = "__main__"
    # Remove and remember the standard __main__ in one step.
    saved_main = sys.modules.pop(main_name)
    try:
        return _get_module_details(main_name)
    except ImportError as exc:
        if main_name not in str(exc):
            # Unrelated import failure: propagate unchanged.
            raise
        raise ImportError("can't find %r module in %r" %
                          (main_name, sys.path[0])) from exc
    finally:
        sys.modules[main_name] = saved_main
Benjamin Peterson | f6489f9 | 2009-11-25 17:46:26 +0000 | [diff] [blame] | 197 | |
Thomas Wouters | a977329 | 2006-04-21 09:43:23 +0000 | [diff] [blame] | 198 | |
Nick Coghlan | 85e729e | 2012-07-15 18:09:52 +1000 | [diff] [blame] | 199 | def _get_code_from_file(run_name, fname): |
Nick Coghlan | 260bd3e | 2009-11-16 06:49:25 +0000 | [diff] [blame] | 200 | # Check for a compiled file first |
| 201 | with open(fname, "rb") as f: |
| 202 | code = read_code(f) |
| 203 | if code is None: |
| 204 | # That didn't work, so try it as normal source code |
Victor Stinner | 6c47102 | 2011-07-04 01:45:39 +0200 | [diff] [blame] | 205 | with open(fname, "rb") as f: |
Nick Coghlan | 260bd3e | 2009-11-16 06:49:25 +0000 | [diff] [blame] | 206 | code = compile(f.read(), fname, 'exec') |
Nick Coghlan | 85e729e | 2012-07-15 18:09:52 +1000 | [diff] [blame] | 207 | loader = importlib.machinery.SourceFileLoader(run_name, fname) |
| 208 | else: |
| 209 | loader = importlib.machinery.SourcelessFileLoader(run_name, fname) |
| 210 | return code, loader |
Nick Coghlan | 260bd3e | 2009-11-16 06:49:25 +0000 | [diff] [blame] | 211 | |
def run_path(path_name, init_globals=None, run_name=None):
    """Execute code located at the specified filesystem location

       Returns the resulting top level namespace dictionary

       path_name may point directly at a Python script (source or
       compiled), or at a zipfile or directory that contains a top
       level __main__.py script.  init_globals pre-populates the
       namespace and run_name sets __name__ (default "<run_path>").
    """
    if run_name is None:
        run_name = "<run_path>"
    pkg_name = run_name.rpartition(".")[0]
    importer = get_importer(path_name)
    not_importable = (type(None), imp.NullImporter)
    if isinstance(importer, not_importable):
        # Not a valid sys.path entry, so run the code directly.
        # Loading it ourselves lets compiled files work as well.
        code, mod_loader = _get_code_from_file(run_name, path_name)
        return _run_module_code(code, init_globals, run_name, path_name,
                                mod_loader, pkg_name)

    # Importer is defined for path, so add it to
    # the start of sys.path
    sys.path.insert(0, path_name)
    try:
        # Unlike run_module, the existing __main__ has to be moved out of
        # the way even while the code is being located: a __loader__
        # attribute on it may otherwise prevent finding the new module.
        # _get_main_module_details() takes care of that.
        mod_name, loader, code, fname = _get_main_module_details()
        with _TempModule(run_name) as temp_module:
            with _ModifiedArgv0(path_name):
                mod_globals = temp_module.module.__dict__
                result = _run_code(code, mod_globals, init_globals,
                                   run_name, fname, loader, pkg_name)
                return result.copy()
    finally:
        # The executed code may already have removed the entry.
        try:
            sys.path.remove(path_name)
        except ValueError:
            pass
| 254 | |
| 255 | |
if __name__ == "__main__":
    # Run the module specified as the next command line argument
    if len(sys.argv) >= 2:
        # Drop our own entry so the requested module becomes sys.argv[0]
        del sys.argv[0]
        _run_module_as_main(sys.argv[0])
    else:
        print("No module specified for execution", file=sys.stderr)