Greg Ward | 2689e3d | 1999-03-22 14:52:19 +0000 | [diff] [blame] | 1 | """distutils.util |
| 2 | |
Greg Ward | aebf706 | 2000-04-04 02:05:59 +0000 | [diff] [blame] | 3 | Miscellaneous utility functions -- anything that doesn't fit into |
Greg Ward | 4752769 | 2000-09-30 18:49:14 +0000 | [diff] [blame] | 4 | one of the other *util.py modules. |
| 5 | """ |
Greg Ward | 2689e3d | 1999-03-22 14:52:19 +0000 | [diff] [blame] | 6 | |
Éric Araujo | 47a4521 | 2011-10-08 00:34:13 +0200 | [diff] [blame] | 7 | import os |
| 8 | import re |
Brett Cannon | 61c3556 | 2013-06-15 12:59:53 -0400 | [diff] [blame] | 9 | import importlib.util |
Éric Araujo | 47a4521 | 2011-10-08 00:34:13 +0200 | [diff] [blame] | 10 | import string |
Victor Stinner | 9def284 | 2016-01-18 12:15:08 +0100 | [diff] [blame] | 11 | import sys |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 12 | from distutils.errors import DistutilsPlatformError |
| 13 | from distutils.dep_util import newer |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 14 | from distutils.spawn import spawn |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 15 | from distutils import log |
Tarek Ziadé | 04fe7c0 | 2009-10-25 23:08:47 +0000 | [diff] [blame] | 16 | from distutils.errors import DistutilsByteCompileError |
Greg Ward | aa458bc | 2000-04-22 15:14:58 +0000 | [diff] [blame] | 17 | |
def get_platform():
    """Return a short string naming the platform we are running on.

    The result is mainly used to name platform-specific build directories
    and built distributions.  On POSIX systems it is derived from
    'os.uname()' and usually has the form "osname-release-machine",
    although some systems drop or rewrite parts of it, e.g.:
        linux-i586
        solaris-2.6-sun4u

    On Windows the result is 'win-amd64' when 'sys.version' mentions
    AMD64, otherwise 'sys.platform' (e.g. 'win32').

    If the environment variable '_PYTHON_HOST_PLATFORM' is set (cross
    builds) its value is returned unchanged on every non-Windows system.
    Any other non-POSIX platform simply yields 'sys.platform'.
    """
    if os.name == 'nt':
        return 'win-amd64' if 'amd64' in sys.version.lower() else sys.platform

    # Cross builds state their target platform explicitly.
    if "_PYTHON_HOST_PLATFORM" in os.environ:
        return os.environ["_PYTHON_HOST_PLATFORM"]

    if not (os.name == "posix" and hasattr(os, 'uname')):
        # XXX what about the architecture? NT is Intel or Alpha,
        # Mac OS is M68k or PPC, etc.
        return sys.platform

    # From here on: try to tell the various flavours of Unix apart.
    osname, _host, release, version, machine = os.uname()

    # Lowercase the OS name and drop '/' from it; in the machine name turn
    # spaces into underscores (for "Power Macintosh") and '/' into '-'.
    osname = osname.lower().replace('/', '')
    machine = machine.replace(' ', '_').replace('/', '-')

    if osname.startswith("linux"):
        # At least on Linux/Intel, 'machine' is the processor -- i386, etc.
        # XXX what about Alpha, SPARC, etc?
        return "%s-%s" % (osname, machine)

    if osname.startswith("aix"):
        return "%s-%s.%s" % (osname, version, release)

    if osname.startswith("sunos"):
        if release[0] >= "5":           # SunOS 5 == Solaris 2
            osname = "solaris"
            release = "%d.%s" % (int(release[0]) - 3, release[2:])
            # "platform.architecture()[0]" cannot be used here because of
            # a bootstrap problem.  The dict lookup deliberately raises
            # KeyError for an unexpected 'sys.maxsize'.
            bitness = {2147483647: "32bit", 9223372036854775807: "64bit"}
            machine += ".%s" % bitness[sys.maxsize]
        # older SunOS falls through to the generic representation below
    elif osname.startswith("cygwin"):
        osname = "cygwin"
        # Keep only the leading digits-and-dots part of the release.
        leading_version = re.match(r'[\d.]+', release, re.ASCII)
        if leading_version:
            release = leading_version.group()
    elif osname.startswith("darwin"):
        import _osx_support, distutils.sysconfig
        osname, release, machine = _osx_support.get_platform_osx(
            distutils.sysconfig.get_config_vars(),
            osname, release, machine)

    return "%s-%s-%s" % (osname, release, machine)
| 92 | |
| 93 | # get_platform () |
| 94 | |
| 95 | |
def convert_path(pathname):
    """Translate a '/'-separated 'pathname' to the native path convention.

    Setup scripts always spell filenames Unix-style; this splits the name
    on '/' and re-joins the pieces with the local directory separator so
    the result can be used on the real filesystem.  '.' components are
    dropped, and a name consisting only of such components becomes
    'os.curdir'.  Where the native separator already is '/', and for an
    empty 'pathname', the argument is returned unchanged.

    Raises ValueError on non-Unix-ish systems if 'pathname' starts or ends
    with a slash.
    """
    if os.sep == '/' or not pathname:
        return pathname
    if pathname.startswith('/'):
        raise ValueError("path '%s' cannot be absolute" % pathname)
    if pathname.endswith('/'):
        raise ValueError("path '%s' cannot end with '/'" % pathname)

    components = [part for part in pathname.split('/') if part != '.']
    if components:
        return os.path.join(*components)
    return os.curdir
Greg Ward | 5091929 | 2000-03-07 03:27:08 +0000 | [diff] [blame] | 120 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 121 | # convert_path () |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 122 | |
| 123 | |
def change_root(new_root, pathname):
    """Return 'pathname' with 'new_root' prepended.

    If 'pathname' is relative, this is equivalent to
    "os.path.join(new_root, pathname)".  Otherwise 'pathname' is first made
    relative (its leading separator, and on Windows its drive, are
    removed) and then joined onto 'new_root'.

    Raises DistutilsPlatformError if 'os.name' is neither 'posix' nor 'nt'.
    """
    if os.name == 'posix':
        if not os.path.isabs(pathname):
            return os.path.join(new_root, pathname)
        return os.path.join(new_root, pathname[1:])

    if os.name == 'nt':
        _drive, path = os.path.splitdrive(pathname)
        # Slice instead of indexing so that an empty remainder (e.g. "C:"
        # or "") does not raise IndexError.  Both separators are stripped:
        # a leading '/' would otherwise make os.path.join() discard the
        # directory part of 'new_root'.
        if path[:1] in ('\\', '/'):
            path = path[1:]
        return os.path.join(new_root, path)

    raise DistutilsPlatformError("nothing known about platform '%s'" % os.name)
| 144 | |
Greg Ward | 67f75d4 | 2000-04-27 01:53:46 +0000 | [diff] [blame] | 145 | |
# Set to 1 once check_environ() has run, so the work is done only once.
_environ_checked = 0


def check_environ():
    """Make sure 'os.environ' holds the variables we promise to users.

    These variables may be referenced in config files, command-line
    options, etc.  Currently they are:
      HOME - user's home directory (Unix only)
      PLAT - description of the current platform, including hardware
             and OS (see 'get_platform()')

    Variables that are already set are left alone.  Only the first call
    does any work; later calls return immediately.
    """
    global _environ_checked
    if _environ_checked:
        return

    env = os.environ

    if os.name == 'posix' and 'HOME' not in env:
        try:
            import pwd
            env['HOME'] = pwd.getpwuid(os.getuid()).pw_dir
        except (ImportError, KeyError):
            # bpo-10496: if the current user identifier doesn't exist in
            # the password database, do nothing
            pass

    if 'PLAT' not in env:
        env['PLAT'] = get_platform()

    _environ_checked = 1
| 172 | |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 173 | |
def subst_vars(s, local_vars):
    """Perform shell/Perl-style variable substitution on the string 's'.

    Every occurrence of '$' followed by a name (a letter or underscore,
    then letters, digits or underscores) is treated as a variable and is
    replaced by the value found in the 'local_vars' dictionary (converted
    with 'str()'), or in 'os.environ' if it's not in 'local_vars'.
    'os.environ' is first checked/augmented to guarantee that it contains
    certain values: see 'check_environ()'.

    Returns the substituted string.  Raises ValueError for any variable
    found in neither 'local_vars' nor 'os.environ'.
    """
    check_environ()

    def _subst(match):
        var_name = match.group(1)
        if var_name in local_vars:
            return str(local_vars[var_name])
        return os.environ[var_name]

    try:
        return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
    except KeyError as exc:
        # Format the missing key, not the KeyError itself: str(KeyError)
        # is the repr of the key and would yield "'$'NAME''".
        raise ValueError("invalid variable '$%s'" % exc.args[0]) from exc
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 195 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 196 | # subst_vars () |
Greg Ward | 7c1a6d4 | 2000-03-29 02:48:40 +0000 | [diff] [blame] | 197 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 198 | |
def grok_environment_error(exc, prefix="error: "):
    """Return 'prefix' followed by the string form of exception 'exc'.

    Kept only for backward compatibility: this function used to try clever
    things with EnvironmentErrors, but nowadays str(exception) already
    produces good messages.
    """
    message = str(exc)
    return prefix + message
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 204 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 205 | |
# Patterns needed by 'split_quoted()'; compiled lazily by '_init_regex()'.
_wordchars_re = _squote_re = _dquote_re = None


def _init_regex():
    """Compile the three module-level patterns used by 'split_quoted()'."""
    global _wordchars_re, _squote_re, _dquote_re
    # A run of characters that are neither backslash, quote nor whitespace.
    _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
    # A complete single-/double-quoted string, allowing backslash escapes.
    _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
    _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')


def split_quoted(s):
    """Split a string into words using Unix shell-like quoting rules.

    Words are separated by whitespace, except whitespace that is escaped
    with a backslash or that sits inside a quoted string.  Single and
    double quotes are equivalent.  Outside quotes, the backslash of a
    two-character escape sequence is dropped and the escaped character
    kept.  The quote characters surrounding a quoted string are removed.

    Returns the list of words.  Raises ValueError if a quote is not
    closed.
    """
    # The text is consumed word by word.  'remaining' always starts at the
    # beginning of the word being assembled and 'scan_from' is the offset
    # inside it up to which characters have already been accepted; this
    # avoids examining the string character by character.
    if _wordchars_re is None:
        _init_regex()

    remaining = s.strip()
    result = []
    scan_from = 0

    while remaining:
        stop = _wordchars_re.match(remaining, scan_from).end()
        if stop == len(remaining):
            result.append(remaining[:stop])
            break

        char = remaining[stop]
        if char in string.whitespace:
            # unescaped, unquoted whitespace: definitely a word delimiter
            result.append(remaining[:stop])
            remaining = remaining[stop:].lstrip()
            scan_from = 0

        elif char == '\\':
            # drop the backslash; whatever it escapes becomes part of the
            # current word
            remaining = remaining[:stop] + remaining[stop + 1:]
            scan_from = stop + 1

        else:
            if char == "'":             # slurp singly-quoted string
                quoted = _squote_re.match(remaining, stop)
            elif char == '"':           # slurp doubly-quoted string
                quoted = _dquote_re.match(remaining, stop)
            else:
                raise RuntimeError("this can't happen (bad char '%c')" % char)

            if quoted is None:
                raise ValueError("bad string (mismatched %s quotes?)" % char)

            # Cut the two quote characters out and continue scanning right
            # after the (now unquoted) text.
            open_idx, close_idx = quoted.span()
            remaining = (remaining[:open_idx]
                         + remaining[open_idx + 1:close_idx - 1]
                         + remaining[close_idx:])
            scan_from = close_idx - 2

        if scan_from >= len(remaining):
            result.append(remaining)
            break

    return result
| 271 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 272 | # split_quoted () |
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 273 | |
| 274 | |
def execute(func, args, msg=None, verbose=0, dry_run=0):
    """Run an action that affects the outside world, honouring 'dry_run'.

    Such actions (e.g. writing to the filesystem) are special because the
    'dry_run' flag disables them.  'func' is the function to call and
    'args' the tuple of arguments for it.  'msg' is logged at info level
    before the call; when it is None, a message is built from the
    function name and its arguments.  'verbose' is accepted but not used
    here.  When 'dry_run' is true the message is still logged but 'func'
    is not called.
    """
    if msg is None:
        msg = "%s%r" % (func.__name__, args)
        if msg.endswith(',)'):          # correct for singleton tuple
            msg = msg[:-2] + ')'

    log.info(msg)
    if dry_run:
        return
    func(*args)
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 292 | |
Greg Ward | 817dc09 | 2000-09-25 01:25:06 +0000 | [diff] [blame] | 293 | |
def strtobool(val):
    """Convert a string representation of truth to true (1) or false (0).

    The comparison ignores case.  True values are 'y', 'yes', 't', 'true',
    'on', and '1'; false values are 'n', 'no', 'f', 'false', 'off', and
    '0'.  Raises ValueError if 'val' is anything else.
    """
    val = val.lower()
    if val in {'y', 'yes', 't', 'true', 'on', '1'}:
        return 1
    if val in {'n', 'no', 'f', 'false', 'off', '0'}:
        return 0
    raise ValueError("invalid truth value %r" % (val,))
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 308 | |
| 309 | |
def byte_compile(py_files,
                 optimize=0, force=0,
                 prefix=None, base_dir=None,
                 verbose=1, dry_run=0,
                 direct=None):
    """Byte-compile a collection of Python source files to .pyc
    files in a __pycache__ subdirectory.  'py_files' is a list
    of files to compile; any files that don't end in ".py" are silently
    skipped.  'optimize' must be one of the following:
      0 - don't optimize
      1 - normal optimization (like "python -O")
      2 - extra optimization (like "python -OO")
    If 'force' is true, all files are recompiled regardless of
    timestamps.

    The source filename encoded in each bytecode file defaults to the
    filenames listed in 'py_files'; you can modify these with 'prefix' and
    'base_dir'.  'prefix' is a string that will be stripped off of each
    source filename, and 'base_dir' is a directory name that will be
    prepended (after 'prefix' is stripped).  You can supply either or both
    (or neither) of 'prefix' and 'base_dir', as you wish.

    If 'dry_run' is true, doesn't actually do anything that would
    affect the filesystem.

    Byte-compilation is either done directly in this interpreter process
    with the standard py_compile module, or indirectly by writing a
    temporary script and executing it.  Normally, you should let
    'byte_compile()' figure out to use direct compilation or not (see
    the source for details).  The 'direct' flag is used by the script
    generated in indirect mode; unless you know what you're doing, leave
    it set to None.

    Raises DistutilsByteCompileError if 'sys.dont_write_bytecode' is set,
    and ValueError if 'prefix' is given but a file name does not start
    with it.
    """

    # Late import to fix a bootstrap issue: _posixsubprocess is built by
    # setup.py, but setup.py uses distutils.
    import subprocess

    # nothing is done if sys.dont_write_bytecode is True
    if sys.dont_write_bytecode:
        raise DistutilsByteCompileError('byte-compiling is disabled.')

    # First, if the caller didn't force us into direct or indirect mode,
    # figure out which mode we should be in.  We take a conservative
    # approach: choose direct mode *only* if the current interpreter is
    # in debug mode and optimize is 0.  If we're not in debug mode (-O
    # or -OO), we don't know which level of optimization this
    # interpreter is running with, so we can't do direct
    # byte-compilation and be certain that it's the right thing.  Thus,
    # always compile indirectly if the current interpreter is in either
    # optimize mode, or if either optimization level was requested by
    # the caller.
    if direct is None:
        direct = (__debug__ and optimize == 0)

    # "Indirect" byte-compilation: write a temporary script and then
    # run it with the appropriate flags.
    if not direct:
        from tempfile import mkstemp
        script_fd, script_name = mkstemp(".py")
        log.info("writing byte-compilation script '%s'", script_name)
        try:
            if dry_run:
                # mkstemp() has already created the file and opened a
                # descriptor; undo both so that a dry run neither leaks
                # the descriptor nor leaves a stray file behind.
                os.close(script_fd)
                os.remove(script_name)
            else:
                with os.fdopen(script_fd, "w") as script:
                    script.write("""\
from distutils.util import byte_compile
files = [
""")

                    # XXX would be nice to write absolute filenames, just
                    # for safety's sake (script should be more robust in
                    # the face of chdir'ing before running it).  But this
                    # requires abspath'ing 'prefix' as well, and that
                    # breaks the hack in build_lib's 'byte_compile()'
                    # method that carefully tacks on a trailing slash
                    # (os.sep really) to make sure the prefix here is
                    # "just right".  This whole prefix business is rather
                    # delicate -- the problem is that it's really a
                    # directory, but I'm treating it as a dumb string, so
                    # trailing slashes and so forth matter.

                    script.write(",\n".join(map(repr, py_files)) + "]\n")
                    script.write("""
byte_compile(files, optimize=%r, force=%r,
             prefix=%r, base_dir=%r,
             verbose=%r, dry_run=0,
             direct=1)
""" % (optimize, force, prefix, base_dir, verbose))

            cmd = [sys.executable]
            cmd.extend(subprocess._optim_args_from_interpreter_flags())
            cmd.append(script_name)
            spawn(cmd, dry_run=dry_run)
        finally:
            # Remove the script even when writing or running it failed.
            execute(os.remove, (script_name,), "removing %s" % script_name,
                    dry_run=dry_run)

    # "Direct" byte-compilation: use the py_compile module to compile
    # right here, right now.  Note that the script generated in indirect
    # mode simply calls 'byte_compile()' in direct mode, a weird sort of
    # cross-process recursion.  Hey, it works!
    else:
        from py_compile import compile

        for file in py_files:
            if not file.endswith(".py"):
                # This lets us be lazy and not filter filenames in
                # the "install_lib" command.
                continue

            # Terminology from the py_compile module:
            #   cfile - byte-compiled file
            #   dfile - purported source filename (same as 'file' by default)
            if optimize >= 0:
                opt = '' if optimize == 0 else optimize
                cfile = importlib.util.cache_from_source(
                    file, optimization=opt)
            else:
                cfile = importlib.util.cache_from_source(file)
            dfile = file
            if prefix:
                if not file.startswith(prefix):
                    raise ValueError("invalid prefix: filename %r doesn't start with %r"
                                     % (file, prefix))
                dfile = dfile[len(prefix):]
            if base_dir:
                dfile = os.path.join(base_dir, dfile)

            cfile_base = os.path.basename(cfile)
            if force or newer(file, cfile):
                log.info("byte-compiling %s to %s", file, cfile_base)
                if not dry_run:
                    compile(file, cfile, dfile)
            else:
                log.debug("skipping byte-compilation of %s to %s",
                          file, cfile_base)
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 456 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 457 | # byte_compile () |
Andrew M. Kuchling | df66df0 | 2001-03-22 03:03:41 +0000 | [diff] [blame] | 458 | |
def rfc822_escape(header):
    """Return 'header' escaped for inclusion in an RFC-822 header.

    Every newline in the string is followed by 8 spaces, so that each
    line after the first starts with that indentation.
    """
    continuation = '\n' + ' ' * 8
    return header.replace('\n', continuation)
Martin v. Löwis | 6178db6 | 2008-12-01 04:38:52 +0000 | [diff] [blame] | 466 | |
| 467 | # 2to3 support |
| 468 | |
def run_2to3(files, fixer_names=None, options=None, explicit=None):
    """Invoke 2to3 on a list of Python files.

    The files should all come from the build area, as the
    modification is done in-place. To reduce the build time,
    only files modified since the last invocation of this
    function should be passed in the files argument.

    'fixer_names' is the list of fixers to run; when it is None, all
    fixers found in the 'lib2to3.fixes' package are used.  'options'
    and 'explicit' are handed to the refactoring tool unchanged;
    'explicit' lists fixers to invoke even though they are marked as
    explicit.

    Returns None.  Nothing is imported or run when 'files' is empty.
    """
    if not files:
        return

    # Make this class local, to delay import of 2to3
    from lib2to3.refactor import RefactoringTool, get_fixers_from_package

    class DistutilsRefactoringTool(RefactoringTool):
        # Route the refactoring tool's messages through the distutils
        # logger.  Keyword arguments given to log_error are dropped.
        def log_error(self, msg, *args, **kw):
            log.error(msg, *args)

        def log_message(self, msg, *args):
            log.info(msg, *args)

        def log_debug(self, msg, *args):
            log.debug(msg, *args)

    if fixer_names is None:
        fixer_names = get_fixers_from_package('lib2to3.fixes')
    # 'explicit' must be forwarded here: without it the argument is
    # silently ignored and explicit-only fixers can never be enabled.
    r = DistutilsRefactoringTool(fixer_names, options=options,
                                 explicit=explicit)
    r.refactor(files, write=True)
| 495 | |
def copydir_run_2to3(src, dest, template=None, fixer_names=None,
                     options=None, explicit=None):
    """Copy the directory tree 'src' into 'dest' and run 2to3 on the result.

    Only new and changed files are copied (copy_file() is called with
    update=1); run_2to3() is then run over the freshly copied files
    whose names end in '.py' (case-insensitively).

    If 'template' is given, each non-blank line of it is processed like
    a line of a MANIFEST.in.  'fixer_names', 'options' and 'explicit'
    are passed through to run_2to3().

    Returns the list of destination paths that were actually copied.
    """
    from distutils.dir_util import mkpath
    from distutils.file_util import copy_file
    from distutils.filelist import FileList

    manifest = FileList()

    # findall() is run with 'src' as the working directory; the previous
    # working directory is restored even if the scan fails.
    # (presumably so the collected names are relative to 'src' -- they
    # are joined onto both 'src' and 'dest' below)
    original_cwd = os.getcwd()
    os.chdir(src)
    try:
        manifest.findall()
    finally:
        os.chdir(original_cwd)

    # Start from every file found, then let the template adjust the list.
    manifest.files[:] = manifest.allfiles
    if template:
        for raw_line in template.splitlines():
            stripped = raw_line.strip()
            if stripped:
                manifest.process_template_line(stripped)

    copied = []
    for relname in manifest.files:
        target = os.path.join(dest, relname)
        mkpath(os.path.dirname(target))
        result = copy_file(os.path.join(src, relname), target, update=1)
        # The second item of copy_file()'s result is true only when the
        # file was really copied.
        if result[1]:
            copied.append(target)

    python_files = [path for path in copied if path.lower().endswith('.py')]
    run_2to3(python_files,
             fixer_names=fixer_names, options=options, explicit=explicit)
    return copied
| 528 | |
class Mixin2to3:
    '''Mixin class for commands that run 2to3.

    Setup scripts can configure 2to3 either by changing the class
    variables below, or by inheriting from an individual command and
    overriding how 2to3 is invoked.
    '''

    # List of fixers to run.  None is passed through to run_2to3(),
    # which then uses every fixer in the lib2to3.fixes package.
    fixer_names = None

    # Options dictionary handed to run_2to3().
    options = None

    # List of fixers to invoke even though they are marked as explicit.
    explicit = None

    def run_2to3(self, files):
        """Run the module-level run_2to3() on 'files' with this class's
        fixer_names, options and explicit settings; return its result."""
        return run_2to3(
            files,
            fixer_names=self.fixer_names,
            options=self.options,
            explicit=self.explicit,
        )