Greg Ward | 2689e3d | 1999-03-22 14:52:19 +0000 | [diff] [blame] | 1 | """distutils.util |
| 2 | |
Greg Ward | aebf706 | 2000-04-04 02:05:59 +0000 | [diff] [blame] | 3 | Miscellaneous utility functions -- anything that doesn't fit into |
Greg Ward | 4752769 | 2000-09-30 18:49:14 +0000 | [diff] [blame] | 4 | one of the other *util.py modules. |
| 5 | """ |
Greg Ward | 2689e3d | 1999-03-22 14:52:19 +0000 | [diff] [blame] | 6 | |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 7 | import sys, os, string, re |
| 8 | from distutils.errors import DistutilsPlatformError |
| 9 | from distutils.dep_util import newer |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 10 | from distutils.spawn import spawn |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 11 | from distutils import log |
Tarek Ziadé | 04fe7c0 | 2009-10-25 23:08:47 +0000 | [diff] [blame] | 12 | from distutils.errors import DistutilsByteCompileError |
Greg Ward | aa458bc | 2000-04-22 15:14:58 +0000 | [diff] [blame] | 13 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 14 | def get_platform (): |
| 15 | """Return a string that identifies the current platform. This is used |
| 16 | mainly to distinguish platform-specific build directories and |
| 17 | platform-specific built distributions. Typically includes the OS name |
| 18 | and version and the architecture (as supplied by 'os.uname()'), |
| 19 | although the exact information included depends on the OS; eg. for IRIX |
| 20 | the architecture isn't particularly important (IRIX only runs on SGI |
| 21 | hardware), but for Linux the kernel version isn't particularly |
| 22 | important. |
Tarek Ziadé | 8b441d0 | 2010-01-29 11:46:31 +0000 | [diff] [blame] | 23 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 24 | Examples of returned values: |
| 25 | linux-i586 |
| 26 | linux-alpha (?) |
| 27 | solaris-2.6-sun4u |
| 28 | irix-5.3 |
| 29 | irix64-6.2 |
Tarek Ziadé | 8b441d0 | 2010-01-29 11:46:31 +0000 | [diff] [blame] | 30 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 31 | Windows will return one of: |
| 32 | win-amd64 (64bit Windows on AMD64 (aka x86_64, Intel64, EM64T, etc) |
| 33 | win-ia64 (64bit Windows on Itanium) |
| 34 | win32 (all others - specifically, sys.platform is returned) |
| 35 | |
| 36 | For other non-POSIX platforms, currently just returns 'sys.platform'. |
Tarek Ziadé | 8b441d0 | 2010-01-29 11:46:31 +0000 | [diff] [blame] | 37 | """ |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 38 | if os.name == 'nt': |
| 39 | # sniff sys.version for architecture. |
| 40 | prefix = " bit (" |
| 41 | i = sys.version.find(prefix) |
| 42 | if i == -1: |
| 43 | return sys.platform |
| 44 | j = sys.version.find(")", i) |
| 45 | look = sys.version[i+len(prefix):j].lower() |
| 46 | if look == 'amd64': |
| 47 | return 'win-amd64' |
| 48 | if look == 'itanium': |
| 49 | return 'win-ia64' |
| 50 | return sys.platform |
Tarek Ziadé | 8b441d0 | 2010-01-29 11:46:31 +0000 | [diff] [blame] | 51 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 52 | if os.name != "posix" or not hasattr(os, 'uname'): |
| 53 | # XXX what about the architecture? NT is Intel or Alpha, |
| 54 | # Mac OS is M68k or PPC, etc. |
| 55 | return sys.platform |
Tarek Ziadé | 8b441d0 | 2010-01-29 11:46:31 +0000 | [diff] [blame] | 56 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 57 | # Try to distinguish various flavours of Unix |
Greg Ward | 5091929 | 2000-03-07 03:27:08 +0000 | [diff] [blame] | 58 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 59 | (osname, host, release, version, machine) = os.uname() |
Greg Ward | 5091929 | 2000-03-07 03:27:08 +0000 | [diff] [blame] | 60 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 61 | # Convert the OS name to lowercase, remove '/' characters |
| 62 | # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh") |
| 63 | osname = osname.lower().replace('/', '') |
| 64 | machine = machine.replace(' ', '_') |
| 65 | machine = machine.replace('/', '-') |
| 66 | |
| 67 | if osname[:5] == "linux": |
| 68 | # At least on Linux/Intel, 'machine' is the processor -- |
| 69 | # i386, etc. |
| 70 | # XXX what about Alpha, SPARC, etc? |
| 71 | return "%s-%s" % (osname, machine) |
| 72 | elif osname[:5] == "sunos": |
| 73 | if release[0] >= "5": # SunOS 5 == Solaris 2 |
| 74 | osname = "solaris" |
| 75 | release = "%d.%s" % (int(release[0]) - 3, release[2:]) |
| 76 | # fall through to standard osname-release-machine representation |
| 77 | elif osname[:4] == "irix": # could be "irix64"! |
| 78 | return "%s-%s" % (osname, release) |
| 79 | elif osname[:3] == "aix": |
| 80 | return "%s-%s.%s" % (osname, version, release) |
| 81 | elif osname[:6] == "cygwin": |
| 82 | osname = "cygwin" |
| 83 | rel_re = re.compile (r'[\d.]+', re.ASCII) |
| 84 | m = rel_re.match(release) |
| 85 | if m: |
| 86 | release = m.group() |
| 87 | elif osname[:6] == "darwin": |
| 88 | # |
| 89 | # For our purposes, we'll assume that the system version from |
| 90 | # distutils' perspective is what MACOSX_DEPLOYMENT_TARGET is set |
| 91 | # to. This makes the compatibility story a bit more sane because the |
| 92 | # machine is going to compile and link as if it were |
| 93 | # MACOSX_DEPLOYMENT_TARGET. |
| 94 | from distutils.sysconfig import get_config_vars |
| 95 | cfgvars = get_config_vars() |
| 96 | |
Ronald Oussoren | 222e89a | 2011-05-15 16:46:11 +0200 | [diff] [blame] | 97 | macver = cfgvars.get('MACOSX_DEPLOYMENT_TARGET') |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 98 | |
| 99 | if 1: |
| 100 | # Always calculate the release of the running machine, |
| 101 | # needed to determine if we can build fat binaries or not. |
| 102 | |
| 103 | macrelease = macver |
| 104 | # Get the system version. Reading this plist is a documented |
| 105 | # way to get the system version (see the documentation for |
| 106 | # the Gestalt Manager) |
| 107 | try: |
| 108 | f = open('/System/Library/CoreServices/SystemVersion.plist') |
| 109 | except IOError: |
| 110 | # We're on a plain darwin box, fall back to the default |
| 111 | # behaviour. |
| 112 | pass |
| 113 | else: |
Éric Araujo | bee5cef | 2010-11-05 23:51:56 +0000 | [diff] [blame] | 114 | try: |
| 115 | m = re.search( |
| 116 | r'<key>ProductUserVisibleVersion</key>\s*' + |
| 117 | r'<string>(.*?)</string>', f.read()) |
| 118 | if m is not None: |
| 119 | macrelease = '.'.join(m.group(1).split('.')[:2]) |
| 120 | # else: fall back to the default behaviour |
| 121 | finally: |
| 122 | f.close() |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 123 | |
| 124 | if not macver: |
| 125 | macver = macrelease |
| 126 | |
| 127 | if macver: |
| 128 | from distutils.sysconfig import get_config_vars |
| 129 | release = macver |
| 130 | osname = "macosx" |
| 131 | |
| 132 | if (macrelease + '.') >= '10.4.' and \ |
| 133 | '-arch' in get_config_vars().get('CFLAGS', '').strip(): |
| 134 | # The universal build will build fat binaries, but not on |
| 135 | # systems before 10.4 |
| 136 | # |
| 137 | # Try to detect 4-way universal builds, those have machine-type |
| 138 | # 'universal' instead of 'fat'. |
| 139 | |
| 140 | machine = 'fat' |
| 141 | cflags = get_config_vars().get('CFLAGS') |
| 142 | |
| 143 | archs = re.findall('-arch\s+(\S+)', cflags) |
| 144 | archs = tuple(sorted(set(archs))) |
| 145 | |
| 146 | if len(archs) == 1: |
| 147 | machine = archs[0] |
| 148 | elif archs == ('i386', 'ppc'): |
| 149 | machine = 'fat' |
| 150 | elif archs == ('i386', 'x86_64'): |
| 151 | machine = 'intel' |
| 152 | elif archs == ('i386', 'ppc', 'x86_64'): |
| 153 | machine = 'fat3' |
| 154 | elif archs == ('ppc64', 'x86_64'): |
| 155 | machine = 'fat64' |
| 156 | elif archs == ('i386', 'ppc', 'ppc64', 'x86_64'): |
| 157 | machine = 'universal' |
| 158 | else: |
| 159 | raise ValueError( |
| 160 | "Don't know machine value for archs=%r"%(archs,)) |
| 161 | |
| 162 | elif machine == 'i386': |
| 163 | # On OSX the machine type returned by uname is always the |
| 164 | # 32-bit variant, even if the executable architecture is |
| 165 | # the 64-bit variant |
| 166 | if sys.maxsize >= 2**32: |
| 167 | machine = 'x86_64' |
| 168 | |
| 169 | elif machine in ('PowerPC', 'Power_Macintosh'): |
| 170 | # Pick a sane name for the PPC architecture. |
| 171 | machine = 'ppc' |
| 172 | |
| 173 | # See 'i386' case |
| 174 | if sys.maxsize >= 2**32: |
| 175 | machine = 'ppc64' |
| 176 | |
| 177 | return "%s-%s-%s" % (osname, release, machine) |
| 178 | |
| 179 | # get_platform () |
| 180 | |
| 181 | |
| 182 | def convert_path (pathname): |
| 183 | """Return 'pathname' as a name that will work on the native filesystem, |
Greg Ward | b8b263b | 2000-09-30 18:40:42 +0000 | [diff] [blame] | 184 | i.e. split it on '/' and put it back together again using the current |
| 185 | directory separator. Needed because filenames in the setup script are |
| 186 | always supplied in Unix style, and have to be converted to the local |
| 187 | convention before we can actually use them in the filesystem. Raises |
Greg Ward | 4752769 | 2000-09-30 18:49:14 +0000 | [diff] [blame] | 188 | ValueError on non-Unix-ish systems if 'pathname' either starts or |
| 189 | ends with a slash. |
Greg Ward | b8b263b | 2000-09-30 18:40:42 +0000 | [diff] [blame] | 190 | """ |
Greg Ward | 7ec0535 | 2000-09-22 01:05:43 +0000 | [diff] [blame] | 191 | if os.sep == '/': |
| 192 | return pathname |
Neal Norwitz | b0df6a1 | 2002-08-13 17:42:57 +0000 | [diff] [blame] | 193 | if not pathname: |
| 194 | return pathname |
| 195 | if pathname[0] == '/': |
Collin Winter | 5b7e9d7 | 2007-08-30 03:52:21 +0000 | [diff] [blame] | 196 | raise ValueError("path '%s' cannot be absolute" % pathname) |
Neal Norwitz | b0df6a1 | 2002-08-13 17:42:57 +0000 | [diff] [blame] | 197 | if pathname[-1] == '/': |
Collin Winter | 5b7e9d7 | 2007-08-30 03:52:21 +0000 | [diff] [blame] | 198 | raise ValueError("path '%s' cannot end with '/'" % pathname) |
Greg Ward | 7ec0535 | 2000-09-22 01:05:43 +0000 | [diff] [blame] | 199 | |
Neal Norwitz | 9d72bb4 | 2007-04-17 08:48:32 +0000 | [diff] [blame] | 200 | paths = pathname.split('/') |
Jack Jansen | b4cd5c1 | 2001-01-28 12:23:32 +0000 | [diff] [blame] | 201 | while '.' in paths: |
| 202 | paths.remove('.') |
| 203 | if not paths: |
| 204 | return os.curdir |
Neal Norwitz | d910855 | 2006-03-17 08:00:19 +0000 | [diff] [blame] | 205 | return os.path.join(*paths) |
Greg Ward | 5091929 | 2000-03-07 03:27:08 +0000 | [diff] [blame] | 206 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 207 | # convert_path () |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 208 | |
| 209 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 210 | def change_root (new_root, pathname): |
| 211 | """Return 'pathname' with 'new_root' prepended. If 'pathname' is |
| 212 | relative, this is equivalent to "os.path.join(new_root,pathname)". |
Greg Ward | 67f75d4 | 2000-04-27 01:53:46 +0000 | [diff] [blame] | 213 | Otherwise, it requires making 'pathname' relative and then joining the |
Greg Ward | 4b46ef9 | 2000-05-31 02:14:32 +0000 | [diff] [blame] | 214 | two, which is tricky on DOS/Windows and Mac OS. |
| 215 | """ |
| 216 | if os.name == 'posix': |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 217 | if not os.path.isabs(pathname): |
| 218 | return os.path.join(new_root, pathname) |
Greg Ward | 4b46ef9 | 2000-05-31 02:14:32 +0000 | [diff] [blame] | 219 | else: |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 220 | return os.path.join(new_root, pathname[1:]) |
Greg Ward | 67f75d4 | 2000-04-27 01:53:46 +0000 | [diff] [blame] | 221 | |
| 222 | elif os.name == 'nt': |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 223 | (drive, path) = os.path.splitdrive(pathname) |
Greg Ward | 4b46ef9 | 2000-05-31 02:14:32 +0000 | [diff] [blame] | 224 | if path[0] == '\\': |
| 225 | path = path[1:] |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 226 | return os.path.join(new_root, path) |
Greg Ward | 67f75d4 | 2000-04-27 01:53:46 +0000 | [diff] [blame] | 227 | |
Marc-André Lemburg | 2544f51 | 2002-01-31 18:56:00 +0000 | [diff] [blame] | 228 | elif os.name == 'os2': |
| 229 | (drive, path) = os.path.splitdrive(pathname) |
| 230 | if path[0] == os.sep: |
| 231 | path = path[1:] |
| 232 | return os.path.join(new_root, path) |
| 233 | |
Greg Ward | 67f75d4 | 2000-04-27 01:53:46 +0000 | [diff] [blame] | 234 | else: |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 235 | raise DistutilsPlatformError("nothing known about platform '%s'" % os.name) |
| 236 | |
Greg Ward | 67f75d4 | 2000-04-27 01:53:46 +0000 | [diff] [blame] | 237 | |
Gregory P. Smith | e7e35ac | 2000-05-12 00:40:00 +0000 | [diff] [blame] | 238 | _environ_checked = 0 |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 239 | def check_environ (): |
| 240 | """Ensure that 'os.environ' has all the environment variables we |
| 241 | guarantee that users can use in config files, command-line options, |
Greg Ward | b8b263b | 2000-09-30 18:40:42 +0000 | [diff] [blame] | 242 | etc. Currently this includes: |
| 243 | HOME - user's home directory (Unix only) |
| 244 | PLAT - description of the current platform, including hardware |
| 245 | and OS (see 'get_platform()') |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 246 | """ |
Gregory P. Smith | e7e35ac | 2000-05-12 00:40:00 +0000 | [diff] [blame] | 247 | global _environ_checked |
| 248 | if _environ_checked: |
| 249 | return |
| 250 | |
Guido van Rossum | e2b70bc | 2006-08-18 22:13:04 +0000 | [diff] [blame] | 251 | if os.name == 'posix' and 'HOME' not in os.environ: |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 252 | import pwd |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 253 | os.environ['HOME'] = pwd.getpwuid(os.getuid())[5] |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 254 | |
Guido van Rossum | e2b70bc | 2006-08-18 22:13:04 +0000 | [diff] [blame] | 255 | if 'PLAT' not in os.environ: |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 256 | os.environ['PLAT'] = get_platform() |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 257 | |
Gregory P. Smith | e7e35ac | 2000-05-12 00:40:00 +0000 | [diff] [blame] | 258 | _environ_checked = 1 |
| 259 | |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 260 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 261 | def subst_vars (s, local_vars): |
| 262 | """Perform shell/Perl-style variable substitution on 'string'. Every |
| 263 | occurrence of '$' followed by a name is considered a variable, and |
Greg Ward | 4752769 | 2000-09-30 18:49:14 +0000 | [diff] [blame] | 264 | variable is substituted by the value found in the 'local_vars' |
| 265 | dictionary, or in 'os.environ' if it's not in 'local_vars'. |
| 266 | 'os.environ' is first checked/augmented to guarantee that it contains |
| 267 | certain values: see 'check_environ()'. Raise ValueError for any |
| 268 | variables not found in either 'local_vars' or 'os.environ'. |
Greg Ward | b8b263b | 2000-09-30 18:40:42 +0000 | [diff] [blame] | 269 | """ |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 270 | check_environ() |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 271 | def _subst (match, local_vars=local_vars): |
| 272 | var_name = match.group(1) |
Guido van Rossum | e2b70bc | 2006-08-18 22:13:04 +0000 | [diff] [blame] | 273 | if var_name in local_vars: |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 274 | return str(local_vars[var_name]) |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 275 | else: |
| 276 | return os.environ[var_name] |
| 277 | |
Greg Ward | 4752769 | 2000-09-30 18:49:14 +0000 | [diff] [blame] | 278 | try: |
Jeremy Hylton | 5e2d076 | 2001-01-25 20:10:32 +0000 | [diff] [blame] | 279 | return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s) |
Guido van Rossum | b940e11 | 2007-01-10 16:19:56 +0000 | [diff] [blame] | 280 | except KeyError as var: |
Collin Winter | 5b7e9d7 | 2007-08-30 03:52:21 +0000 | [diff] [blame] | 281 | raise ValueError("invalid variable '$%s'" % var) |
Greg Ward | 1b4ede5 | 2000-03-22 00:22:44 +0000 | [diff] [blame] | 282 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 283 | # subst_vars () |
Greg Ward | 7c1a6d4 | 2000-03-29 02:48:40 +0000 | [diff] [blame] | 284 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 285 | |
| 286 | def grok_environment_error (exc, prefix="error: "): |
| 287 | """Generate a useful error message from an EnvironmentError (IOError or |
| 288 | OSError) exception object. Handles Python 1.5.1 and 1.5.2 styles, and |
Greg Ward | e905513 | 2000-06-17 02:16:46 +0000 | [diff] [blame] | 289 | does what it can to deal with exception objects that don't have a |
| 290 | filename (which happens when the error is due to a two-file operation, |
| 291 | such as 'rename()' or 'link()'. Returns the error message as a string |
| 292 | prefixed with 'prefix'. |
| 293 | """ |
| 294 | # check for Python 1.5.2-style {IO,OS}Error exception objects |
Greg Ward | be86bde | 2000-09-26 01:56:15 +0000 | [diff] [blame] | 295 | if hasattr(exc, 'filename') and hasattr(exc, 'strerror'): |
Greg Ward | e905513 | 2000-06-17 02:16:46 +0000 | [diff] [blame] | 296 | if exc.filename: |
| 297 | error = prefix + "%s: %s" % (exc.filename, exc.strerror) |
| 298 | else: |
| 299 | # two-argument functions in posix module don't |
| 300 | # include the filename in the exception object! |
| 301 | error = prefix + "%s" % exc.strerror |
| 302 | else: |
Georg Brandl | 5dfe0de | 2008-01-06 21:41:49 +0000 | [diff] [blame] | 303 | error = prefix + str(exc.args[-1]) |
Greg Ward | e905513 | 2000-06-17 02:16:46 +0000 | [diff] [blame] | 304 | |
| 305 | return error |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 306 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 307 | |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 308 | # Needed by 'split_quoted()' |
Martin v. Löwis | 1c0f1f9 | 2004-03-25 14:58:19 +0000 | [diff] [blame] | 309 | _wordchars_re = _squote_re = _dquote_re = None |
| 310 | def _init_regex(): |
| 311 | global _wordchars_re, _squote_re, _dquote_re |
| 312 | _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace) |
| 313 | _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'") |
| 314 | _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"') |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 315 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 316 | def split_quoted (s): |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 317 | """Split a string up according to Unix shell-like rules for quotes and |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 318 | backslashes. In short: words are delimited by spaces, as long as those |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 319 | spaces are not escaped by a backslash, or inside a quoted string. |
| 320 | Single and double quotes are equivalent, and the quote characters can |
| 321 | be backslash-escaped. The backslash is stripped from any two-character |
| 322 | escape sequence, leaving only the escaped character. The quote |
| 323 | characters are stripped from any quoted string. Returns a list of |
| 324 | words. |
| 325 | """ |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 326 | |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 327 | # This is a nice algorithm for splitting up a single string, since it |
| 328 | # doesn't require character-by-character examination. It was a little |
| 329 | # bit of a brain-bender to get it working right, though... |
Martin v. Löwis | 1c0f1f9 | 2004-03-25 14:58:19 +0000 | [diff] [blame] | 330 | if _wordchars_re is None: _init_regex() |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 331 | |
Neal Norwitz | 9d72bb4 | 2007-04-17 08:48:32 +0000 | [diff] [blame] | 332 | s = s.strip() |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 333 | words = [] |
| 334 | pos = 0 |
| 335 | |
| 336 | while s: |
| 337 | m = _wordchars_re.match(s, pos) |
| 338 | end = m.end() |
| 339 | if end == len(s): |
| 340 | words.append(s[:end]) |
| 341 | break |
| 342 | |
Greg Ward | 2b042de | 2000-08-08 14:38:13 +0000 | [diff] [blame] | 343 | if s[end] in string.whitespace: # unescaped, unquoted whitespace: now |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 344 | words.append(s[:end]) # we definitely have a word delimiter |
Neal Norwitz | 9d72bb4 | 2007-04-17 08:48:32 +0000 | [diff] [blame] | 345 | s = s[end:].lstrip() |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 346 | pos = 0 |
| 347 | |
| 348 | elif s[end] == '\\': # preserve whatever is being escaped; |
| 349 | # will become part of the current word |
| 350 | s = s[:end] + s[end+1:] |
| 351 | pos = end+1 |
| 352 | |
| 353 | else: |
| 354 | if s[end] == "'": # slurp singly-quoted string |
| 355 | m = _squote_re.match(s, end) |
| 356 | elif s[end] == '"': # slurp doubly-quoted string |
| 357 | m = _dquote_re.match(s, end) |
| 358 | else: |
Collin Winter | 5b7e9d7 | 2007-08-30 03:52:21 +0000 | [diff] [blame] | 359 | raise RuntimeError("this can't happen (bad char '%c')" % s[end]) |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 360 | |
| 361 | if m is None: |
Collin Winter | 5b7e9d7 | 2007-08-30 03:52:21 +0000 | [diff] [blame] | 362 | raise ValueError("bad string (mismatched %s quotes?)" % s[end]) |
Greg Ward | 6a2a3db | 2000-06-24 20:40:02 +0000 | [diff] [blame] | 363 | |
| 364 | (beg, end) = m.span() |
| 365 | s = s[:beg] + s[beg+1:end-1] + s[end:] |
| 366 | pos = m.end() - 2 |
| 367 | |
| 368 | if pos >= len(s): |
| 369 | words.append(s) |
| 370 | break |
| 371 | |
| 372 | return words |
| 373 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 374 | # split_quoted () |
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 375 | |
| 376 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 377 | def execute (func, args, msg=None, verbose=0, dry_run=0): |
| 378 | """Perform some action that affects the outside world (eg. by |
| 379 | writing to the filesystem). Such actions are special because they |
| 380 | are disabled by the 'dry_run' flag. This method takes care of all |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 381 | that bureaucracy for you; all you have to do is supply the |
| 382 | function to call and an argument tuple for it (to embody the |
| 383 | "external action" being performed), and an optional message to |
| 384 | print. |
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 385 | """ |
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 386 | if msg is None: |
Walter Dörwald | 70a6b49 | 2004-02-12 17:35:32 +0000 | [diff] [blame] | 387 | msg = "%s%r" % (func.__name__, args) |
Fred Drake | b94b849 | 2001-12-06 20:51:35 +0000 | [diff] [blame] | 388 | if msg[-2:] == ',)': # correct for singleton tuple |
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 389 | msg = msg[0:-2] + ')' |
| 390 | |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 391 | log.info(msg) |
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 392 | if not dry_run: |
Neal Norwitz | d910855 | 2006-03-17 08:00:19 +0000 | [diff] [blame] | 393 | func(*args) |
Greg Ward | 1c16ac3 | 2000-08-02 01:37:30 +0000 | [diff] [blame] | 394 | |
Greg Ward | 817dc09 | 2000-09-25 01:25:06 +0000 | [diff] [blame] | 395 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 396 | def strtobool (val): |
Greg Ward | 817dc09 | 2000-09-25 01:25:06 +0000 | [diff] [blame] | 397 | """Convert a string representation of truth to true (1) or false (0). |
Tim Peters | 182b5ac | 2004-07-18 06:16:08 +0000 | [diff] [blame] | 398 | |
Greg Ward | 817dc09 | 2000-09-25 01:25:06 +0000 | [diff] [blame] | 399 | True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values |
| 400 | are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if |
| 401 | 'val' is anything else. |
| 402 | """ |
Neal Norwitz | 9d72bb4 | 2007-04-17 08:48:32 +0000 | [diff] [blame] | 403 | val = val.lower() |
Greg Ward | 817dc09 | 2000-09-25 01:25:06 +0000 | [diff] [blame] | 404 | if val in ('y', 'yes', 't', 'true', 'on', '1'): |
| 405 | return 1 |
| 406 | elif val in ('n', 'no', 'f', 'false', 'off', '0'): |
| 407 | return 0 |
| 408 | else: |
Collin Winter | 5b7e9d7 | 2007-08-30 03:52:21 +0000 | [diff] [blame] | 409 | raise ValueError("invalid truth value %r" % (val,)) |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 410 | |
| 411 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 412 | def byte_compile (py_files, |
| 413 | optimize=0, force=0, |
| 414 | prefix=None, base_dir=None, |
| 415 | verbose=1, dry_run=0, |
| 416 | direct=None): |
Greg Ward | f217e21 | 2000-10-01 23:49:30 +0000 | [diff] [blame] | 417 | """Byte-compile a collection of Python source files to either .pyc |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 418 | or .pyo files in the same directory. 'py_files' is a list of files |
| 419 | to compile; any files that don't end in ".py" are silently skipped. |
| 420 | 'optimize' must be one of the following: |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 421 | 0 - don't optimize (generate .pyc) |
| 422 | 1 - normal optimization (like "python -O") |
| 423 | 2 - extra optimization (like "python -OO") |
| 424 | If 'force' is true, all files are recompiled regardless of |
| 425 | timestamps. |
| 426 | |
| 427 | The source filename encoded in each bytecode file defaults to the |
| 428 | filenames listed in 'py_files'; you can modify these with 'prefix' and |
| 429 | 'basedir'. 'prefix' is a string that will be stripped off of each |
| 430 | source filename, and 'base_dir' is a directory name that will be |
| 431 | prepended (after 'prefix' is stripped). You can supply either or both |
| 432 | (or neither) of 'prefix' and 'base_dir', as you wish. |
| 433 | |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 434 | If 'dry_run' is true, doesn't actually do anything that would |
| 435 | affect the filesystem. |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 436 | |
| 437 | Byte-compilation is either done directly in this interpreter process |
| 438 | with the standard py_compile module, or indirectly by writing a |
| 439 | temporary script and executing it. Normally, you should let |
| 440 | 'byte_compile()' figure out to use direct compilation or not (see |
| 441 | the source for details). The 'direct' flag is used by the script |
| 442 | generated in indirect mode; unless you know what you're doing, leave |
| 443 | it set to None. |
| 444 | """ |
Tarek Ziadé | 04fe7c0 | 2009-10-25 23:08:47 +0000 | [diff] [blame] | 445 | # nothing is done if sys.dont_write_bytecode is True |
| 446 | if sys.dont_write_bytecode: |
| 447 | raise DistutilsByteCompileError('byte-compiling is disabled.') |
| 448 | |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 449 | # First, if the caller didn't force us into direct or indirect mode, |
| 450 | # figure out which mode we should be in. We take a conservative |
| 451 | # approach: choose direct mode *only* if the current interpreter is |
| 452 | # in debug mode and optimize is 0. If we're not in debug mode (-O |
| 453 | # or -OO), we don't know which level of optimization this |
| 454 | # interpreter is running with, so we can't do direct |
| 455 | # byte-compilation and be certain that it's the right thing. Thus, |
| 456 | # always compile indirectly if the current interpreter is in either |
| 457 | # optimize mode, or if either optimization level was requested by |
| 458 | # the caller. |
| 459 | if direct is None: |
| 460 | direct = (__debug__ and optimize == 0) |
| 461 | |
| 462 | # "Indirect" byte-compilation: write a temporary script and then |
| 463 | # run it with the appropriate flags. |
| 464 | if not direct: |
Marc-André Lemburg | 0375079 | 2002-12-03 08:45:11 +0000 | [diff] [blame] | 465 | try: |
| 466 | from tempfile import mkstemp |
| 467 | (script_fd, script_name) = mkstemp(".py") |
| 468 | except ImportError: |
| 469 | from tempfile import mktemp |
| 470 | (script_fd, script_name) = None, mktemp(".py") |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 471 | log.info("writing byte-compilation script '%s'", script_name) |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 472 | if not dry_run: |
Marc-André Lemburg | 0375079 | 2002-12-03 08:45:11 +0000 | [diff] [blame] | 473 | if script_fd is not None: |
| 474 | script = os.fdopen(script_fd, "w") |
| 475 | else: |
| 476 | script = open(script_name, "w") |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 477 | |
| 478 | script.write("""\ |
| 479 | from distutils.util import byte_compile |
| 480 | files = [ |
| 481 | """) |
Greg Ward | 9216cfe | 2000-10-03 03:31:05 +0000 | [diff] [blame] | 482 | |
| 483 | # XXX would be nice to write absolute filenames, just for |
| 484 | # safety's sake (script should be more robust in the face of |
| 485 | # chdir'ing before running it). But this requires abspath'ing |
| 486 | # 'prefix' as well, and that breaks the hack in build_lib's |
| 487 | # 'byte_compile()' method that carefully tacks on a trailing |
| 488 | # slash (os.sep really) to make sure the prefix here is "just |
| 489 | # right". This whole prefix business is rather delicate -- the |
| 490 | # problem is that it's really a directory, but I'm treating it |
| 491 | # as a dumb string, so trailing slashes and so forth matter. |
| 492 | |
| 493 | #py_files = map(os.path.abspath, py_files) |
| 494 | #if prefix: |
| 495 | # prefix = os.path.abspath(prefix) |
| 496 | |
Neal Norwitz | 9d72bb4 | 2007-04-17 08:48:32 +0000 | [diff] [blame] | 497 | script.write(",\n".join(map(repr, py_files)) + "]\n") |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 498 | script.write(""" |
Walter Dörwald | 70a6b49 | 2004-02-12 17:35:32 +0000 | [diff] [blame] | 499 | byte_compile(files, optimize=%r, force=%r, |
| 500 | prefix=%r, base_dir=%r, |
| 501 | verbose=%r, dry_run=0, |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 502 | direct=1) |
Walter Dörwald | 70a6b49 | 2004-02-12 17:35:32 +0000 | [diff] [blame] | 503 | """ % (optimize, force, prefix, base_dir, verbose)) |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 504 | |
| 505 | script.close() |
| 506 | |
| 507 | cmd = [sys.executable, script_name] |
| 508 | if optimize == 1: |
| 509 | cmd.insert(1, "-O") |
| 510 | elif optimize == 2: |
| 511 | cmd.insert(1, "-OO") |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 512 | spawn(cmd, dry_run=dry_run) |
Greg Ward | 9216cfe | 2000-10-03 03:31:05 +0000 | [diff] [blame] | 513 | execute(os.remove, (script_name,), "removing %s" % script_name, |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 514 | dry_run=dry_run) |
Fred Drake | b94b849 | 2001-12-06 20:51:35 +0000 | [diff] [blame] | 515 | |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 516 | # "Direct" byte-compilation: use the py_compile module to compile |
| 517 | # right here, right now. Note that the script generated in indirect |
| 518 | # mode simply calls 'byte_compile()' in direct mode, a weird sort of |
| 519 | # cross-process recursion. Hey, it works! |
| 520 | else: |
| 521 | from py_compile import compile |
| 522 | |
| 523 | for file in py_files: |
| 524 | if file[-3:] != ".py": |
Greg Ward | f217e21 | 2000-10-01 23:49:30 +0000 | [diff] [blame] | 525 | # This lets us be lazy and not filter filenames in |
| 526 | # the "install_lib" command. |
| 527 | continue |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 528 | |
| 529 | # Terminology from the py_compile module: |
| 530 | # cfile - byte-compiled file |
| 531 | # dfile - purported source filename (same as 'file' by default) |
| 532 | cfile = file + (__debug__ and "c" or "o") |
| 533 | dfile = file |
| 534 | if prefix: |
| 535 | if file[:len(prefix)] != prefix: |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 536 | raise ValueError("invalid prefix: filename %r doesn't start with %r" |
| 537 | % (file, prefix)) |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 538 | dfile = dfile[len(prefix):] |
| 539 | if base_dir: |
| 540 | dfile = os.path.join(base_dir, dfile) |
| 541 | |
| 542 | cfile_base = os.path.basename(cfile) |
| 543 | if direct: |
| 544 | if force or newer(file, cfile): |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 545 | log.info("byte-compiling %s to %s", file, cfile_base) |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 546 | if not dry_run: |
| 547 | compile(file, cfile, dfile) |
| 548 | else: |
Jeremy Hylton | cd8a114 | 2002-06-04 20:14:43 +0000 | [diff] [blame] | 549 | log.debug("skipping byte-compilation of %s to %s", |
| 550 | file, cfile_base) |
Greg Ward | 1297b5c | 2000-09-30 20:37:56 +0000 | [diff] [blame] | 551 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 552 | # byte_compile () |
Andrew M. Kuchling | df66df0 | 2001-03-22 03:03:41 +0000 | [diff] [blame] | 553 | |
Tarek Ziadé | 3679727 | 2010-07-22 12:50:05 +0000 | [diff] [blame] | 554 | def rfc822_escape (header): |
Andrew M. Kuchling | df66df0 | 2001-03-22 03:03:41 +0000 | [diff] [blame] | 555 | """Return a version of the string escaped for inclusion in an |
Andrew M. Kuchling | 88b0884 | 2001-03-23 17:30:26 +0000 | [diff] [blame] | 556 | RFC-822 header, by ensuring there are 8 spaces space after each newline. |
Andrew M. Kuchling | df66df0 | 2001-03-22 03:03:41 +0000 | [diff] [blame] | 557 | """ |
Tarek Ziadé | df872d4 | 2009-12-06 09:28:17 +0000 | [diff] [blame] | 558 | lines = header.split('\n') |
| 559 | sep = '\n' + 8 * ' ' |
Neal Norwitz | 9d72bb4 | 2007-04-17 08:48:32 +0000 | [diff] [blame] | 560 | return sep.join(lines) |
Martin v. Löwis | 6178db6 | 2008-12-01 04:38:52 +0000 | [diff] [blame] | 561 | |
| 562 | # 2to3 support |
| 563 | |
| 564 | def run_2to3(files, fixer_names=None, options=None, explicit=None): |
| 565 | """Invoke 2to3 on a list of Python files. |
| 566 | The files should all come from the build area, as the |
| 567 | modification is done in-place. To reduce the build time, |
| 568 | only files modified since the last invocation of this |
| 569 | function should be passed in the files argument.""" |
| 570 | |
| 571 | if not files: |
| 572 | return |
| 573 | |
| 574 | # Make this class local, to delay import of 2to3 |
| 575 | from lib2to3.refactor import RefactoringTool, get_fixers_from_package |
| 576 | class DistutilsRefactoringTool(RefactoringTool): |
| 577 | def log_error(self, msg, *args, **kw): |
| 578 | log.error(msg, *args) |
| 579 | |
| 580 | def log_message(self, msg, *args): |
| 581 | log.info(msg, *args) |
| 582 | |
| 583 | def log_debug(self, msg, *args): |
| 584 | log.debug(msg, *args) |
| 585 | |
| 586 | if fixer_names is None: |
| 587 | fixer_names = get_fixers_from_package('lib2to3.fixes') |
| 588 | r = DistutilsRefactoringTool(fixer_names, options=options) |
| 589 | r.refactor(files, write=True) |
| 590 | |
Georg Brandl | 6d4a9cf | 2009-03-31 00:34:54 +0000 | [diff] [blame] | 591 | def copydir_run_2to3(src, dest, template=None, fixer_names=None, |
| 592 | options=None, explicit=None): |
| 593 | """Recursively copy a directory, only copying new and changed files, |
| 594 | running run_2to3 over all newly copied Python modules afterward. |
| 595 | |
| 596 | If you give a template string, it's parsed like a MANIFEST.in. |
| 597 | """ |
| 598 | from distutils.dir_util import mkpath |
| 599 | from distutils.file_util import copy_file |
| 600 | from distutils.filelist import FileList |
| 601 | filelist = FileList() |
| 602 | curdir = os.getcwd() |
| 603 | os.chdir(src) |
| 604 | try: |
| 605 | filelist.findall() |
| 606 | finally: |
| 607 | os.chdir(curdir) |
| 608 | filelist.files[:] = filelist.allfiles |
| 609 | if template: |
| 610 | for line in template.splitlines(): |
| 611 | line = line.strip() |
| 612 | if not line: continue |
| 613 | filelist.process_template_line(line) |
| 614 | copied = [] |
| 615 | for filename in filelist.files: |
| 616 | outname = os.path.join(dest, filename) |
| 617 | mkpath(os.path.dirname(outname)) |
| 618 | res = copy_file(os.path.join(src, filename), outname, update=1) |
| 619 | if res[1]: copied.append(outname) |
| 620 | run_2to3([fn for fn in copied if fn.lower().endswith('.py')], |
| 621 | fixer_names=fixer_names, options=options, explicit=explicit) |
| 622 | return copied |
| 623 | |
Martin v. Löwis | 6178db6 | 2008-12-01 04:38:52 +0000 | [diff] [blame] | 624 | class Mixin2to3: |
| 625 | '''Mixin class for commands that run 2to3. |
| 626 | To configure 2to3, setup scripts may either change |
| 627 | the class variables, or inherit from individual commands |
| 628 | to override how 2to3 is invoked.''' |
| 629 | |
| 630 | # provide list of fixers to run; |
| 631 | # defaults to all from lib2to3.fixers |
| 632 | fixer_names = None |
| 633 | |
| 634 | # options dictionary |
| 635 | options = None |
| 636 | |
| 637 | # list of fixers to invoke even though they are marked as explicit |
| 638 | explicit = None |
| 639 | |
| 640 | def run_2to3(self, files): |
| 641 | return run_2to3(files, self.fixer_names, self.options, self.explicit) |