blob: bce840274dce0f8f1d24dcfb03990ff1932bf064 [file] [log] [blame]
Greg Ward2689e3d1999-03-22 14:52:19 +00001"""distutils.util
2
Greg Wardaebf7062000-04-04 02:05:59 +00003Miscellaneous utility functions -- anything that doesn't fit into
Greg Ward47527692000-09-30 18:49:14 +00004one of the other *util.py modules.
5"""
Greg Ward2689e3d1999-03-22 14:52:19 +00006
Éric Araujo47a45212011-10-08 00:34:13 +02007import os
8import re
9import imp
10import sys
11import string
Greg Ward1297b5c2000-09-30 20:37:56 +000012from distutils.errors import DistutilsPlatformError
13from distutils.dep_util import newer
Tarek Ziadé36797272010-07-22 12:50:05 +000014from distutils.spawn import spawn
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +000015from distutils import log
Tarek Ziadé04fe7c02009-10-25 23:08:47 +000016from distutils.errors import DistutilsByteCompileError
Greg Wardaa458bc2000-04-22 15:14:58 +000017
Tarek Ziadé36797272010-07-22 12:50:05 +000018def get_platform ():
19 """Return a string that identifies the current platform. This is used
20 mainly to distinguish platform-specific build directories and
21 platform-specific built distributions. Typically includes the OS name
22 and version and the architecture (as supplied by 'os.uname()'),
23 although the exact information included depends on the OS; eg. for IRIX
24 the architecture isn't particularly important (IRIX only runs on SGI
25 hardware), but for Linux the kernel version isn't particularly
26 important.
Tarek Ziadé8b441d02010-01-29 11:46:31 +000027
Tarek Ziadé36797272010-07-22 12:50:05 +000028 Examples of returned values:
29 linux-i586
30 linux-alpha (?)
31 solaris-2.6-sun4u
32 irix-5.3
33 irix64-6.2
Tarek Ziadé8b441d02010-01-29 11:46:31 +000034
Tarek Ziadé36797272010-07-22 12:50:05 +000035 Windows will return one of:
36 win-amd64 (64bit Windows on AMD64 (aka x86_64, Intel64, EM64T, etc)
37 win-ia64 (64bit Windows on Itanium)
38 win32 (all others - specifically, sys.platform is returned)
39
40 For other non-POSIX platforms, currently just returns 'sys.platform'.
Tarek Ziadé8b441d02010-01-29 11:46:31 +000041 """
Tarek Ziadé36797272010-07-22 12:50:05 +000042 if os.name == 'nt':
43 # sniff sys.version for architecture.
44 prefix = " bit ("
45 i = sys.version.find(prefix)
46 if i == -1:
47 return sys.platform
48 j = sys.version.find(")", i)
49 look = sys.version[i+len(prefix):j].lower()
50 if look == 'amd64':
51 return 'win-amd64'
52 if look == 'itanium':
53 return 'win-ia64'
54 return sys.platform
Tarek Ziadé8b441d02010-01-29 11:46:31 +000055
Tarek Ziadé36797272010-07-22 12:50:05 +000056 if os.name != "posix" or not hasattr(os, 'uname'):
57 # XXX what about the architecture? NT is Intel or Alpha,
58 # Mac OS is M68k or PPC, etc.
59 return sys.platform
Tarek Ziadé8b441d02010-01-29 11:46:31 +000060
Tarek Ziadé36797272010-07-22 12:50:05 +000061 # Try to distinguish various flavours of Unix
Greg Ward50919292000-03-07 03:27:08 +000062
Tarek Ziadé36797272010-07-22 12:50:05 +000063 (osname, host, release, version, machine) = os.uname()
Greg Ward50919292000-03-07 03:27:08 +000064
Tarek Ziadé36797272010-07-22 12:50:05 +000065 # Convert the OS name to lowercase, remove '/' characters
66 # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh")
67 osname = osname.lower().replace('/', '')
68 machine = machine.replace(' ', '_')
69 machine = machine.replace('/', '-')
70
71 if osname[:5] == "linux":
72 # At least on Linux/Intel, 'machine' is the processor --
73 # i386, etc.
74 # XXX what about Alpha, SPARC, etc?
75 return "%s-%s" % (osname, machine)
76 elif osname[:5] == "sunos":
77 if release[0] >= "5": # SunOS 5 == Solaris 2
78 osname = "solaris"
79 release = "%d.%s" % (int(release[0]) - 3, release[2:])
Jesus Cea6e35d412012-01-18 04:27:37 +010080 # We can't use "platform.architecture()[0]" because a
81 # bootstrap problem. We use a dict to get an error
82 # if some suspicious happens.
83 bitness = {2147483647:"32bit", 9223372036854775807:"64bit"}
Jesus Cea031605a2012-01-18 05:04:49 +010084 machine += ".%s" % bitness[sys.maxsize]
Tarek Ziadé36797272010-07-22 12:50:05 +000085 # fall through to standard osname-release-machine representation
86 elif osname[:4] == "irix": # could be "irix64"!
87 return "%s-%s" % (osname, release)
88 elif osname[:3] == "aix":
89 return "%s-%s.%s" % (osname, version, release)
90 elif osname[:6] == "cygwin":
91 osname = "cygwin"
92 rel_re = re.compile (r'[\d.]+', re.ASCII)
93 m = rel_re.match(release)
94 if m:
95 release = m.group()
96 elif osname[:6] == "darwin":
97 #
98 # For our purposes, we'll assume that the system version from
99 # distutils' perspective is what MACOSX_DEPLOYMENT_TARGET is set
100 # to. This makes the compatibility story a bit more sane because the
101 # machine is going to compile and link as if it were
102 # MACOSX_DEPLOYMENT_TARGET.
103 from distutils.sysconfig import get_config_vars
104 cfgvars = get_config_vars()
105
Ronald Oussoren222e89a2011-05-15 16:46:11 +0200106 macver = cfgvars.get('MACOSX_DEPLOYMENT_TARGET')
Tarek Ziadé36797272010-07-22 12:50:05 +0000107
108 if 1:
109 # Always calculate the release of the running machine,
110 # needed to determine if we can build fat binaries or not.
111
112 macrelease = macver
113 # Get the system version. Reading this plist is a documented
114 # way to get the system version (see the documentation for
115 # the Gestalt Manager)
116 try:
117 f = open('/System/Library/CoreServices/SystemVersion.plist')
118 except IOError:
119 # We're on a plain darwin box, fall back to the default
120 # behaviour.
121 pass
122 else:
Éric Araujobee5cef2010-11-05 23:51:56 +0000123 try:
124 m = re.search(
125 r'<key>ProductUserVisibleVersion</key>\s*' +
126 r'<string>(.*?)</string>', f.read())
127 if m is not None:
128 macrelease = '.'.join(m.group(1).split('.')[:2])
129 # else: fall back to the default behaviour
130 finally:
131 f.close()
Tarek Ziadé36797272010-07-22 12:50:05 +0000132
133 if not macver:
134 macver = macrelease
135
136 if macver:
137 from distutils.sysconfig import get_config_vars
138 release = macver
139 osname = "macosx"
140
141 if (macrelease + '.') >= '10.4.' and \
142 '-arch' in get_config_vars().get('CFLAGS', '').strip():
143 # The universal build will build fat binaries, but not on
144 # systems before 10.4
145 #
146 # Try to detect 4-way universal builds, those have machine-type
147 # 'universal' instead of 'fat'.
148
149 machine = 'fat'
150 cflags = get_config_vars().get('CFLAGS')
151
152 archs = re.findall('-arch\s+(\S+)', cflags)
153 archs = tuple(sorted(set(archs)))
154
155 if len(archs) == 1:
156 machine = archs[0]
157 elif archs == ('i386', 'ppc'):
158 machine = 'fat'
159 elif archs == ('i386', 'x86_64'):
160 machine = 'intel'
161 elif archs == ('i386', 'ppc', 'x86_64'):
162 machine = 'fat3'
163 elif archs == ('ppc64', 'x86_64'):
164 machine = 'fat64'
165 elif archs == ('i386', 'ppc', 'ppc64', 'x86_64'):
166 machine = 'universal'
167 else:
168 raise ValueError(
169 "Don't know machine value for archs=%r"%(archs,))
170
171 elif machine == 'i386':
172 # On OSX the machine type returned by uname is always the
173 # 32-bit variant, even if the executable architecture is
174 # the 64-bit variant
175 if sys.maxsize >= 2**32:
176 machine = 'x86_64'
177
178 elif machine in ('PowerPC', 'Power_Macintosh'):
179 # Pick a sane name for the PPC architecture.
180 machine = 'ppc'
181
182 # See 'i386' case
183 if sys.maxsize >= 2**32:
184 machine = 'ppc64'
185
186 return "%s-%s-%s" % (osname, release, machine)
187
188# get_platform ()
189
190
191def convert_path (pathname):
192 """Return 'pathname' as a name that will work on the native filesystem,
Greg Wardb8b263b2000-09-30 18:40:42 +0000193 i.e. split it on '/' and put it back together again using the current
194 directory separator. Needed because filenames in the setup script are
195 always supplied in Unix style, and have to be converted to the local
196 convention before we can actually use them in the filesystem. Raises
Greg Ward47527692000-09-30 18:49:14 +0000197 ValueError on non-Unix-ish systems if 'pathname' either starts or
198 ends with a slash.
Greg Wardb8b263b2000-09-30 18:40:42 +0000199 """
Greg Ward7ec05352000-09-22 01:05:43 +0000200 if os.sep == '/':
201 return pathname
Neal Norwitzb0df6a12002-08-13 17:42:57 +0000202 if not pathname:
203 return pathname
204 if pathname[0] == '/':
Collin Winter5b7e9d72007-08-30 03:52:21 +0000205 raise ValueError("path '%s' cannot be absolute" % pathname)
Neal Norwitzb0df6a12002-08-13 17:42:57 +0000206 if pathname[-1] == '/':
Collin Winter5b7e9d72007-08-30 03:52:21 +0000207 raise ValueError("path '%s' cannot end with '/'" % pathname)
Greg Ward7ec05352000-09-22 01:05:43 +0000208
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000209 paths = pathname.split('/')
Jack Jansenb4cd5c12001-01-28 12:23:32 +0000210 while '.' in paths:
211 paths.remove('.')
212 if not paths:
213 return os.curdir
Neal Norwitzd9108552006-03-17 08:00:19 +0000214 return os.path.join(*paths)
Greg Ward50919292000-03-07 03:27:08 +0000215
Tarek Ziadé36797272010-07-22 12:50:05 +0000216# convert_path ()
Greg Ward1b4ede52000-03-22 00:22:44 +0000217
218
Tarek Ziadé36797272010-07-22 12:50:05 +0000219def change_root (new_root, pathname):
220 """Return 'pathname' with 'new_root' prepended. If 'pathname' is
221 relative, this is equivalent to "os.path.join(new_root,pathname)".
Greg Ward67f75d42000-04-27 01:53:46 +0000222 Otherwise, it requires making 'pathname' relative and then joining the
Greg Ward4b46ef92000-05-31 02:14:32 +0000223 two, which is tricky on DOS/Windows and Mac OS.
224 """
225 if os.name == 'posix':
Greg Wardbe86bde2000-09-26 01:56:15 +0000226 if not os.path.isabs(pathname):
227 return os.path.join(new_root, pathname)
Greg Ward4b46ef92000-05-31 02:14:32 +0000228 else:
Greg Wardbe86bde2000-09-26 01:56:15 +0000229 return os.path.join(new_root, pathname[1:])
Greg Ward67f75d42000-04-27 01:53:46 +0000230
231 elif os.name == 'nt':
Greg Wardbe86bde2000-09-26 01:56:15 +0000232 (drive, path) = os.path.splitdrive(pathname)
Greg Ward4b46ef92000-05-31 02:14:32 +0000233 if path[0] == '\\':
234 path = path[1:]
Greg Wardbe86bde2000-09-26 01:56:15 +0000235 return os.path.join(new_root, path)
Greg Ward67f75d42000-04-27 01:53:46 +0000236
Marc-André Lemburg2544f512002-01-31 18:56:00 +0000237 elif os.name == 'os2':
238 (drive, path) = os.path.splitdrive(pathname)
239 if path[0] == os.sep:
240 path = path[1:]
241 return os.path.join(new_root, path)
242
Greg Ward67f75d42000-04-27 01:53:46 +0000243 else:
Tarek Ziadé36797272010-07-22 12:50:05 +0000244 raise DistutilsPlatformError("nothing known about platform '%s'" % os.name)
245
Greg Ward67f75d42000-04-27 01:53:46 +0000246
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000247_environ_checked = 0
Tarek Ziadé36797272010-07-22 12:50:05 +0000248def check_environ ():
249 """Ensure that 'os.environ' has all the environment variables we
250 guarantee that users can use in config files, command-line options,
Greg Wardb8b263b2000-09-30 18:40:42 +0000251 etc. Currently this includes:
252 HOME - user's home directory (Unix only)
253 PLAT - description of the current platform, including hardware
254 and OS (see 'get_platform()')
Greg Ward1b4ede52000-03-22 00:22:44 +0000255 """
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000256 global _environ_checked
257 if _environ_checked:
258 return
259
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000260 if os.name == 'posix' and 'HOME' not in os.environ:
Greg Ward1b4ede52000-03-22 00:22:44 +0000261 import pwd
Greg Wardbe86bde2000-09-26 01:56:15 +0000262 os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
Greg Ward1b4ede52000-03-22 00:22:44 +0000263
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000264 if 'PLAT' not in os.environ:
Tarek Ziadé36797272010-07-22 12:50:05 +0000265 os.environ['PLAT'] = get_platform()
Greg Ward1b4ede52000-03-22 00:22:44 +0000266
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000267 _environ_checked = 1
268
Greg Ward1b4ede52000-03-22 00:22:44 +0000269
Tarek Ziadé36797272010-07-22 12:50:05 +0000270def subst_vars (s, local_vars):
271 """Perform shell/Perl-style variable substitution on 'string'. Every
272 occurrence of '$' followed by a name is considered a variable, and
Greg Ward47527692000-09-30 18:49:14 +0000273 variable is substituted by the value found in the 'local_vars'
274 dictionary, or in 'os.environ' if it's not in 'local_vars'.
275 'os.environ' is first checked/augmented to guarantee that it contains
276 certain values: see 'check_environ()'. Raise ValueError for any
277 variables not found in either 'local_vars' or 'os.environ'.
Greg Wardb8b263b2000-09-30 18:40:42 +0000278 """
Greg Wardbe86bde2000-09-26 01:56:15 +0000279 check_environ()
Greg Ward1b4ede52000-03-22 00:22:44 +0000280 def _subst (match, local_vars=local_vars):
281 var_name = match.group(1)
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000282 if var_name in local_vars:
Greg Wardbe86bde2000-09-26 01:56:15 +0000283 return str(local_vars[var_name])
Greg Ward1b4ede52000-03-22 00:22:44 +0000284 else:
285 return os.environ[var_name]
286
Greg Ward47527692000-09-30 18:49:14 +0000287 try:
Jeremy Hylton5e2d0762001-01-25 20:10:32 +0000288 return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
Guido van Rossumb940e112007-01-10 16:19:56 +0000289 except KeyError as var:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000290 raise ValueError("invalid variable '$%s'" % var)
Greg Ward1b4ede52000-03-22 00:22:44 +0000291
Tarek Ziadé36797272010-07-22 12:50:05 +0000292# subst_vars ()
Greg Ward7c1a6d42000-03-29 02:48:40 +0000293
Tarek Ziadé36797272010-07-22 12:50:05 +0000294
295def grok_environment_error (exc, prefix="error: "):
296 """Generate a useful error message from an EnvironmentError (IOError or
297 OSError) exception object. Handles Python 1.5.1 and 1.5.2 styles, and
Greg Warde9055132000-06-17 02:16:46 +0000298 does what it can to deal with exception objects that don't have a
299 filename (which happens when the error is due to a two-file operation,
300 such as 'rename()' or 'link()'. Returns the error message as a string
301 prefixed with 'prefix'.
302 """
303 # check for Python 1.5.2-style {IO,OS}Error exception objects
Greg Wardbe86bde2000-09-26 01:56:15 +0000304 if hasattr(exc, 'filename') and hasattr(exc, 'strerror'):
Greg Warde9055132000-06-17 02:16:46 +0000305 if exc.filename:
306 error = prefix + "%s: %s" % (exc.filename, exc.strerror)
307 else:
308 # two-argument functions in posix module don't
309 # include the filename in the exception object!
310 error = prefix + "%s" % exc.strerror
311 else:
Georg Brandl5dfe0de2008-01-06 21:41:49 +0000312 error = prefix + str(exc.args[-1])
Greg Warde9055132000-06-17 02:16:46 +0000313
314 return error
Greg Ward6a2a3db2000-06-24 20:40:02 +0000315
Tarek Ziadé36797272010-07-22 12:50:05 +0000316
Greg Ward6a2a3db2000-06-24 20:40:02 +0000317# Needed by 'split_quoted()'
Martin v. Löwis1c0f1f92004-03-25 14:58:19 +0000318_wordchars_re = _squote_re = _dquote_re = None
319def _init_regex():
320 global _wordchars_re, _squote_re, _dquote_re
321 _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
322 _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
323 _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')
Greg Ward6a2a3db2000-06-24 20:40:02 +0000324
Tarek Ziadé36797272010-07-22 12:50:05 +0000325def split_quoted (s):
Greg Ward6a2a3db2000-06-24 20:40:02 +0000326 """Split a string up according to Unix shell-like rules for quotes and
Tarek Ziadé36797272010-07-22 12:50:05 +0000327 backslashes. In short: words are delimited by spaces, as long as those
Greg Ward6a2a3db2000-06-24 20:40:02 +0000328 spaces are not escaped by a backslash, or inside a quoted string.
329 Single and double quotes are equivalent, and the quote characters can
330 be backslash-escaped. The backslash is stripped from any two-character
331 escape sequence, leaving only the escaped character. The quote
332 characters are stripped from any quoted string. Returns a list of
333 words.
334 """
Tarek Ziadé36797272010-07-22 12:50:05 +0000335
Greg Ward6a2a3db2000-06-24 20:40:02 +0000336 # This is a nice algorithm for splitting up a single string, since it
337 # doesn't require character-by-character examination. It was a little
338 # bit of a brain-bender to get it working right, though...
Martin v. Löwis1c0f1f92004-03-25 14:58:19 +0000339 if _wordchars_re is None: _init_regex()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000340
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000341 s = s.strip()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000342 words = []
343 pos = 0
344
345 while s:
346 m = _wordchars_re.match(s, pos)
347 end = m.end()
348 if end == len(s):
349 words.append(s[:end])
350 break
351
Greg Ward2b042de2000-08-08 14:38:13 +0000352 if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
Greg Ward6a2a3db2000-06-24 20:40:02 +0000353 words.append(s[:end]) # we definitely have a word delimiter
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000354 s = s[end:].lstrip()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000355 pos = 0
356
357 elif s[end] == '\\': # preserve whatever is being escaped;
358 # will become part of the current word
359 s = s[:end] + s[end+1:]
360 pos = end+1
361
362 else:
363 if s[end] == "'": # slurp singly-quoted string
364 m = _squote_re.match(s, end)
365 elif s[end] == '"': # slurp doubly-quoted string
366 m = _dquote_re.match(s, end)
367 else:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000368 raise RuntimeError("this can't happen (bad char '%c')" % s[end])
Greg Ward6a2a3db2000-06-24 20:40:02 +0000369
370 if m is None:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000371 raise ValueError("bad string (mismatched %s quotes?)" % s[end])
Greg Ward6a2a3db2000-06-24 20:40:02 +0000372
373 (beg, end) = m.span()
374 s = s[:beg] + s[beg+1:end-1] + s[end:]
375 pos = m.end() - 2
376
377 if pos >= len(s):
378 words.append(s)
379 break
380
381 return words
382
Tarek Ziadé36797272010-07-22 12:50:05 +0000383# split_quoted ()
Greg Ward1c16ac32000-08-02 01:37:30 +0000384
385
Tarek Ziadé36797272010-07-22 12:50:05 +0000386def execute (func, args, msg=None, verbose=0, dry_run=0):
387 """Perform some action that affects the outside world (eg. by
388 writing to the filesystem). Such actions are special because they
389 are disabled by the 'dry_run' flag. This method takes care of all
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000390 that bureaucracy for you; all you have to do is supply the
391 function to call and an argument tuple for it (to embody the
392 "external action" being performed), and an optional message to
393 print.
Greg Ward1c16ac32000-08-02 01:37:30 +0000394 """
Greg Ward1c16ac32000-08-02 01:37:30 +0000395 if msg is None:
Walter Dörwald70a6b492004-02-12 17:35:32 +0000396 msg = "%s%r" % (func.__name__, args)
Fred Drakeb94b8492001-12-06 20:51:35 +0000397 if msg[-2:] == ',)': # correct for singleton tuple
Greg Ward1c16ac32000-08-02 01:37:30 +0000398 msg = msg[0:-2] + ')'
399
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000400 log.info(msg)
Greg Ward1c16ac32000-08-02 01:37:30 +0000401 if not dry_run:
Neal Norwitzd9108552006-03-17 08:00:19 +0000402 func(*args)
Greg Ward1c16ac32000-08-02 01:37:30 +0000403
Greg Ward817dc092000-09-25 01:25:06 +0000404
Tarek Ziadé36797272010-07-22 12:50:05 +0000405def strtobool (val):
Greg Ward817dc092000-09-25 01:25:06 +0000406 """Convert a string representation of truth to true (1) or false (0).
Tim Peters182b5ac2004-07-18 06:16:08 +0000407
Greg Ward817dc092000-09-25 01:25:06 +0000408 True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
409 are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if
410 'val' is anything else.
411 """
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000412 val = val.lower()
Greg Ward817dc092000-09-25 01:25:06 +0000413 if val in ('y', 'yes', 't', 'true', 'on', '1'):
414 return 1
415 elif val in ('n', 'no', 'f', 'false', 'off', '0'):
416 return 0
417 else:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000418 raise ValueError("invalid truth value %r" % (val,))
Greg Ward1297b5c2000-09-30 20:37:56 +0000419
420
Tarek Ziadé36797272010-07-22 12:50:05 +0000421def byte_compile (py_files,
422 optimize=0, force=0,
423 prefix=None, base_dir=None,
424 verbose=1, dry_run=0,
425 direct=None):
Greg Wardf217e212000-10-01 23:49:30 +0000426 """Byte-compile a collection of Python source files to either .pyc
Éric Araujo04ea9532011-10-08 03:02:37 +0200427 or .pyo files in a __pycache__ subdirectory. 'py_files' is a list
428 of files to compile; any files that don't end in ".py" are silently
429 skipped. 'optimize' must be one of the following:
Greg Ward1297b5c2000-09-30 20:37:56 +0000430 0 - don't optimize (generate .pyc)
431 1 - normal optimization (like "python -O")
432 2 - extra optimization (like "python -OO")
433 If 'force' is true, all files are recompiled regardless of
434 timestamps.
435
436 The source filename encoded in each bytecode file defaults to the
437 filenames listed in 'py_files'; you can modify these with 'prefix' and
438 'basedir'. 'prefix' is a string that will be stripped off of each
439 source filename, and 'base_dir' is a directory name that will be
440 prepended (after 'prefix' is stripped). You can supply either or both
441 (or neither) of 'prefix' and 'base_dir', as you wish.
442
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000443 If 'dry_run' is true, doesn't actually do anything that would
444 affect the filesystem.
Greg Ward1297b5c2000-09-30 20:37:56 +0000445
446 Byte-compilation is either done directly in this interpreter process
447 with the standard py_compile module, or indirectly by writing a
448 temporary script and executing it. Normally, you should let
449 'byte_compile()' figure out to use direct compilation or not (see
450 the source for details). The 'direct' flag is used by the script
451 generated in indirect mode; unless you know what you're doing, leave
452 it set to None.
453 """
Tarek Ziadé04fe7c02009-10-25 23:08:47 +0000454 # nothing is done if sys.dont_write_bytecode is True
455 if sys.dont_write_bytecode:
456 raise DistutilsByteCompileError('byte-compiling is disabled.')
457
Greg Ward1297b5c2000-09-30 20:37:56 +0000458 # First, if the caller didn't force us into direct or indirect mode,
459 # figure out which mode we should be in. We take a conservative
460 # approach: choose direct mode *only* if the current interpreter is
461 # in debug mode and optimize is 0. If we're not in debug mode (-O
462 # or -OO), we don't know which level of optimization this
463 # interpreter is running with, so we can't do direct
464 # byte-compilation and be certain that it's the right thing. Thus,
465 # always compile indirectly if the current interpreter is in either
466 # optimize mode, or if either optimization level was requested by
467 # the caller.
468 if direct is None:
469 direct = (__debug__ and optimize == 0)
470
471 # "Indirect" byte-compilation: write a temporary script and then
472 # run it with the appropriate flags.
473 if not direct:
Marc-André Lemburg03750792002-12-03 08:45:11 +0000474 try:
475 from tempfile import mkstemp
476 (script_fd, script_name) = mkstemp(".py")
477 except ImportError:
478 from tempfile import mktemp
479 (script_fd, script_name) = None, mktemp(".py")
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000480 log.info("writing byte-compilation script '%s'", script_name)
Greg Ward1297b5c2000-09-30 20:37:56 +0000481 if not dry_run:
Marc-André Lemburg03750792002-12-03 08:45:11 +0000482 if script_fd is not None:
483 script = os.fdopen(script_fd, "w")
484 else:
485 script = open(script_name, "w")
Greg Ward1297b5c2000-09-30 20:37:56 +0000486
487 script.write("""\
488from distutils.util import byte_compile
489files = [
490""")
Greg Ward9216cfe2000-10-03 03:31:05 +0000491
492 # XXX would be nice to write absolute filenames, just for
493 # safety's sake (script should be more robust in the face of
494 # chdir'ing before running it). But this requires abspath'ing
495 # 'prefix' as well, and that breaks the hack in build_lib's
496 # 'byte_compile()' method that carefully tacks on a trailing
497 # slash (os.sep really) to make sure the prefix here is "just
498 # right". This whole prefix business is rather delicate -- the
499 # problem is that it's really a directory, but I'm treating it
500 # as a dumb string, so trailing slashes and so forth matter.
501
502 #py_files = map(os.path.abspath, py_files)
503 #if prefix:
504 # prefix = os.path.abspath(prefix)
505
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000506 script.write(",\n".join(map(repr, py_files)) + "]\n")
Greg Ward1297b5c2000-09-30 20:37:56 +0000507 script.write("""
Walter Dörwald70a6b492004-02-12 17:35:32 +0000508byte_compile(files, optimize=%r, force=%r,
509 prefix=%r, base_dir=%r,
510 verbose=%r, dry_run=0,
Greg Ward1297b5c2000-09-30 20:37:56 +0000511 direct=1)
Walter Dörwald70a6b492004-02-12 17:35:32 +0000512""" % (optimize, force, prefix, base_dir, verbose))
Greg Ward1297b5c2000-09-30 20:37:56 +0000513
514 script.close()
515
516 cmd = [sys.executable, script_name]
517 if optimize == 1:
518 cmd.insert(1, "-O")
519 elif optimize == 2:
520 cmd.insert(1, "-OO")
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000521 spawn(cmd, dry_run=dry_run)
Greg Ward9216cfe2000-10-03 03:31:05 +0000522 execute(os.remove, (script_name,), "removing %s" % script_name,
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000523 dry_run=dry_run)
Fred Drakeb94b8492001-12-06 20:51:35 +0000524
Greg Ward1297b5c2000-09-30 20:37:56 +0000525 # "Direct" byte-compilation: use the py_compile module to compile
526 # right here, right now. Note that the script generated in indirect
527 # mode simply calls 'byte_compile()' in direct mode, a weird sort of
528 # cross-process recursion. Hey, it works!
529 else:
530 from py_compile import compile
531
532 for file in py_files:
533 if file[-3:] != ".py":
Greg Wardf217e212000-10-01 23:49:30 +0000534 # This lets us be lazy and not filter filenames in
535 # the "install_lib" command.
536 continue
Greg Ward1297b5c2000-09-30 20:37:56 +0000537
538 # Terminology from the py_compile module:
539 # cfile - byte-compiled file
540 # dfile - purported source filename (same as 'file' by default)
Éric Araujo47a45212011-10-08 00:34:13 +0200541 if optimize >= 0:
542 cfile = imp.cache_from_source(file, debug_override=not optimize)
543 else:
544 cfile = imp.cache_from_source(file)
Greg Ward1297b5c2000-09-30 20:37:56 +0000545 dfile = file
546 if prefix:
547 if file[:len(prefix)] != prefix:
Tarek Ziadé36797272010-07-22 12:50:05 +0000548 raise ValueError("invalid prefix: filename %r doesn't start with %r"
549 % (file, prefix))
Greg Ward1297b5c2000-09-30 20:37:56 +0000550 dfile = dfile[len(prefix):]
551 if base_dir:
552 dfile = os.path.join(base_dir, dfile)
553
554 cfile_base = os.path.basename(cfile)
555 if direct:
556 if force or newer(file, cfile):
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000557 log.info("byte-compiling %s to %s", file, cfile_base)
Greg Ward1297b5c2000-09-30 20:37:56 +0000558 if not dry_run:
559 compile(file, cfile, dfile)
560 else:
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000561 log.debug("skipping byte-compilation of %s to %s",
562 file, cfile_base)
Greg Ward1297b5c2000-09-30 20:37:56 +0000563
Tarek Ziadé36797272010-07-22 12:50:05 +0000564# byte_compile ()
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000565
Tarek Ziadé36797272010-07-22 12:50:05 +0000566def rfc822_escape (header):
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000567 """Return a version of the string escaped for inclusion in an
Andrew M. Kuchling88b08842001-03-23 17:30:26 +0000568 RFC-822 header, by ensuring there are 8 spaces space after each newline.
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000569 """
Tarek Ziadédf872d42009-12-06 09:28:17 +0000570 lines = header.split('\n')
571 sep = '\n' + 8 * ' '
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000572 return sep.join(lines)
Martin v. Löwis6178db62008-12-01 04:38:52 +0000573
574# 2to3 support
575
576def run_2to3(files, fixer_names=None, options=None, explicit=None):
577 """Invoke 2to3 on a list of Python files.
578 The files should all come from the build area, as the
579 modification is done in-place. To reduce the build time,
580 only files modified since the last invocation of this
581 function should be passed in the files argument."""
582
583 if not files:
584 return
585
586 # Make this class local, to delay import of 2to3
587 from lib2to3.refactor import RefactoringTool, get_fixers_from_package
588 class DistutilsRefactoringTool(RefactoringTool):
589 def log_error(self, msg, *args, **kw):
590 log.error(msg, *args)
591
592 def log_message(self, msg, *args):
593 log.info(msg, *args)
594
595 def log_debug(self, msg, *args):
596 log.debug(msg, *args)
597
598 if fixer_names is None:
599 fixer_names = get_fixers_from_package('lib2to3.fixes')
600 r = DistutilsRefactoringTool(fixer_names, options=options)
601 r.refactor(files, write=True)
602
Georg Brandl6d4a9cf2009-03-31 00:34:54 +0000603def copydir_run_2to3(src, dest, template=None, fixer_names=None,
604 options=None, explicit=None):
605 """Recursively copy a directory, only copying new and changed files,
606 running run_2to3 over all newly copied Python modules afterward.
607
608 If you give a template string, it's parsed like a MANIFEST.in.
609 """
610 from distutils.dir_util import mkpath
611 from distutils.file_util import copy_file
612 from distutils.filelist import FileList
613 filelist = FileList()
614 curdir = os.getcwd()
615 os.chdir(src)
616 try:
617 filelist.findall()
618 finally:
619 os.chdir(curdir)
620 filelist.files[:] = filelist.allfiles
621 if template:
622 for line in template.splitlines():
623 line = line.strip()
624 if not line: continue
625 filelist.process_template_line(line)
626 copied = []
627 for filename in filelist.files:
628 outname = os.path.join(dest, filename)
629 mkpath(os.path.dirname(outname))
630 res = copy_file(os.path.join(src, filename), outname, update=1)
631 if res[1]: copied.append(outname)
632 run_2to3([fn for fn in copied if fn.lower().endswith('.py')],
633 fixer_names=fixer_names, options=options, explicit=explicit)
634 return copied
635
Martin v. Löwis6178db62008-12-01 04:38:52 +0000636class Mixin2to3:
637 '''Mixin class for commands that run 2to3.
638 To configure 2to3, setup scripts may either change
639 the class variables, or inherit from individual commands
640 to override how 2to3 is invoked.'''
641
642 # provide list of fixers to run;
643 # defaults to all from lib2to3.fixers
644 fixer_names = None
645
646 # options dictionary
647 options = None
648
649 # list of fixers to invoke even though they are marked as explicit
650 explicit = None
651
652 def run_2to3(self, files):
653 return run_2to3(files, self.fixer_names, self.options, self.explicit)