blob: 8175434586df387bef70022e489abb7c83c630bd [file] [log] [blame]
Greg Ward2689e3d1999-03-22 14:52:19 +00001"""distutils.util
2
Greg Wardaebf7062000-04-04 02:05:59 +00003Miscellaneous utility functions -- anything that doesn't fit into
Greg Ward47527692000-09-30 18:49:14 +00004one of the other *util.py modules.
5"""
Greg Ward2689e3d1999-03-22 14:52:19 +00006
Greg Ward3ce77fd2000-03-02 01:49:45 +00007__revision__ = "$Id$"
Greg Ward2689e3d1999-03-22 14:52:19 +00008
Greg Ward1297b5c2000-09-30 20:37:56 +00009import sys, os, string, re
10from distutils.errors import DistutilsPlatformError
11from distutils.dep_util import newer
Tarek Ziadé36797272010-07-22 12:50:05 +000012from distutils.spawn import spawn
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +000013from distutils import log
Tarek Ziadé04fe7c02009-10-25 23:08:47 +000014from distutils.errors import DistutilsByteCompileError
Greg Wardaa458bc2000-04-22 15:14:58 +000015
Tarek Ziadé36797272010-07-22 12:50:05 +000016def get_platform ():
17 """Return a string that identifies the current platform. This is used
18 mainly to distinguish platform-specific build directories and
19 platform-specific built distributions. Typically includes the OS name
20 and version and the architecture (as supplied by 'os.uname()'),
21 although the exact information included depends on the OS; eg. for IRIX
22 the architecture isn't particularly important (IRIX only runs on SGI
23 hardware), but for Linux the kernel version isn't particularly
24 important.
Tarek Ziadé8b441d02010-01-29 11:46:31 +000025
Tarek Ziadé36797272010-07-22 12:50:05 +000026 Examples of returned values:
27 linux-i586
28 linux-alpha (?)
29 solaris-2.6-sun4u
30 irix-5.3
31 irix64-6.2
Tarek Ziadé8b441d02010-01-29 11:46:31 +000032
Tarek Ziadé36797272010-07-22 12:50:05 +000033 Windows will return one of:
34 win-amd64 (64bit Windows on AMD64 (aka x86_64, Intel64, EM64T, etc)
35 win-ia64 (64bit Windows on Itanium)
36 win32 (all others - specifically, sys.platform is returned)
37
38 For other non-POSIX platforms, currently just returns 'sys.platform'.
Tarek Ziadé8b441d02010-01-29 11:46:31 +000039 """
Tarek Ziadé36797272010-07-22 12:50:05 +000040 if os.name == 'nt':
41 # sniff sys.version for architecture.
42 prefix = " bit ("
43 i = sys.version.find(prefix)
44 if i == -1:
45 return sys.platform
46 j = sys.version.find(")", i)
47 look = sys.version[i+len(prefix):j].lower()
48 if look == 'amd64':
49 return 'win-amd64'
50 if look == 'itanium':
51 return 'win-ia64'
52 return sys.platform
Tarek Ziadé8b441d02010-01-29 11:46:31 +000053
Tarek Ziadé36797272010-07-22 12:50:05 +000054 if os.name != "posix" or not hasattr(os, 'uname'):
55 # XXX what about the architecture? NT is Intel or Alpha,
56 # Mac OS is M68k or PPC, etc.
57 return sys.platform
Tarek Ziadé8b441d02010-01-29 11:46:31 +000058
Tarek Ziadé36797272010-07-22 12:50:05 +000059 # Try to distinguish various flavours of Unix
Greg Ward50919292000-03-07 03:27:08 +000060
Tarek Ziadé36797272010-07-22 12:50:05 +000061 (osname, host, release, version, machine) = os.uname()
Greg Ward50919292000-03-07 03:27:08 +000062
Tarek Ziadé36797272010-07-22 12:50:05 +000063 # Convert the OS name to lowercase, remove '/' characters
64 # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh")
65 osname = osname.lower().replace('/', '')
66 machine = machine.replace(' ', '_')
67 machine = machine.replace('/', '-')
68
69 if osname[:5] == "linux":
70 # At least on Linux/Intel, 'machine' is the processor --
71 # i386, etc.
72 # XXX what about Alpha, SPARC, etc?
73 return "%s-%s" % (osname, machine)
74 elif osname[:5] == "sunos":
75 if release[0] >= "5": # SunOS 5 == Solaris 2
76 osname = "solaris"
77 release = "%d.%s" % (int(release[0]) - 3, release[2:])
78 # fall through to standard osname-release-machine representation
79 elif osname[:4] == "irix": # could be "irix64"!
80 return "%s-%s" % (osname, release)
81 elif osname[:3] == "aix":
82 return "%s-%s.%s" % (osname, version, release)
83 elif osname[:6] == "cygwin":
84 osname = "cygwin"
85 rel_re = re.compile (r'[\d.]+', re.ASCII)
86 m = rel_re.match(release)
87 if m:
88 release = m.group()
89 elif osname[:6] == "darwin":
90 #
91 # For our purposes, we'll assume that the system version from
92 # distutils' perspective is what MACOSX_DEPLOYMENT_TARGET is set
93 # to. This makes the compatibility story a bit more sane because the
94 # machine is going to compile and link as if it were
95 # MACOSX_DEPLOYMENT_TARGET.
96 from distutils.sysconfig import get_config_vars
97 cfgvars = get_config_vars()
98
99 macver = os.environ.get('MACOSX_DEPLOYMENT_TARGET')
100 if not macver:
101 macver = cfgvars.get('MACOSX_DEPLOYMENT_TARGET')
102
103 if 1:
104 # Always calculate the release of the running machine,
105 # needed to determine if we can build fat binaries or not.
106
107 macrelease = macver
108 # Get the system version. Reading this plist is a documented
109 # way to get the system version (see the documentation for
110 # the Gestalt Manager)
111 try:
112 f = open('/System/Library/CoreServices/SystemVersion.plist')
113 except IOError:
114 # We're on a plain darwin box, fall back to the default
115 # behaviour.
116 pass
117 else:
118 m = re.search(
119 r'<key>ProductUserVisibleVersion</key>\s*' +
120 r'<string>(.*?)</string>', f.read())
121 f.close()
122 if m is not None:
123 macrelease = '.'.join(m.group(1).split('.')[:2])
124 # else: fall back to the default behaviour
125
126 if not macver:
127 macver = macrelease
128
129 if macver:
130 from distutils.sysconfig import get_config_vars
131 release = macver
132 osname = "macosx"
133
134 if (macrelease + '.') >= '10.4.' and \
135 '-arch' in get_config_vars().get('CFLAGS', '').strip():
136 # The universal build will build fat binaries, but not on
137 # systems before 10.4
138 #
139 # Try to detect 4-way universal builds, those have machine-type
140 # 'universal' instead of 'fat'.
141
142 machine = 'fat'
143 cflags = get_config_vars().get('CFLAGS')
144
145 archs = re.findall('-arch\s+(\S+)', cflags)
146 archs = tuple(sorted(set(archs)))
147
148 if len(archs) == 1:
149 machine = archs[0]
150 elif archs == ('i386', 'ppc'):
151 machine = 'fat'
152 elif archs == ('i386', 'x86_64'):
153 machine = 'intel'
154 elif archs == ('i386', 'ppc', 'x86_64'):
155 machine = 'fat3'
156 elif archs == ('ppc64', 'x86_64'):
157 machine = 'fat64'
158 elif archs == ('i386', 'ppc', 'ppc64', 'x86_64'):
159 machine = 'universal'
160 else:
161 raise ValueError(
162 "Don't know machine value for archs=%r"%(archs,))
163
164 elif machine == 'i386':
165 # On OSX the machine type returned by uname is always the
166 # 32-bit variant, even if the executable architecture is
167 # the 64-bit variant
168 if sys.maxsize >= 2**32:
169 machine = 'x86_64'
170
171 elif machine in ('PowerPC', 'Power_Macintosh'):
172 # Pick a sane name for the PPC architecture.
173 machine = 'ppc'
174
175 # See 'i386' case
176 if sys.maxsize >= 2**32:
177 machine = 'ppc64'
178
179 return "%s-%s-%s" % (osname, release, machine)
180
181# get_platform ()
182
183
184def convert_path (pathname):
185 """Return 'pathname' as a name that will work on the native filesystem,
Greg Wardb8b263b2000-09-30 18:40:42 +0000186 i.e. split it on '/' and put it back together again using the current
187 directory separator. Needed because filenames in the setup script are
188 always supplied in Unix style, and have to be converted to the local
189 convention before we can actually use them in the filesystem. Raises
Greg Ward47527692000-09-30 18:49:14 +0000190 ValueError on non-Unix-ish systems if 'pathname' either starts or
191 ends with a slash.
Greg Wardb8b263b2000-09-30 18:40:42 +0000192 """
Greg Ward7ec05352000-09-22 01:05:43 +0000193 if os.sep == '/':
194 return pathname
Neal Norwitzb0df6a12002-08-13 17:42:57 +0000195 if not pathname:
196 return pathname
197 if pathname[0] == '/':
Collin Winter5b7e9d72007-08-30 03:52:21 +0000198 raise ValueError("path '%s' cannot be absolute" % pathname)
Neal Norwitzb0df6a12002-08-13 17:42:57 +0000199 if pathname[-1] == '/':
Collin Winter5b7e9d72007-08-30 03:52:21 +0000200 raise ValueError("path '%s' cannot end with '/'" % pathname)
Greg Ward7ec05352000-09-22 01:05:43 +0000201
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000202 paths = pathname.split('/')
Jack Jansenb4cd5c12001-01-28 12:23:32 +0000203 while '.' in paths:
204 paths.remove('.')
205 if not paths:
206 return os.curdir
Neal Norwitzd9108552006-03-17 08:00:19 +0000207 return os.path.join(*paths)
Greg Ward50919292000-03-07 03:27:08 +0000208
Tarek Ziadé36797272010-07-22 12:50:05 +0000209# convert_path ()
Greg Ward1b4ede52000-03-22 00:22:44 +0000210
211
Tarek Ziadé36797272010-07-22 12:50:05 +0000212def change_root (new_root, pathname):
213 """Return 'pathname' with 'new_root' prepended. If 'pathname' is
214 relative, this is equivalent to "os.path.join(new_root,pathname)".
Greg Ward67f75d42000-04-27 01:53:46 +0000215 Otherwise, it requires making 'pathname' relative and then joining the
Greg Ward4b46ef92000-05-31 02:14:32 +0000216 two, which is tricky on DOS/Windows and Mac OS.
217 """
218 if os.name == 'posix':
Greg Wardbe86bde2000-09-26 01:56:15 +0000219 if not os.path.isabs(pathname):
220 return os.path.join(new_root, pathname)
Greg Ward4b46ef92000-05-31 02:14:32 +0000221 else:
Greg Wardbe86bde2000-09-26 01:56:15 +0000222 return os.path.join(new_root, pathname[1:])
Greg Ward67f75d42000-04-27 01:53:46 +0000223
224 elif os.name == 'nt':
Greg Wardbe86bde2000-09-26 01:56:15 +0000225 (drive, path) = os.path.splitdrive(pathname)
Greg Ward4b46ef92000-05-31 02:14:32 +0000226 if path[0] == '\\':
227 path = path[1:]
Greg Wardbe86bde2000-09-26 01:56:15 +0000228 return os.path.join(new_root, path)
Greg Ward67f75d42000-04-27 01:53:46 +0000229
Marc-André Lemburg2544f512002-01-31 18:56:00 +0000230 elif os.name == 'os2':
231 (drive, path) = os.path.splitdrive(pathname)
232 if path[0] == os.sep:
233 path = path[1:]
234 return os.path.join(new_root, path)
235
Tarek Ziadé36797272010-07-22 12:50:05 +0000236 elif os.name == 'mac':
237 if not os.path.isabs(pathname):
238 return os.path.join(new_root, pathname)
239 else:
240 # Chop off volume name from start of path
241 elements = pathname.split(":", 1)
242 pathname = ":" + elements[1]
243 return os.path.join(new_root, pathname)
244
Greg Ward67f75d42000-04-27 01:53:46 +0000245 else:
Tarek Ziadé36797272010-07-22 12:50:05 +0000246 raise DistutilsPlatformError("nothing known about platform '%s'" % os.name)
247
Greg Ward67f75d42000-04-27 01:53:46 +0000248
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000249_environ_checked = 0
Tarek Ziadé36797272010-07-22 12:50:05 +0000250def check_environ ():
251 """Ensure that 'os.environ' has all the environment variables we
252 guarantee that users can use in config files, command-line options,
Greg Wardb8b263b2000-09-30 18:40:42 +0000253 etc. Currently this includes:
254 HOME - user's home directory (Unix only)
255 PLAT - description of the current platform, including hardware
256 and OS (see 'get_platform()')
Greg Ward1b4ede52000-03-22 00:22:44 +0000257 """
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000258 global _environ_checked
259 if _environ_checked:
260 return
261
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000262 if os.name == 'posix' and 'HOME' not in os.environ:
Greg Ward1b4ede52000-03-22 00:22:44 +0000263 import pwd
Greg Wardbe86bde2000-09-26 01:56:15 +0000264 os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
Greg Ward1b4ede52000-03-22 00:22:44 +0000265
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000266 if 'PLAT' not in os.environ:
Tarek Ziadé36797272010-07-22 12:50:05 +0000267 os.environ['PLAT'] = get_platform()
Greg Ward1b4ede52000-03-22 00:22:44 +0000268
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000269 _environ_checked = 1
270
Greg Ward1b4ede52000-03-22 00:22:44 +0000271
Tarek Ziadé36797272010-07-22 12:50:05 +0000272def subst_vars (s, local_vars):
273 """Perform shell/Perl-style variable substitution on 'string'. Every
274 occurrence of '$' followed by a name is considered a variable, and
Greg Ward47527692000-09-30 18:49:14 +0000275 variable is substituted by the value found in the 'local_vars'
276 dictionary, or in 'os.environ' if it's not in 'local_vars'.
277 'os.environ' is first checked/augmented to guarantee that it contains
278 certain values: see 'check_environ()'. Raise ValueError for any
279 variables not found in either 'local_vars' or 'os.environ'.
Greg Wardb8b263b2000-09-30 18:40:42 +0000280 """
Greg Wardbe86bde2000-09-26 01:56:15 +0000281 check_environ()
Greg Ward1b4ede52000-03-22 00:22:44 +0000282 def _subst (match, local_vars=local_vars):
283 var_name = match.group(1)
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000284 if var_name in local_vars:
Greg Wardbe86bde2000-09-26 01:56:15 +0000285 return str(local_vars[var_name])
Greg Ward1b4ede52000-03-22 00:22:44 +0000286 else:
287 return os.environ[var_name]
288
Greg Ward47527692000-09-30 18:49:14 +0000289 try:
Jeremy Hylton5e2d0762001-01-25 20:10:32 +0000290 return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
Guido van Rossumb940e112007-01-10 16:19:56 +0000291 except KeyError as var:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000292 raise ValueError("invalid variable '$%s'" % var)
Greg Ward1b4ede52000-03-22 00:22:44 +0000293
Tarek Ziadé36797272010-07-22 12:50:05 +0000294# subst_vars ()
Greg Ward7c1a6d42000-03-29 02:48:40 +0000295
Tarek Ziadé36797272010-07-22 12:50:05 +0000296
297def grok_environment_error (exc, prefix="error: "):
298 """Generate a useful error message from an EnvironmentError (IOError or
299 OSError) exception object. Handles Python 1.5.1 and 1.5.2 styles, and
Greg Warde9055132000-06-17 02:16:46 +0000300 does what it can to deal with exception objects that don't have a
301 filename (which happens when the error is due to a two-file operation,
302 such as 'rename()' or 'link()'. Returns the error message as a string
303 prefixed with 'prefix'.
304 """
305 # check for Python 1.5.2-style {IO,OS}Error exception objects
Greg Wardbe86bde2000-09-26 01:56:15 +0000306 if hasattr(exc, 'filename') and hasattr(exc, 'strerror'):
Greg Warde9055132000-06-17 02:16:46 +0000307 if exc.filename:
308 error = prefix + "%s: %s" % (exc.filename, exc.strerror)
309 else:
310 # two-argument functions in posix module don't
311 # include the filename in the exception object!
312 error = prefix + "%s" % exc.strerror
313 else:
Georg Brandl5dfe0de2008-01-06 21:41:49 +0000314 error = prefix + str(exc.args[-1])
Greg Warde9055132000-06-17 02:16:46 +0000315
316 return error
Greg Ward6a2a3db2000-06-24 20:40:02 +0000317
Tarek Ziadé36797272010-07-22 12:50:05 +0000318
Greg Ward6a2a3db2000-06-24 20:40:02 +0000319# Needed by 'split_quoted()'
Martin v. Löwis1c0f1f92004-03-25 14:58:19 +0000320_wordchars_re = _squote_re = _dquote_re = None
321def _init_regex():
322 global _wordchars_re, _squote_re, _dquote_re
323 _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
324 _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
325 _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')
Greg Ward6a2a3db2000-06-24 20:40:02 +0000326
Tarek Ziadé36797272010-07-22 12:50:05 +0000327def split_quoted (s):
Greg Ward6a2a3db2000-06-24 20:40:02 +0000328 """Split a string up according to Unix shell-like rules for quotes and
Tarek Ziadé36797272010-07-22 12:50:05 +0000329 backslashes. In short: words are delimited by spaces, as long as those
Greg Ward6a2a3db2000-06-24 20:40:02 +0000330 spaces are not escaped by a backslash, or inside a quoted string.
331 Single and double quotes are equivalent, and the quote characters can
332 be backslash-escaped. The backslash is stripped from any two-character
333 escape sequence, leaving only the escaped character. The quote
334 characters are stripped from any quoted string. Returns a list of
335 words.
336 """
Tarek Ziadé36797272010-07-22 12:50:05 +0000337
Greg Ward6a2a3db2000-06-24 20:40:02 +0000338 # This is a nice algorithm for splitting up a single string, since it
339 # doesn't require character-by-character examination. It was a little
340 # bit of a brain-bender to get it working right, though...
Martin v. Löwis1c0f1f92004-03-25 14:58:19 +0000341 if _wordchars_re is None: _init_regex()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000342
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000343 s = s.strip()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000344 words = []
345 pos = 0
346
347 while s:
348 m = _wordchars_re.match(s, pos)
349 end = m.end()
350 if end == len(s):
351 words.append(s[:end])
352 break
353
Greg Ward2b042de2000-08-08 14:38:13 +0000354 if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
Greg Ward6a2a3db2000-06-24 20:40:02 +0000355 words.append(s[:end]) # we definitely have a word delimiter
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000356 s = s[end:].lstrip()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000357 pos = 0
358
359 elif s[end] == '\\': # preserve whatever is being escaped;
360 # will become part of the current word
361 s = s[:end] + s[end+1:]
362 pos = end+1
363
364 else:
365 if s[end] == "'": # slurp singly-quoted string
366 m = _squote_re.match(s, end)
367 elif s[end] == '"': # slurp doubly-quoted string
368 m = _dquote_re.match(s, end)
369 else:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000370 raise RuntimeError("this can't happen (bad char '%c')" % s[end])
Greg Ward6a2a3db2000-06-24 20:40:02 +0000371
372 if m is None:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000373 raise ValueError("bad string (mismatched %s quotes?)" % s[end])
Greg Ward6a2a3db2000-06-24 20:40:02 +0000374
375 (beg, end) = m.span()
376 s = s[:beg] + s[beg+1:end-1] + s[end:]
377 pos = m.end() - 2
378
379 if pos >= len(s):
380 words.append(s)
381 break
382
383 return words
384
Tarek Ziadé36797272010-07-22 12:50:05 +0000385# split_quoted ()
Greg Ward1c16ac32000-08-02 01:37:30 +0000386
387
Tarek Ziadé36797272010-07-22 12:50:05 +0000388def execute (func, args, msg=None, verbose=0, dry_run=0):
389 """Perform some action that affects the outside world (eg. by
390 writing to the filesystem). Such actions are special because they
391 are disabled by the 'dry_run' flag. This method takes care of all
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000392 that bureaucracy for you; all you have to do is supply the
393 function to call and an argument tuple for it (to embody the
394 "external action" being performed), and an optional message to
395 print.
Greg Ward1c16ac32000-08-02 01:37:30 +0000396 """
Greg Ward1c16ac32000-08-02 01:37:30 +0000397 if msg is None:
Walter Dörwald70a6b492004-02-12 17:35:32 +0000398 msg = "%s%r" % (func.__name__, args)
Fred Drakeb94b8492001-12-06 20:51:35 +0000399 if msg[-2:] == ',)': # correct for singleton tuple
Greg Ward1c16ac32000-08-02 01:37:30 +0000400 msg = msg[0:-2] + ')'
401
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000402 log.info(msg)
Greg Ward1c16ac32000-08-02 01:37:30 +0000403 if not dry_run:
Neal Norwitzd9108552006-03-17 08:00:19 +0000404 func(*args)
Greg Ward1c16ac32000-08-02 01:37:30 +0000405
Greg Ward817dc092000-09-25 01:25:06 +0000406
Tarek Ziadé36797272010-07-22 12:50:05 +0000407def strtobool (val):
Greg Ward817dc092000-09-25 01:25:06 +0000408 """Convert a string representation of truth to true (1) or false (0).
Tim Peters182b5ac2004-07-18 06:16:08 +0000409
Greg Ward817dc092000-09-25 01:25:06 +0000410 True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
411 are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if
412 'val' is anything else.
413 """
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000414 val = val.lower()
Greg Ward817dc092000-09-25 01:25:06 +0000415 if val in ('y', 'yes', 't', 'true', 'on', '1'):
416 return 1
417 elif val in ('n', 'no', 'f', 'false', 'off', '0'):
418 return 0
419 else:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000420 raise ValueError("invalid truth value %r" % (val,))
Greg Ward1297b5c2000-09-30 20:37:56 +0000421
422
Tarek Ziadé36797272010-07-22 12:50:05 +0000423def byte_compile (py_files,
424 optimize=0, force=0,
425 prefix=None, base_dir=None,
426 verbose=1, dry_run=0,
427 direct=None):
Greg Wardf217e212000-10-01 23:49:30 +0000428 """Byte-compile a collection of Python source files to either .pyc
Tarek Ziadé36797272010-07-22 12:50:05 +0000429 or .pyo files in the same directory. 'py_files' is a list of files
430 to compile; any files that don't end in ".py" are silently skipped.
431 'optimize' must be one of the following:
Greg Ward1297b5c2000-09-30 20:37:56 +0000432 0 - don't optimize (generate .pyc)
433 1 - normal optimization (like "python -O")
434 2 - extra optimization (like "python -OO")
435 If 'force' is true, all files are recompiled regardless of
436 timestamps.
437
438 The source filename encoded in each bytecode file defaults to the
439 filenames listed in 'py_files'; you can modify these with 'prefix' and
440 'basedir'. 'prefix' is a string that will be stripped off of each
441 source filename, and 'base_dir' is a directory name that will be
442 prepended (after 'prefix' is stripped). You can supply either or both
443 (or neither) of 'prefix' and 'base_dir', as you wish.
444
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000445 If 'dry_run' is true, doesn't actually do anything that would
446 affect the filesystem.
Greg Ward1297b5c2000-09-30 20:37:56 +0000447
448 Byte-compilation is either done directly in this interpreter process
449 with the standard py_compile module, or indirectly by writing a
450 temporary script and executing it. Normally, you should let
451 'byte_compile()' figure out to use direct compilation or not (see
452 the source for details). The 'direct' flag is used by the script
453 generated in indirect mode; unless you know what you're doing, leave
454 it set to None.
455 """
Tarek Ziadé04fe7c02009-10-25 23:08:47 +0000456 # nothing is done if sys.dont_write_bytecode is True
457 if sys.dont_write_bytecode:
458 raise DistutilsByteCompileError('byte-compiling is disabled.')
459
Greg Ward1297b5c2000-09-30 20:37:56 +0000460 # First, if the caller didn't force us into direct or indirect mode,
461 # figure out which mode we should be in. We take a conservative
462 # approach: choose direct mode *only* if the current interpreter is
463 # in debug mode and optimize is 0. If we're not in debug mode (-O
464 # or -OO), we don't know which level of optimization this
465 # interpreter is running with, so we can't do direct
466 # byte-compilation and be certain that it's the right thing. Thus,
467 # always compile indirectly if the current interpreter is in either
468 # optimize mode, or if either optimization level was requested by
469 # the caller.
470 if direct is None:
471 direct = (__debug__ and optimize == 0)
472
473 # "Indirect" byte-compilation: write a temporary script and then
474 # run it with the appropriate flags.
475 if not direct:
Marc-André Lemburg03750792002-12-03 08:45:11 +0000476 try:
477 from tempfile import mkstemp
478 (script_fd, script_name) = mkstemp(".py")
479 except ImportError:
480 from tempfile import mktemp
481 (script_fd, script_name) = None, mktemp(".py")
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000482 log.info("writing byte-compilation script '%s'", script_name)
Greg Ward1297b5c2000-09-30 20:37:56 +0000483 if not dry_run:
Marc-André Lemburg03750792002-12-03 08:45:11 +0000484 if script_fd is not None:
485 script = os.fdopen(script_fd, "w")
486 else:
487 script = open(script_name, "w")
Greg Ward1297b5c2000-09-30 20:37:56 +0000488
489 script.write("""\
490from distutils.util import byte_compile
491files = [
492""")
Greg Ward9216cfe2000-10-03 03:31:05 +0000493
494 # XXX would be nice to write absolute filenames, just for
495 # safety's sake (script should be more robust in the face of
496 # chdir'ing before running it). But this requires abspath'ing
497 # 'prefix' as well, and that breaks the hack in build_lib's
498 # 'byte_compile()' method that carefully tacks on a trailing
499 # slash (os.sep really) to make sure the prefix here is "just
500 # right". This whole prefix business is rather delicate -- the
501 # problem is that it's really a directory, but I'm treating it
502 # as a dumb string, so trailing slashes and so forth matter.
503
504 #py_files = map(os.path.abspath, py_files)
505 #if prefix:
506 # prefix = os.path.abspath(prefix)
507
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000508 script.write(",\n".join(map(repr, py_files)) + "]\n")
Greg Ward1297b5c2000-09-30 20:37:56 +0000509 script.write("""
Walter Dörwald70a6b492004-02-12 17:35:32 +0000510byte_compile(files, optimize=%r, force=%r,
511 prefix=%r, base_dir=%r,
512 verbose=%r, dry_run=0,
Greg Ward1297b5c2000-09-30 20:37:56 +0000513 direct=1)
Walter Dörwald70a6b492004-02-12 17:35:32 +0000514""" % (optimize, force, prefix, base_dir, verbose))
Greg Ward1297b5c2000-09-30 20:37:56 +0000515
516 script.close()
517
518 cmd = [sys.executable, script_name]
519 if optimize == 1:
520 cmd.insert(1, "-O")
521 elif optimize == 2:
522 cmd.insert(1, "-OO")
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000523 spawn(cmd, dry_run=dry_run)
Greg Ward9216cfe2000-10-03 03:31:05 +0000524 execute(os.remove, (script_name,), "removing %s" % script_name,
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000525 dry_run=dry_run)
Fred Drakeb94b8492001-12-06 20:51:35 +0000526
Greg Ward1297b5c2000-09-30 20:37:56 +0000527 # "Direct" byte-compilation: use the py_compile module to compile
528 # right here, right now. Note that the script generated in indirect
529 # mode simply calls 'byte_compile()' in direct mode, a weird sort of
530 # cross-process recursion. Hey, it works!
531 else:
532 from py_compile import compile
533
534 for file in py_files:
535 if file[-3:] != ".py":
Greg Wardf217e212000-10-01 23:49:30 +0000536 # This lets us be lazy and not filter filenames in
537 # the "install_lib" command.
538 continue
Greg Ward1297b5c2000-09-30 20:37:56 +0000539
540 # Terminology from the py_compile module:
541 # cfile - byte-compiled file
542 # dfile - purported source filename (same as 'file' by default)
543 cfile = file + (__debug__ and "c" or "o")
544 dfile = file
545 if prefix:
546 if file[:len(prefix)] != prefix:
Tarek Ziadé36797272010-07-22 12:50:05 +0000547 raise ValueError("invalid prefix: filename %r doesn't start with %r"
548 % (file, prefix))
Greg Ward1297b5c2000-09-30 20:37:56 +0000549 dfile = dfile[len(prefix):]
550 if base_dir:
551 dfile = os.path.join(base_dir, dfile)
552
553 cfile_base = os.path.basename(cfile)
554 if direct:
555 if force or newer(file, cfile):
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000556 log.info("byte-compiling %s to %s", file, cfile_base)
Greg Ward1297b5c2000-09-30 20:37:56 +0000557 if not dry_run:
558 compile(file, cfile, dfile)
559 else:
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000560 log.debug("skipping byte-compilation of %s to %s",
561 file, cfile_base)
Greg Ward1297b5c2000-09-30 20:37:56 +0000562
Tarek Ziadé36797272010-07-22 12:50:05 +0000563# byte_compile ()
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000564
Tarek Ziadé36797272010-07-22 12:50:05 +0000565def rfc822_escape (header):
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000566 """Return a version of the string escaped for inclusion in an
Andrew M. Kuchling88b08842001-03-23 17:30:26 +0000567 RFC-822 header, by ensuring there are 8 spaces space after each newline.
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000568 """
Tarek Ziadédf872d42009-12-06 09:28:17 +0000569 lines = header.split('\n')
570 sep = '\n' + 8 * ' '
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000571 return sep.join(lines)
Martin v. Löwis6178db62008-12-01 04:38:52 +0000572
573# 2to3 support
574
575def run_2to3(files, fixer_names=None, options=None, explicit=None):
576 """Invoke 2to3 on a list of Python files.
577 The files should all come from the build area, as the
578 modification is done in-place. To reduce the build time,
579 only files modified since the last invocation of this
580 function should be passed in the files argument."""
581
582 if not files:
583 return
584
585 # Make this class local, to delay import of 2to3
586 from lib2to3.refactor import RefactoringTool, get_fixers_from_package
587 class DistutilsRefactoringTool(RefactoringTool):
588 def log_error(self, msg, *args, **kw):
589 log.error(msg, *args)
590
591 def log_message(self, msg, *args):
592 log.info(msg, *args)
593
594 def log_debug(self, msg, *args):
595 log.debug(msg, *args)
596
597 if fixer_names is None:
598 fixer_names = get_fixers_from_package('lib2to3.fixes')
599 r = DistutilsRefactoringTool(fixer_names, options=options)
600 r.refactor(files, write=True)
601
Georg Brandl6d4a9cf2009-03-31 00:34:54 +0000602def copydir_run_2to3(src, dest, template=None, fixer_names=None,
603 options=None, explicit=None):
604 """Recursively copy a directory, only copying new and changed files,
605 running run_2to3 over all newly copied Python modules afterward.
606
607 If you give a template string, it's parsed like a MANIFEST.in.
608 """
609 from distutils.dir_util import mkpath
610 from distutils.file_util import copy_file
611 from distutils.filelist import FileList
612 filelist = FileList()
613 curdir = os.getcwd()
614 os.chdir(src)
615 try:
616 filelist.findall()
617 finally:
618 os.chdir(curdir)
619 filelist.files[:] = filelist.allfiles
620 if template:
621 for line in template.splitlines():
622 line = line.strip()
623 if not line: continue
624 filelist.process_template_line(line)
625 copied = []
626 for filename in filelist.files:
627 outname = os.path.join(dest, filename)
628 mkpath(os.path.dirname(outname))
629 res = copy_file(os.path.join(src, filename), outname, update=1)
630 if res[1]: copied.append(outname)
631 run_2to3([fn for fn in copied if fn.lower().endswith('.py')],
632 fixer_names=fixer_names, options=options, explicit=explicit)
633 return copied
634
Martin v. Löwis6178db62008-12-01 04:38:52 +0000635class Mixin2to3:
636 '''Mixin class for commands that run 2to3.
637 To configure 2to3, setup scripts may either change
638 the class variables, or inherit from individual commands
639 to override how 2to3 is invoked.'''
640
641 # provide list of fixers to run;
642 # defaults to all from lib2to3.fixers
643 fixer_names = None
644
645 # options dictionary
646 options = None
647
648 # list of fixers to invoke even though they are marked as explicit
649 explicit = None
650
651 def run_2to3(self, files):
652 return run_2to3(files, self.fixer_names, self.options, self.explicit)