blob: 3081245b62523213a71e5b13bbf065d829f64bb7 [file] [log] [blame]
Greg Ward2689e3d1999-03-22 14:52:19 +00001"""distutils.util
2
Greg Wardaebf7062000-04-04 02:05:59 +00003Miscellaneous utility functions -- anything that doesn't fit into
Greg Ward47527692000-09-30 18:49:14 +00004one of the other *util.py modules.
5"""
Greg Ward2689e3d1999-03-22 14:52:19 +00006
Greg Ward3ce77fd2000-03-02 01:49:45 +00007__revision__ = "$Id$"
Greg Ward2689e3d1999-03-22 14:52:19 +00008
Greg Ward1297b5c2000-09-30 20:37:56 +00009import sys, os, string, re
10from distutils.errors import DistutilsPlatformError
11from distutils.dep_util import newer
Tarek Ziadé36797272010-07-22 12:50:05 +000012from distutils.spawn import spawn
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +000013from distutils import log
Tarek Ziadé04fe7c02009-10-25 23:08:47 +000014from distutils.errors import DistutilsByteCompileError
Greg Wardaa458bc2000-04-22 15:14:58 +000015
Tarek Ziadé36797272010-07-22 12:50:05 +000016def get_platform ():
17 """Return a string that identifies the current platform. This is used
18 mainly to distinguish platform-specific build directories and
19 platform-specific built distributions. Typically includes the OS name
20 and version and the architecture (as supplied by 'os.uname()'),
21 although the exact information included depends on the OS; eg. for IRIX
22 the architecture isn't particularly important (IRIX only runs on SGI
23 hardware), but for Linux the kernel version isn't particularly
24 important.
Tarek Ziadé8b441d02010-01-29 11:46:31 +000025
Tarek Ziadé36797272010-07-22 12:50:05 +000026 Examples of returned values:
27 linux-i586
28 linux-alpha (?)
29 solaris-2.6-sun4u
30 irix-5.3
31 irix64-6.2
Tarek Ziadé8b441d02010-01-29 11:46:31 +000032
Tarek Ziadé36797272010-07-22 12:50:05 +000033 Windows will return one of:
34 win-amd64 (64bit Windows on AMD64 (aka x86_64, Intel64, EM64T, etc)
35 win-ia64 (64bit Windows on Itanium)
36 win32 (all others - specifically, sys.platform is returned)
37
38 For other non-POSIX platforms, currently just returns 'sys.platform'.
Tarek Ziadé8b441d02010-01-29 11:46:31 +000039 """
Tarek Ziadé36797272010-07-22 12:50:05 +000040 if os.name == 'nt':
41 # sniff sys.version for architecture.
42 prefix = " bit ("
43 i = sys.version.find(prefix)
44 if i == -1:
45 return sys.platform
46 j = sys.version.find(")", i)
47 look = sys.version[i+len(prefix):j].lower()
48 if look == 'amd64':
49 return 'win-amd64'
50 if look == 'itanium':
51 return 'win-ia64'
52 return sys.platform
Tarek Ziadé8b441d02010-01-29 11:46:31 +000053
Tarek Ziadé36797272010-07-22 12:50:05 +000054 if os.name != "posix" or not hasattr(os, 'uname'):
55 # XXX what about the architecture? NT is Intel or Alpha,
56 # Mac OS is M68k or PPC, etc.
57 return sys.platform
Tarek Ziadé8b441d02010-01-29 11:46:31 +000058
Tarek Ziadé36797272010-07-22 12:50:05 +000059 # Try to distinguish various flavours of Unix
Greg Ward50919292000-03-07 03:27:08 +000060
Tarek Ziadé36797272010-07-22 12:50:05 +000061 (osname, host, release, version, machine) = os.uname()
Greg Ward50919292000-03-07 03:27:08 +000062
Tarek Ziadé36797272010-07-22 12:50:05 +000063 # Convert the OS name to lowercase, remove '/' characters
64 # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh")
65 osname = osname.lower().replace('/', '')
66 machine = machine.replace(' ', '_')
67 machine = machine.replace('/', '-')
68
69 if osname[:5] == "linux":
70 # At least on Linux/Intel, 'machine' is the processor --
71 # i386, etc.
72 # XXX what about Alpha, SPARC, etc?
73 return "%s-%s" % (osname, machine)
74 elif osname[:5] == "sunos":
75 if release[0] >= "5": # SunOS 5 == Solaris 2
76 osname = "solaris"
77 release = "%d.%s" % (int(release[0]) - 3, release[2:])
78 # fall through to standard osname-release-machine representation
79 elif osname[:4] == "irix": # could be "irix64"!
80 return "%s-%s" % (osname, release)
81 elif osname[:3] == "aix":
82 return "%s-%s.%s" % (osname, version, release)
83 elif osname[:6] == "cygwin":
84 osname = "cygwin"
85 rel_re = re.compile (r'[\d.]+', re.ASCII)
86 m = rel_re.match(release)
87 if m:
88 release = m.group()
89 elif osname[:6] == "darwin":
90 #
91 # For our purposes, we'll assume that the system version from
92 # distutils' perspective is what MACOSX_DEPLOYMENT_TARGET is set
93 # to. This makes the compatibility story a bit more sane because the
94 # machine is going to compile and link as if it were
95 # MACOSX_DEPLOYMENT_TARGET.
96 from distutils.sysconfig import get_config_vars
97 cfgvars = get_config_vars()
98
99 macver = os.environ.get('MACOSX_DEPLOYMENT_TARGET')
100 if not macver:
101 macver = cfgvars.get('MACOSX_DEPLOYMENT_TARGET')
102
103 if 1:
104 # Always calculate the release of the running machine,
105 # needed to determine if we can build fat binaries or not.
106
107 macrelease = macver
108 # Get the system version. Reading this plist is a documented
109 # way to get the system version (see the documentation for
110 # the Gestalt Manager)
111 try:
112 f = open('/System/Library/CoreServices/SystemVersion.plist')
113 except IOError:
114 # We're on a plain darwin box, fall back to the default
115 # behaviour.
116 pass
117 else:
Éric Araujobee5cef2010-11-05 23:51:56 +0000118 try:
119 m = re.search(
120 r'<key>ProductUserVisibleVersion</key>\s*' +
121 r'<string>(.*?)</string>', f.read())
122 if m is not None:
123 macrelease = '.'.join(m.group(1).split('.')[:2])
124 # else: fall back to the default behaviour
125 finally:
126 f.close()
Tarek Ziadé36797272010-07-22 12:50:05 +0000127
128 if not macver:
129 macver = macrelease
130
131 if macver:
132 from distutils.sysconfig import get_config_vars
133 release = macver
134 osname = "macosx"
135
136 if (macrelease + '.') >= '10.4.' and \
137 '-arch' in get_config_vars().get('CFLAGS', '').strip():
138 # The universal build will build fat binaries, but not on
139 # systems before 10.4
140 #
141 # Try to detect 4-way universal builds, those have machine-type
142 # 'universal' instead of 'fat'.
143
144 machine = 'fat'
145 cflags = get_config_vars().get('CFLAGS')
146
147 archs = re.findall('-arch\s+(\S+)', cflags)
148 archs = tuple(sorted(set(archs)))
149
150 if len(archs) == 1:
151 machine = archs[0]
152 elif archs == ('i386', 'ppc'):
153 machine = 'fat'
154 elif archs == ('i386', 'x86_64'):
155 machine = 'intel'
156 elif archs == ('i386', 'ppc', 'x86_64'):
157 machine = 'fat3'
158 elif archs == ('ppc64', 'x86_64'):
159 machine = 'fat64'
160 elif archs == ('i386', 'ppc', 'ppc64', 'x86_64'):
161 machine = 'universal'
162 else:
163 raise ValueError(
164 "Don't know machine value for archs=%r"%(archs,))
165
166 elif machine == 'i386':
167 # On OSX the machine type returned by uname is always the
168 # 32-bit variant, even if the executable architecture is
169 # the 64-bit variant
170 if sys.maxsize >= 2**32:
171 machine = 'x86_64'
172
173 elif machine in ('PowerPC', 'Power_Macintosh'):
174 # Pick a sane name for the PPC architecture.
175 machine = 'ppc'
176
177 # See 'i386' case
178 if sys.maxsize >= 2**32:
179 machine = 'ppc64'
180
181 return "%s-%s-%s" % (osname, release, machine)
182
183# get_platform ()
184
185
186def convert_path (pathname):
187 """Return 'pathname' as a name that will work on the native filesystem,
Greg Wardb8b263b2000-09-30 18:40:42 +0000188 i.e. split it on '/' and put it back together again using the current
189 directory separator. Needed because filenames in the setup script are
190 always supplied in Unix style, and have to be converted to the local
191 convention before we can actually use them in the filesystem. Raises
Greg Ward47527692000-09-30 18:49:14 +0000192 ValueError on non-Unix-ish systems if 'pathname' either starts or
193 ends with a slash.
Greg Wardb8b263b2000-09-30 18:40:42 +0000194 """
Greg Ward7ec05352000-09-22 01:05:43 +0000195 if os.sep == '/':
196 return pathname
Neal Norwitzb0df6a12002-08-13 17:42:57 +0000197 if not pathname:
198 return pathname
199 if pathname[0] == '/':
Collin Winter5b7e9d72007-08-30 03:52:21 +0000200 raise ValueError("path '%s' cannot be absolute" % pathname)
Neal Norwitzb0df6a12002-08-13 17:42:57 +0000201 if pathname[-1] == '/':
Collin Winter5b7e9d72007-08-30 03:52:21 +0000202 raise ValueError("path '%s' cannot end with '/'" % pathname)
Greg Ward7ec05352000-09-22 01:05:43 +0000203
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000204 paths = pathname.split('/')
Jack Jansenb4cd5c12001-01-28 12:23:32 +0000205 while '.' in paths:
206 paths.remove('.')
207 if not paths:
208 return os.curdir
Neal Norwitzd9108552006-03-17 08:00:19 +0000209 return os.path.join(*paths)
Greg Ward50919292000-03-07 03:27:08 +0000210
Tarek Ziadé36797272010-07-22 12:50:05 +0000211# convert_path ()
Greg Ward1b4ede52000-03-22 00:22:44 +0000212
213
Tarek Ziadé36797272010-07-22 12:50:05 +0000214def change_root (new_root, pathname):
215 """Return 'pathname' with 'new_root' prepended. If 'pathname' is
216 relative, this is equivalent to "os.path.join(new_root,pathname)".
Greg Ward67f75d42000-04-27 01:53:46 +0000217 Otherwise, it requires making 'pathname' relative and then joining the
Greg Ward4b46ef92000-05-31 02:14:32 +0000218 two, which is tricky on DOS/Windows and Mac OS.
219 """
220 if os.name == 'posix':
Greg Wardbe86bde2000-09-26 01:56:15 +0000221 if not os.path.isabs(pathname):
222 return os.path.join(new_root, pathname)
Greg Ward4b46ef92000-05-31 02:14:32 +0000223 else:
Greg Wardbe86bde2000-09-26 01:56:15 +0000224 return os.path.join(new_root, pathname[1:])
Greg Ward67f75d42000-04-27 01:53:46 +0000225
226 elif os.name == 'nt':
Greg Wardbe86bde2000-09-26 01:56:15 +0000227 (drive, path) = os.path.splitdrive(pathname)
Greg Ward4b46ef92000-05-31 02:14:32 +0000228 if path[0] == '\\':
229 path = path[1:]
Greg Wardbe86bde2000-09-26 01:56:15 +0000230 return os.path.join(new_root, path)
Greg Ward67f75d42000-04-27 01:53:46 +0000231
Marc-André Lemburg2544f512002-01-31 18:56:00 +0000232 elif os.name == 'os2':
233 (drive, path) = os.path.splitdrive(pathname)
234 if path[0] == os.sep:
235 path = path[1:]
236 return os.path.join(new_root, path)
237
Tarek Ziadé36797272010-07-22 12:50:05 +0000238 elif os.name == 'mac':
239 if not os.path.isabs(pathname):
240 return os.path.join(new_root, pathname)
241 else:
242 # Chop off volume name from start of path
243 elements = pathname.split(":", 1)
244 pathname = ":" + elements[1]
245 return os.path.join(new_root, pathname)
246
Greg Ward67f75d42000-04-27 01:53:46 +0000247 else:
Tarek Ziadé36797272010-07-22 12:50:05 +0000248 raise DistutilsPlatformError("nothing known about platform '%s'" % os.name)
249
Greg Ward67f75d42000-04-27 01:53:46 +0000250
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000251_environ_checked = 0
Tarek Ziadé36797272010-07-22 12:50:05 +0000252def check_environ ():
253 """Ensure that 'os.environ' has all the environment variables we
254 guarantee that users can use in config files, command-line options,
Greg Wardb8b263b2000-09-30 18:40:42 +0000255 etc. Currently this includes:
256 HOME - user's home directory (Unix only)
257 PLAT - description of the current platform, including hardware
258 and OS (see 'get_platform()')
Greg Ward1b4ede52000-03-22 00:22:44 +0000259 """
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000260 global _environ_checked
261 if _environ_checked:
262 return
263
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000264 if os.name == 'posix' and 'HOME' not in os.environ:
Greg Ward1b4ede52000-03-22 00:22:44 +0000265 import pwd
Greg Wardbe86bde2000-09-26 01:56:15 +0000266 os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
Greg Ward1b4ede52000-03-22 00:22:44 +0000267
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000268 if 'PLAT' not in os.environ:
Tarek Ziadé36797272010-07-22 12:50:05 +0000269 os.environ['PLAT'] = get_platform()
Greg Ward1b4ede52000-03-22 00:22:44 +0000270
Gregory P. Smithe7e35ac2000-05-12 00:40:00 +0000271 _environ_checked = 1
272
Greg Ward1b4ede52000-03-22 00:22:44 +0000273
Tarek Ziadé36797272010-07-22 12:50:05 +0000274def subst_vars (s, local_vars):
275 """Perform shell/Perl-style variable substitution on 'string'. Every
276 occurrence of '$' followed by a name is considered a variable, and
Greg Ward47527692000-09-30 18:49:14 +0000277 variable is substituted by the value found in the 'local_vars'
278 dictionary, or in 'os.environ' if it's not in 'local_vars'.
279 'os.environ' is first checked/augmented to guarantee that it contains
280 certain values: see 'check_environ()'. Raise ValueError for any
281 variables not found in either 'local_vars' or 'os.environ'.
Greg Wardb8b263b2000-09-30 18:40:42 +0000282 """
Greg Wardbe86bde2000-09-26 01:56:15 +0000283 check_environ()
Greg Ward1b4ede52000-03-22 00:22:44 +0000284 def _subst (match, local_vars=local_vars):
285 var_name = match.group(1)
Guido van Rossume2b70bc2006-08-18 22:13:04 +0000286 if var_name in local_vars:
Greg Wardbe86bde2000-09-26 01:56:15 +0000287 return str(local_vars[var_name])
Greg Ward1b4ede52000-03-22 00:22:44 +0000288 else:
289 return os.environ[var_name]
290
Greg Ward47527692000-09-30 18:49:14 +0000291 try:
Jeremy Hylton5e2d0762001-01-25 20:10:32 +0000292 return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
Guido van Rossumb940e112007-01-10 16:19:56 +0000293 except KeyError as var:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000294 raise ValueError("invalid variable '$%s'" % var)
Greg Ward1b4ede52000-03-22 00:22:44 +0000295
Tarek Ziadé36797272010-07-22 12:50:05 +0000296# subst_vars ()
Greg Ward7c1a6d42000-03-29 02:48:40 +0000297
Tarek Ziadé36797272010-07-22 12:50:05 +0000298
299def grok_environment_error (exc, prefix="error: "):
300 """Generate a useful error message from an EnvironmentError (IOError or
301 OSError) exception object. Handles Python 1.5.1 and 1.5.2 styles, and
Greg Warde9055132000-06-17 02:16:46 +0000302 does what it can to deal with exception objects that don't have a
303 filename (which happens when the error is due to a two-file operation,
304 such as 'rename()' or 'link()'. Returns the error message as a string
305 prefixed with 'prefix'.
306 """
307 # check for Python 1.5.2-style {IO,OS}Error exception objects
Greg Wardbe86bde2000-09-26 01:56:15 +0000308 if hasattr(exc, 'filename') and hasattr(exc, 'strerror'):
Greg Warde9055132000-06-17 02:16:46 +0000309 if exc.filename:
310 error = prefix + "%s: %s" % (exc.filename, exc.strerror)
311 else:
312 # two-argument functions in posix module don't
313 # include the filename in the exception object!
314 error = prefix + "%s" % exc.strerror
315 else:
Georg Brandl5dfe0de2008-01-06 21:41:49 +0000316 error = prefix + str(exc.args[-1])
Greg Warde9055132000-06-17 02:16:46 +0000317
318 return error
Greg Ward6a2a3db2000-06-24 20:40:02 +0000319
Tarek Ziadé36797272010-07-22 12:50:05 +0000320
Greg Ward6a2a3db2000-06-24 20:40:02 +0000321# Needed by 'split_quoted()'
Martin v. Löwis1c0f1f92004-03-25 14:58:19 +0000322_wordchars_re = _squote_re = _dquote_re = None
323def _init_regex():
324 global _wordchars_re, _squote_re, _dquote_re
325 _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
326 _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
327 _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')
Greg Ward6a2a3db2000-06-24 20:40:02 +0000328
Tarek Ziadé36797272010-07-22 12:50:05 +0000329def split_quoted (s):
Greg Ward6a2a3db2000-06-24 20:40:02 +0000330 """Split a string up according to Unix shell-like rules for quotes and
Tarek Ziadé36797272010-07-22 12:50:05 +0000331 backslashes. In short: words are delimited by spaces, as long as those
Greg Ward6a2a3db2000-06-24 20:40:02 +0000332 spaces are not escaped by a backslash, or inside a quoted string.
333 Single and double quotes are equivalent, and the quote characters can
334 be backslash-escaped. The backslash is stripped from any two-character
335 escape sequence, leaving only the escaped character. The quote
336 characters are stripped from any quoted string. Returns a list of
337 words.
338 """
Tarek Ziadé36797272010-07-22 12:50:05 +0000339
Greg Ward6a2a3db2000-06-24 20:40:02 +0000340 # This is a nice algorithm for splitting up a single string, since it
341 # doesn't require character-by-character examination. It was a little
342 # bit of a brain-bender to get it working right, though...
Martin v. Löwis1c0f1f92004-03-25 14:58:19 +0000343 if _wordchars_re is None: _init_regex()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000344
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000345 s = s.strip()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000346 words = []
347 pos = 0
348
349 while s:
350 m = _wordchars_re.match(s, pos)
351 end = m.end()
352 if end == len(s):
353 words.append(s[:end])
354 break
355
Greg Ward2b042de2000-08-08 14:38:13 +0000356 if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
Greg Ward6a2a3db2000-06-24 20:40:02 +0000357 words.append(s[:end]) # we definitely have a word delimiter
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000358 s = s[end:].lstrip()
Greg Ward6a2a3db2000-06-24 20:40:02 +0000359 pos = 0
360
361 elif s[end] == '\\': # preserve whatever is being escaped;
362 # will become part of the current word
363 s = s[:end] + s[end+1:]
364 pos = end+1
365
366 else:
367 if s[end] == "'": # slurp singly-quoted string
368 m = _squote_re.match(s, end)
369 elif s[end] == '"': # slurp doubly-quoted string
370 m = _dquote_re.match(s, end)
371 else:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000372 raise RuntimeError("this can't happen (bad char '%c')" % s[end])
Greg Ward6a2a3db2000-06-24 20:40:02 +0000373
374 if m is None:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000375 raise ValueError("bad string (mismatched %s quotes?)" % s[end])
Greg Ward6a2a3db2000-06-24 20:40:02 +0000376
377 (beg, end) = m.span()
378 s = s[:beg] + s[beg+1:end-1] + s[end:]
379 pos = m.end() - 2
380
381 if pos >= len(s):
382 words.append(s)
383 break
384
385 return words
386
Tarek Ziadé36797272010-07-22 12:50:05 +0000387# split_quoted ()
Greg Ward1c16ac32000-08-02 01:37:30 +0000388
389
Tarek Ziadé36797272010-07-22 12:50:05 +0000390def execute (func, args, msg=None, verbose=0, dry_run=0):
391 """Perform some action that affects the outside world (eg. by
392 writing to the filesystem). Such actions are special because they
393 are disabled by the 'dry_run' flag. This method takes care of all
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000394 that bureaucracy for you; all you have to do is supply the
395 function to call and an argument tuple for it (to embody the
396 "external action" being performed), and an optional message to
397 print.
Greg Ward1c16ac32000-08-02 01:37:30 +0000398 """
Greg Ward1c16ac32000-08-02 01:37:30 +0000399 if msg is None:
Walter Dörwald70a6b492004-02-12 17:35:32 +0000400 msg = "%s%r" % (func.__name__, args)
Fred Drakeb94b8492001-12-06 20:51:35 +0000401 if msg[-2:] == ',)': # correct for singleton tuple
Greg Ward1c16ac32000-08-02 01:37:30 +0000402 msg = msg[0:-2] + ')'
403
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000404 log.info(msg)
Greg Ward1c16ac32000-08-02 01:37:30 +0000405 if not dry_run:
Neal Norwitzd9108552006-03-17 08:00:19 +0000406 func(*args)
Greg Ward1c16ac32000-08-02 01:37:30 +0000407
Greg Ward817dc092000-09-25 01:25:06 +0000408
Tarek Ziadé36797272010-07-22 12:50:05 +0000409def strtobool (val):
Greg Ward817dc092000-09-25 01:25:06 +0000410 """Convert a string representation of truth to true (1) or false (0).
Tim Peters182b5ac2004-07-18 06:16:08 +0000411
Greg Ward817dc092000-09-25 01:25:06 +0000412 True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
413 are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if
414 'val' is anything else.
415 """
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000416 val = val.lower()
Greg Ward817dc092000-09-25 01:25:06 +0000417 if val in ('y', 'yes', 't', 'true', 'on', '1'):
418 return 1
419 elif val in ('n', 'no', 'f', 'false', 'off', '0'):
420 return 0
421 else:
Collin Winter5b7e9d72007-08-30 03:52:21 +0000422 raise ValueError("invalid truth value %r" % (val,))
Greg Ward1297b5c2000-09-30 20:37:56 +0000423
424
Tarek Ziadé36797272010-07-22 12:50:05 +0000425def byte_compile (py_files,
426 optimize=0, force=0,
427 prefix=None, base_dir=None,
428 verbose=1, dry_run=0,
429 direct=None):
Greg Wardf217e212000-10-01 23:49:30 +0000430 """Byte-compile a collection of Python source files to either .pyc
Tarek Ziadé36797272010-07-22 12:50:05 +0000431 or .pyo files in the same directory. 'py_files' is a list of files
432 to compile; any files that don't end in ".py" are silently skipped.
433 'optimize' must be one of the following:
Greg Ward1297b5c2000-09-30 20:37:56 +0000434 0 - don't optimize (generate .pyc)
435 1 - normal optimization (like "python -O")
436 2 - extra optimization (like "python -OO")
437 If 'force' is true, all files are recompiled regardless of
438 timestamps.
439
440 The source filename encoded in each bytecode file defaults to the
441 filenames listed in 'py_files'; you can modify these with 'prefix' and
442 'basedir'. 'prefix' is a string that will be stripped off of each
443 source filename, and 'base_dir' is a directory name that will be
444 prepended (after 'prefix' is stripped). You can supply either or both
445 (or neither) of 'prefix' and 'base_dir', as you wish.
446
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000447 If 'dry_run' is true, doesn't actually do anything that would
448 affect the filesystem.
Greg Ward1297b5c2000-09-30 20:37:56 +0000449
450 Byte-compilation is either done directly in this interpreter process
451 with the standard py_compile module, or indirectly by writing a
452 temporary script and executing it. Normally, you should let
453 'byte_compile()' figure out to use direct compilation or not (see
454 the source for details). The 'direct' flag is used by the script
455 generated in indirect mode; unless you know what you're doing, leave
456 it set to None.
457 """
Tarek Ziadé04fe7c02009-10-25 23:08:47 +0000458 # nothing is done if sys.dont_write_bytecode is True
459 if sys.dont_write_bytecode:
460 raise DistutilsByteCompileError('byte-compiling is disabled.')
461
Greg Ward1297b5c2000-09-30 20:37:56 +0000462 # First, if the caller didn't force us into direct or indirect mode,
463 # figure out which mode we should be in. We take a conservative
464 # approach: choose direct mode *only* if the current interpreter is
465 # in debug mode and optimize is 0. If we're not in debug mode (-O
466 # or -OO), we don't know which level of optimization this
467 # interpreter is running with, so we can't do direct
468 # byte-compilation and be certain that it's the right thing. Thus,
469 # always compile indirectly if the current interpreter is in either
470 # optimize mode, or if either optimization level was requested by
471 # the caller.
472 if direct is None:
473 direct = (__debug__ and optimize == 0)
474
475 # "Indirect" byte-compilation: write a temporary script and then
476 # run it with the appropriate flags.
477 if not direct:
Marc-André Lemburg03750792002-12-03 08:45:11 +0000478 try:
479 from tempfile import mkstemp
480 (script_fd, script_name) = mkstemp(".py")
481 except ImportError:
482 from tempfile import mktemp
483 (script_fd, script_name) = None, mktemp(".py")
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000484 log.info("writing byte-compilation script '%s'", script_name)
Greg Ward1297b5c2000-09-30 20:37:56 +0000485 if not dry_run:
Marc-André Lemburg03750792002-12-03 08:45:11 +0000486 if script_fd is not None:
487 script = os.fdopen(script_fd, "w")
488 else:
489 script = open(script_name, "w")
Greg Ward1297b5c2000-09-30 20:37:56 +0000490
491 script.write("""\
492from distutils.util import byte_compile
493files = [
494""")
Greg Ward9216cfe2000-10-03 03:31:05 +0000495
496 # XXX would be nice to write absolute filenames, just for
497 # safety's sake (script should be more robust in the face of
498 # chdir'ing before running it). But this requires abspath'ing
499 # 'prefix' as well, and that breaks the hack in build_lib's
500 # 'byte_compile()' method that carefully tacks on a trailing
501 # slash (os.sep really) to make sure the prefix here is "just
502 # right". This whole prefix business is rather delicate -- the
503 # problem is that it's really a directory, but I'm treating it
504 # as a dumb string, so trailing slashes and so forth matter.
505
506 #py_files = map(os.path.abspath, py_files)
507 #if prefix:
508 # prefix = os.path.abspath(prefix)
509
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000510 script.write(",\n".join(map(repr, py_files)) + "]\n")
Greg Ward1297b5c2000-09-30 20:37:56 +0000511 script.write("""
Walter Dörwald70a6b492004-02-12 17:35:32 +0000512byte_compile(files, optimize=%r, force=%r,
513 prefix=%r, base_dir=%r,
514 verbose=%r, dry_run=0,
Greg Ward1297b5c2000-09-30 20:37:56 +0000515 direct=1)
Walter Dörwald70a6b492004-02-12 17:35:32 +0000516""" % (optimize, force, prefix, base_dir, verbose))
Greg Ward1297b5c2000-09-30 20:37:56 +0000517
518 script.close()
519
520 cmd = [sys.executable, script_name]
521 if optimize == 1:
522 cmd.insert(1, "-O")
523 elif optimize == 2:
524 cmd.insert(1, "-OO")
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000525 spawn(cmd, dry_run=dry_run)
Greg Ward9216cfe2000-10-03 03:31:05 +0000526 execute(os.remove, (script_name,), "removing %s" % script_name,
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000527 dry_run=dry_run)
Fred Drakeb94b8492001-12-06 20:51:35 +0000528
Greg Ward1297b5c2000-09-30 20:37:56 +0000529 # "Direct" byte-compilation: use the py_compile module to compile
530 # right here, right now. Note that the script generated in indirect
531 # mode simply calls 'byte_compile()' in direct mode, a weird sort of
532 # cross-process recursion. Hey, it works!
533 else:
534 from py_compile import compile
535
536 for file in py_files:
537 if file[-3:] != ".py":
Greg Wardf217e212000-10-01 23:49:30 +0000538 # This lets us be lazy and not filter filenames in
539 # the "install_lib" command.
540 continue
Greg Ward1297b5c2000-09-30 20:37:56 +0000541
542 # Terminology from the py_compile module:
543 # cfile - byte-compiled file
544 # dfile - purported source filename (same as 'file' by default)
545 cfile = file + (__debug__ and "c" or "o")
546 dfile = file
547 if prefix:
548 if file[:len(prefix)] != prefix:
Tarek Ziadé36797272010-07-22 12:50:05 +0000549 raise ValueError("invalid prefix: filename %r doesn't start with %r"
550 % (file, prefix))
Greg Ward1297b5c2000-09-30 20:37:56 +0000551 dfile = dfile[len(prefix):]
552 if base_dir:
553 dfile = os.path.join(base_dir, dfile)
554
555 cfile_base = os.path.basename(cfile)
556 if direct:
557 if force or newer(file, cfile):
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000558 log.info("byte-compiling %s to %s", file, cfile_base)
Greg Ward1297b5c2000-09-30 20:37:56 +0000559 if not dry_run:
560 compile(file, cfile, dfile)
561 else:
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +0000562 log.debug("skipping byte-compilation of %s to %s",
563 file, cfile_base)
Greg Ward1297b5c2000-09-30 20:37:56 +0000564
Tarek Ziadé36797272010-07-22 12:50:05 +0000565# byte_compile ()
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000566
Tarek Ziadé36797272010-07-22 12:50:05 +0000567def rfc822_escape (header):
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000568 """Return a version of the string escaped for inclusion in an
Andrew M. Kuchling88b08842001-03-23 17:30:26 +0000569 RFC-822 header, by ensuring there are 8 spaces space after each newline.
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000570 """
Tarek Ziadédf872d42009-12-06 09:28:17 +0000571 lines = header.split('\n')
572 sep = '\n' + 8 * ' '
Neal Norwitz9d72bb42007-04-17 08:48:32 +0000573 return sep.join(lines)
Martin v. Löwis6178db62008-12-01 04:38:52 +0000574
575# 2to3 support
576
577def run_2to3(files, fixer_names=None, options=None, explicit=None):
578 """Invoke 2to3 on a list of Python files.
579 The files should all come from the build area, as the
580 modification is done in-place. To reduce the build time,
581 only files modified since the last invocation of this
582 function should be passed in the files argument."""
583
584 if not files:
585 return
586
587 # Make this class local, to delay import of 2to3
588 from lib2to3.refactor import RefactoringTool, get_fixers_from_package
589 class DistutilsRefactoringTool(RefactoringTool):
590 def log_error(self, msg, *args, **kw):
591 log.error(msg, *args)
592
593 def log_message(self, msg, *args):
594 log.info(msg, *args)
595
596 def log_debug(self, msg, *args):
597 log.debug(msg, *args)
598
599 if fixer_names is None:
600 fixer_names = get_fixers_from_package('lib2to3.fixes')
601 r = DistutilsRefactoringTool(fixer_names, options=options)
602 r.refactor(files, write=True)
603
Georg Brandl6d4a9cf2009-03-31 00:34:54 +0000604def copydir_run_2to3(src, dest, template=None, fixer_names=None,
605 options=None, explicit=None):
606 """Recursively copy a directory, only copying new and changed files,
607 running run_2to3 over all newly copied Python modules afterward.
608
609 If you give a template string, it's parsed like a MANIFEST.in.
610 """
611 from distutils.dir_util import mkpath
612 from distutils.file_util import copy_file
613 from distutils.filelist import FileList
614 filelist = FileList()
615 curdir = os.getcwd()
616 os.chdir(src)
617 try:
618 filelist.findall()
619 finally:
620 os.chdir(curdir)
621 filelist.files[:] = filelist.allfiles
622 if template:
623 for line in template.splitlines():
624 line = line.strip()
625 if not line: continue
626 filelist.process_template_line(line)
627 copied = []
628 for filename in filelist.files:
629 outname = os.path.join(dest, filename)
630 mkpath(os.path.dirname(outname))
631 res = copy_file(os.path.join(src, filename), outname, update=1)
632 if res[1]: copied.append(outname)
633 run_2to3([fn for fn in copied if fn.lower().endswith('.py')],
634 fixer_names=fixer_names, options=options, explicit=explicit)
635 return copied
636
Martin v. Löwis6178db62008-12-01 04:38:52 +0000637class Mixin2to3:
638 '''Mixin class for commands that run 2to3.
639 To configure 2to3, setup scripts may either change
640 the class variables, or inherit from individual commands
641 to override how 2to3 is invoked.'''
642
643 # provide list of fixers to run;
644 # defaults to all from lib2to3.fixers
645 fixer_names = None
646
647 # options dictionary
648 options = None
649
650 # list of fixers to invoke even though they are marked as explicit
651 explicit = None
652
653 def run_2to3(self, files):
654 return run_2to3(files, self.fixer_names, self.options, self.explicit)