blob: 2e4617ef277f10c0a369445fe52156169a167f38 [file] [log] [blame]
"""distutils.util

Miscellaneous utility functions -- anything that doesn't fit into
one of the other *util.py modules.
"""
Greg Ward2689e3d1999-03-22 14:52:19 +00006
Greg Ward3ce77fd2000-03-02 01:49:45 +00007__revision__ = "$Id$"
Greg Ward2689e3d1999-03-22 14:52:19 +00008
Jesus Cea4a8ba192012-01-18 03:51:38 +01009import sys, os, string, re, platform
Greg Ward1297b5c2000-09-30 20:37:56 +000010from distutils.errors import DistutilsPlatformError
11from distutils.dep_util import newer
Tarek Ziadédd7bef92010-03-05 00:16:02 +000012from distutils.spawn import spawn
Jeremy Hyltoncd8a1142002-06-04 20:14:43 +000013from distutils import log
Tarek Ziadéb9c1cfc2009-10-24 15:10:37 +000014from distutils.errors import DistutilsByteCompileError
Greg Wardaa458bc2000-04-22 15:14:58 +000015
def _macosx_release_tuple (release):
    """Turn a dotted Mac OS X release string such as '10.10' into a tuple
    of at most two integers, e.g. (10, 10), so that releases can be
    compared numerically.  Returns an empty tuple if 'release' contains
    no digits.
    """
    return tuple([int(part) for part in re.findall(r'\d+', release)[:2]])


def get_platform ():
    """Return a string that identifies the current platform.  This is used
    mainly to distinguish platform-specific build directories and
    platform-specific built distributions.  Typically includes the OS name
    and version and the architecture (as supplied by 'os.uname()'),
    although the exact information included depends on the OS; eg. for IRIX
    the architecture isn't particularly important (IRIX only runs on SGI
    hardware), but for Linux the kernel version isn't particularly
    important.

    Examples of returned values:
       linux-i586
       linux-alpha (?)
       solaris-2.6-sun4u
       irix-5.3
       irix64-6.2

    Windows will return one of:
       win-amd64 (64bit Windows on AMD64 (aka x86_64, Intel64, EM64T, etc)
       win-ia64 (64bit Windows on Itanium)
       win32 (all others - specifically, sys.platform is returned)

    For other non-POSIX platforms, currently just returns 'sys.platform'.

    Raises ValueError on Mac OS X if CFLAGS names a combination of
    '-arch' values that has no known machine name.
    """
    if os.name == 'nt':
        # sniff sys.version for architecture.
        prefix = " bit ("
        i = sys.version.find(prefix)
        if i == -1:
            return sys.platform
        j = sys.version.find(")", i)
        look = sys.version[i+len(prefix):j].lower()
        if look == 'amd64':
            return 'win-amd64'
        if look == 'itanium':
            return 'win-ia64'
        return sys.platform

    if os.name != "posix" or not hasattr(os, 'uname'):
        # XXX what about the architecture? NT is Intel or Alpha,
        # Mac OS is M68k or PPC, etc.
        return sys.platform

    # Try to distinguish various flavours of Unix

    (osname, host, release, version, machine) = os.uname()

    # Convert the OS name to lowercase, remove '/' characters
    # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh")
    osname = osname.lower().replace('/', '')
    machine = machine.replace(' ', '_').replace('/', '-')

    if osname[:5] == "linux":
        # At least on Linux/Intel, 'machine' is the processor --
        # i386, etc.
        # XXX what about Alpha, SPARC, etc?
        return "%s-%s" % (osname, machine)
    elif osname[:5] == "sunos":
        if release[0] >= "5":           # SunOS 5 == Solaris 2
            osname = "solaris"
            release = "%d.%s" % (int(release[0]) - 3, release[2:])
            machine += ".%s" % platform.architecture()[0]
        # fall through to standard osname-release-machine representation
    elif osname[:4] == "irix":              # could be "irix64"!
        return "%s-%s" % (osname, release)
    elif osname[:3] == "aix":
        return "%s-%s.%s" % (osname, version, release)
    elif osname[:6] == "cygwin":
        osname = "cygwin"
        rel_re = re.compile(r'[\d.]+')
        m = rel_re.match(release)
        if m:
            release = m.group()
    elif osname[:6] == "darwin":
        #
        # For our purposes, we'll assume that the system version from
        # distutils' perspective is what MACOSX_DEPLOYMENT_TARGET is set
        # to. This makes the compatibility story a bit more sane because the
        # machine is going to compile and link as if it were
        # MACOSX_DEPLOYMENT_TARGET.
        from distutils.sysconfig import get_config_vars
        cfgvars = get_config_vars()

        macver = cfgvars.get('MACOSX_DEPLOYMENT_TARGET')

        # Always calculate the release of the running machine,
        # needed to determine if we can build fat binaries or not.
        macrelease = macver
        # Get the system version. Reading this plist is a documented
        # way to get the system version (see the documentation for
        # the Gestalt Manager)
        try:
            f = open('/System/Library/CoreServices/SystemVersion.plist')
        except IOError:
            # We're on a plain darwin box, fall back to the default
            # behaviour.
            pass
        else:
            try:
                m = re.search(
                        r'<key>ProductUserVisibleVersion</key>\s*' +
                        r'<string>(.*?)</string>', f.read())
                if m is not None:
                    macrelease = '.'.join(m.group(1).split('.')[:2])
                # else: fall back to the default behaviour
            finally:
                f.close()

        if not macver:
            macver = macrelease

        if macver:
            release = macver
            osname = "macosx"

            # Compare releases numerically: as strings, '10.10.' sorts
            # *before* '10.4.', which wrongly disabled fat-binary
            # detection on 10.10 and later.
            if _macosx_release_tuple(macrelease) >= (10, 4) and \
                    '-arch' in cfgvars.get('CFLAGS', '').strip():
                # The universal build will build fat binaries, but not on
                # systems before 10.4
                #
                # Try to detect 4-way universal builds, those have machine-type
                # 'universal' instead of 'fat'.

                machine = 'fat'
                cflags = cfgvars.get('CFLAGS')

                archs = re.findall(r'-arch\s+(\S+)', cflags)
                archs = tuple(sorted(set(archs)))

                if len(archs) == 1:
                    machine = archs[0]
                elif archs == ('i386', 'ppc'):
                    machine = 'fat'
                elif archs == ('i386', 'x86_64'):
                    machine = 'intel'
                elif archs == ('i386', 'ppc', 'x86_64'):
                    machine = 'fat3'
                elif archs == ('ppc64', 'x86_64'):
                    machine = 'fat64'
                elif archs == ('i386', 'ppc', 'ppc64', 'x86_64'):
                    machine = 'universal'
                else:
                    raise ValueError(
                       "Don't know machine value for archs=%r"%(archs,))

            elif machine == 'i386':
                # On OSX the machine type returned by uname is always the
                # 32-bit variant, even if the executable architecture is
                # the 64-bit variant
                if sys.maxsize >= 2**32:
                    machine = 'x86_64'

            elif machine in ('PowerPC', 'Power_Macintosh'):
                # Pick a sane name for the PPC architecture.
                machine = 'ppc'

                # See 'i386' case
                if sys.maxsize >= 2**32:
                    machine = 'ppc64'

    return "%s-%s-%s" % (osname, release, machine)

# get_platform ()
184
185
def convert_path (pathname):
    """Return 'pathname' as a name that will work on the native filesystem,
    i.e. split it on '/' and put it back together again using the current
    directory separator.  Needed because filenames in the setup script are
    always supplied in Unix style, and have to be converted to the local
    convention before we can actually use them in the filesystem.  Raises
    ValueError on non-Unix-ish systems if 'pathname' either starts or
    ends with a slash.

    An empty 'pathname' is returned unchanged; a 'pathname' made up only
    of '.' components is converted to 'os.curdir'.
    """
    if os.sep == '/':
        # Already in native form: nothing to convert (and no validation).
        return pathname
    if not pathname:
        return pathname
    if pathname[0] == '/':
        raise ValueError("path '%s' cannot be absolute" % pathname)
    if pathname[-1] == '/':
        raise ValueError("path '%s' cannot end with '/'" % pathname)

    # Drop every '.' component in a single pass.
    paths = [part for part in pathname.split('/') if part != '.']
    if not paths:
        return os.curdir
    return os.path.join(*paths)

# convert_path ()
Greg Ward1b4ede52000-03-22 00:22:44 +0000212
213
def change_root (new_root, pathname):
    """Return 'pathname' with 'new_root' prepended.  If 'pathname' is
    relative, this is equivalent to "os.path.join(new_root,pathname)".
    Otherwise, it requires making 'pathname' relative and then joining the
    two, which is tricky on DOS/Windows and Mac OS.

    Raises DistutilsPlatformError if 'os.name' is not one of 'posix',
    'nt' or 'os2'.
    """
    if os.name == 'posix':
        if not os.path.isabs(pathname):
            return os.path.join(new_root, pathname)
        else:
            return os.path.join(new_root, pathname[1:])

    elif os.name == 'nt':
        (drive, path) = os.path.splitdrive(pathname)
        # Slice rather than index so that an empty path (e.g. a bare
        # drive such as "C:") doesn't raise IndexError.
        if path[:1] == '\\':
            path = path[1:]
        return os.path.join(new_root, path)

    elif os.name == 'os2':
        (drive, path) = os.path.splitdrive(pathname)
        if path[:1] == os.sep:
            path = path[1:]
        return os.path.join(new_root, path)

    else:
        raise DistutilsPlatformError(
              "nothing known about platform '%s'" % os.name)
241
Greg Ward67f75d42000-04-27 01:53:46 +0000242
# Set to 1 once 'check_environ()' has run, so the work is done only once
# per process.
_environ_checked = 0
def check_environ ():
    """Ensure that 'os.environ' has all the environment variables we
    guarantee that users can use in config files, command-line options,
    etc.  Currently this includes:
      HOME - user's home directory (Unix only)
      PLAT - description of the current platform, including hardware
             and OS (see 'get_platform()')

    Variables that are already set are left untouched.  HOME is left
    unset if the current user has no entry in the password database.
    """
    global _environ_checked
    if _environ_checked:
        return

    if os.name == 'posix' and 'HOME' not in os.environ:
        try:
            import pwd
            os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
        except (ImportError, KeyError):
            # The current uid may have no passwd entry (common in
            # containers and chroots); a missing HOME is better than
            # crashing every caller.
            pass

    if 'PLAT' not in os.environ:
        os.environ['PLAT'] = get_platform()

    _environ_checked = 1
264
Greg Ward1b4ede52000-03-22 00:22:44 +0000265
def subst_vars (s, local_vars):
    """Perform shell/Perl-style variable substitution on 's'.  Every
    occurrence of '$' followed by a name is considered a variable, and
    variable is substituted by the value found in the 'local_vars'
    dictionary, or in 'os.environ' if it's not in 'local_vars'.
    'os.environ' is first checked/augmented to guarantee that it contains
    certain values: see 'check_environ()'.  Raise ValueError for any
    variables not found in either 'local_vars' or 'os.environ'.
    """
    check_environ()
    def _subst (match, local_vars=local_vars):
        var_name = match.group(1)
        if var_name in local_vars:
            # values in 'local_vars' need not be strings
            return str(local_vars[var_name])
        else:
            return os.environ[var_name]

    try:
        return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
    except KeyError as var:
        # the 'os.environ' lookup failed: report it as a bad variable
        raise ValueError("invalid variable '$%s'" % var)

# subst_vars ()
Greg Ward7c1a6d42000-03-29 02:48:40 +0000289
Tarek Ziadédd7bef92010-03-05 00:16:02 +0000290
def grok_environment_error (exc, prefix="error: "):
    """Generate a useful error message from an EnvironmentError (IOError or
    OSError) exception object.  Does what it can to deal with exception
    objects that don't have a filename (which happens when the error is
    due to a two-file operation, such as 'rename()' or 'link()'), and
    with exceptions that carry no 'strerror' at all.  Returns the error
    message as a string prefixed with 'prefix'.
    """
    strerror = getattr(exc, 'strerror', None)
    if hasattr(exc, 'filename') and strerror is not None:
        if exc.filename:
            error = prefix + "%s: %s" % (exc.filename, strerror)
        else:
            # two-argument functions in posix module don't
            # include the filename in the exception object!
            error = prefix + "%s" % strerror
    else:
        # No usable 'strerror' (plain exception, or an EnvironmentError
        # built from a single message): use the last constructor
        # argument, or the exception's own text if it has none.
        args = getattr(exc, 'args', ())
        if args:
            error = prefix + str(args[-1])
        else:
            error = prefix + str(exc)

    return error
Greg Ward6a2a3db2000-06-24 20:40:02 +0000311
Tarek Ziadédd7bef92010-03-05 00:16:02 +0000312
# Needed by 'split_quoted()'; compiled lazily on first use.
_wordchars_re = _squote_re = _dquote_re = None
def _init_regex():
    """Compile the regexes used by 'split_quoted()': a run of ordinary
    word characters, a single-quoted string and a double-quoted string.
    """
    global _wordchars_re, _squote_re, _dquote_re
    _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
    _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
    _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')

def split_quoted (s):
    """Split a string up according to Unix shell-like rules for quotes and
    backslashes.  In short: words are delimited by spaces, as long as those
    spaces are not escaped by a backslash, or inside a quoted string.
    Single and double quotes are equivalent, and the quote characters can
    be backslash-escaped.  The backslash is stripped from any two-character
    escape sequence, leaving only the escaped character.  The quote
    characters are stripped from any quoted string.  Returns a list of
    words.  Raises ValueError if a quoted string is not terminated.
    """

    # This is a nice algorithm for splitting up a single string, since it
    # doesn't require character-by-character examination.  It was a little
    # bit of a brain-bender to get it working right, though...
    if _wordchars_re is None: _init_regex()

    s = s.strip()
    words = []
    pos = 0

    # Invariant: s[:pos] is the already-unescaped start of the current
    # word; everything before the current word has been cut off 's'.
    while s:
        m = _wordchars_re.match(s, pos)
        end = m.end()
        if end == len(s):
            words.append(s[:end])
            break

        if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
            words.append(s[:end])       # we definitely have a word delimiter
            s = s[end:].lstrip()
            pos = 0

        elif s[end] == '\\':            # preserve whatever is being escaped;
                                        # will become part of the current word
            s = s[:end] + s[end+1:]
            pos = end+1

        else:
            if s[end] == "'":           # slurp singly-quoted string
                m = _squote_re.match(s, end)
            elif s[end] == '"':         # slurp doubly-quoted string
                m = _dquote_re.match(s, end)
            else:
                raise RuntimeError(
                      "this can't happen (bad char '%c')" % s[end])

            if m is None:
                raise ValueError(
                      "bad string (mismatched %s quotes?)" % s[end])

            # Cut the two quote characters out of 's'; the quoted text
            # stays as part of the current word.
            (beg, end) = m.span()
            s = s[:beg] + s[beg+1:end-1] + s[end:]
            pos = m.end() - 2

        if pos >= len(s):
            words.append(s)
            break

    return words

# split_quoted ()
Greg Ward1c16ac32000-08-02 01:37:30 +0000382
383
def execute (func, args, msg=None, verbose=0, dry_run=0):
    """Run 'func(*args)', an action that affects the outside world (eg.
    by writing to the filesystem), unless 'dry_run' is true.  'msg' is
    logged at "info" level whether or not the action is run; if it is
    None, a message is built from the name of 'func' and 'args'.
    'verbose' is accepted but not used here.
    """
    if msg is None:
        call_repr = "%s%r" % (func.__name__, args)
        # the repr of a one-element tuple ends in ",)": drop the comma
        if call_repr.endswith(',)'):
            call_repr = call_repr[:-2] + ')'
        msg = call_repr

    log.info(msg)
    if dry_run:
        return
    func(*args)
Greg Ward1c16ac32000-08-02 01:37:30 +0000401
Greg Ward817dc092000-09-25 01:25:06 +0000402
def strtobool (val):
    """Convert a string representation of truth to true (1) or false (0).

    True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
    are 'n', 'no', 'f', 'false', 'off', and '0'.  The comparison ignores
    case.  Raises ValueError if 'val' is anything else.
    """
    val = val.lower()
    if val in ('y', 'yes', 't', 'true', 'on', '1'):
        return 1
    elif val in ('n', 'no', 'f', 'false', 'off', '0'):
        return 0
    else:
        raise ValueError("invalid truth value %r" % (val,))
Greg Ward1297b5c2000-09-30 20:37:56 +0000417
418
def byte_compile (py_files,
                  optimize=0, force=0,
                  prefix=None, base_dir=None,
                  verbose=1, dry_run=0,
                  direct=None):
    """Byte-compile a collection of Python source files to either .pyc
    or .pyo files in the same directory.  'py_files' is a list of files
    to compile; any files that don't end in ".py" are silently skipped.
    'optimize' must be one of the following:
      0 - don't optimize (generate .pyc)
      1 - normal optimization (like "python -O")
      2 - extra optimization (like "python -OO")
    If 'force' is true, all files are recompiled regardless of
    timestamps.

    The source filename encoded in each bytecode file defaults to the
    filenames listed in 'py_files'; you can modify these with 'prefix' and
    'base_dir'.  'prefix' is a string that will be stripped off of each
    source filename, and 'base_dir' is a directory name that will be
    prepended (after 'prefix' is stripped).  You can supply either or both
    (or neither) of 'prefix' and 'base_dir', as you wish.

    If 'dry_run' is true, doesn't actually do anything that would
    affect the filesystem.

    Byte-compilation is either done directly in this interpreter process
    with the standard py_compile module, or indirectly by writing a
    temporary script and executing it.  Normally, you should let
    'byte_compile()' figure out to use direct compilation or not (see
    the source for details).  The 'direct' flag is used by the script
    generated in indirect mode; unless you know what you're doing, leave
    it set to None.

    Raises DistutilsByteCompileError if 'sys.dont_write_bytecode' is
    set, and ValueError if a filename does not start with 'prefix'.
    """
    # nothing is done if sys.dont_write_bytecode is True
    if sys.dont_write_bytecode:
        raise DistutilsByteCompileError('byte-compiling is disabled.')

    # First, if the caller didn't force us into direct or indirect mode,
    # figure out which mode we should be in.  We take a conservative
    # approach: choose direct mode *only* if the current interpreter is
    # in debug mode and optimize is 0.  If we're not in debug mode (-O
    # or -OO), we don't know which level of optimization this
    # interpreter is running with, so we can't do direct
    # byte-compilation and be certain that it's the right thing.  Thus,
    # always compile indirectly if the current interpreter is in either
    # optimize mode, or if either optimization level was requested by
    # the caller.
    if direct is None:
        direct = (__debug__ and optimize == 0)

    # "Indirect" byte-compilation: write a temporary script and then
    # run it with the appropriate flags.
    if not direct:
        from tempfile import mkstemp
        (script_fd, script_name) = mkstemp(".py")
        log.info("writing byte-compilation script '%s'", script_name)
        if dry_run:
            # mkstemp() has already created and opened the file; release
            # both so a dry run leaves nothing behind.
            os.close(script_fd)
            os.remove(script_name)
        else:
            script = os.fdopen(script_fd, "w")
            try:
                script.write("""\
from distutils.util import byte_compile
files = [
""")

                # XXX would be nice to write absolute filenames, just for
                # safety's sake (script should be more robust in the face of
                # chdir'ing before running it).  But this requires abspath'ing
                # 'prefix' as well, and that breaks the hack in build_lib's
                # 'byte_compile()' method that carefully tacks on a trailing
                # slash (os.sep really) to make sure the prefix here is "just
                # right".  This whole prefix business is rather delicate -- the
                # problem is that it's really a directory, but I'm treating it
                # as a dumb string, so trailing slashes and so forth matter.

                script.write(",\n".join(map(repr, py_files)) + "]\n")
                script.write("""
byte_compile(files, optimize=%r, force=%r,
             prefix=%r, base_dir=%r,
             verbose=%r, dry_run=0,
             direct=1)
""" % (optimize, force, prefix, base_dir, verbose))
            finally:
                # close the script even if a write fails
                script.close()

        cmd = [sys.executable, script_name]
        if optimize == 1:
            cmd.insert(1, "-O")
        elif optimize == 2:
            cmd.insert(1, "-OO")
        try:
            spawn(cmd, dry_run=dry_run)
        finally:
            # remove the temporary script even if the child process fails
            execute(os.remove, (script_name,), "removing %s" % script_name,
                    dry_run=dry_run)

    # "Direct" byte-compilation: use the py_compile module to compile
    # right here, right now.  Note that the script generated in indirect
    # mode simply calls 'byte_compile()' in direct mode, a weird sort of
    # cross-process recursion.  Hey, it works!
    else:
        import py_compile

        for py_file in py_files:
            if py_file[-3:] != ".py":
                # This lets us be lazy and not filter filenames in
                # the "install_lib" command.
                continue

            # Terminology from the py_compile module:
            #   cfile - byte-compiled file
            #   dfile - purported source filename (same as 'py_file' by
            #           default)
            if __debug__:
                cfile = py_file + "c"
            else:
                cfile = py_file + "o"
            dfile = py_file
            if prefix:
                if py_file[:len(prefix)] != prefix:
                    raise ValueError(
                          "invalid prefix: filename %r doesn't start with %r"
                          % (py_file, prefix))
                dfile = dfile[len(prefix):]
            if base_dir:
                dfile = os.path.join(base_dir, dfile)

            cfile_base = os.path.basename(cfile)
            if force or newer(py_file, cfile):
                log.info("byte-compiling %s to %s", py_file, cfile_base)
                if not dry_run:
                    py_compile.compile(py_file, cfile, dfile)
            else:
                log.debug("skipping byte-compilation of %s to %s",
                          py_file, cfile_base)

# byte_compile ()
Andrew M. Kuchlingdf66df02001-03-22 03:03:41 +0000561
def rfc822_escape (header):
    """Return a version of the string escaped for inclusion in an
    RFC-822 header, by ensuring there are 8 spaces after each newline.
    """
    lines = header.split('\n')
    # the 8 spaces after each newline mark the following line as a
    # continuation of the header
    return ('\n' + 8*' ').join(lines)