blob: 6024911464ae2e3d5dfeb0cc194bdb969bbdb33c [file] [log] [blame]
Tor Norbye3a2425a2013-11-04 10:16:08 -08001"""distutils.util
2
3Miscellaneous utility functions -- anything that doesn't fit into
4one of the other *util.py modules.
5"""
6
7__revision__ = "$Id: util.py 59116 2007-11-22 10:14:26Z ronald.oussoren $"
8
9import sys, os, string, re
10from distutils.errors import DistutilsPlatformError
11from distutils.dep_util import newer
12from distutils.spawn import spawn
13from distutils import log
14
15def get_platform ():
16 """Return a string that identifies the current platform. This is used
17 mainly to distinguish platform-specific build directories and
18 platform-specific built distributions. Typically includes the OS name
19 and version and the architecture (as supplied by 'os.uname()'),
20 although the exact information included depends on the OS; eg. for IRIX
21 the architecture isn't particularly important (IRIX only runs on SGI
22 hardware), but for Linux the kernel version isn't particularly
23 important.
24
25 Examples of returned values:
26 linux-i586
27 linux-alpha (?)
28 solaris-2.6-sun4u
29 irix-5.3
30 irix64-6.2
31
32 For non-POSIX platforms, currently just returns 'sys.platform'.
33 """
34 if os.name != "posix" or not hasattr(os, 'uname'):
35 # XXX what about the architecture? NT is Intel or Alpha,
36 # Mac OS is M68k or PPC, etc.
37 return sys.platform
38
39 # Try to distinguish various flavours of Unix
40
41 (osname, host, release, version, machine) = os.uname()
42
43 # Convert the OS name to lowercase, remove '/' characters
44 # (to accommodate BSD/OS), and translate spaces (for "Power Macintosh")
45 osname = string.lower(osname)
46 osname = string.replace(osname, '/', '')
47 machine = string.replace(machine, ' ', '_')
48 machine = string.replace(machine, '/', '-')
49
50 if osname[:5] == "linux":
51 # At least on Linux/Intel, 'machine' is the processor --
52 # i386, etc.
53 # XXX what about Alpha, SPARC, etc?
54 return "%s-%s" % (osname, machine)
55 elif osname[:5] == "sunos":
56 if release[0] >= "5": # SunOS 5 == Solaris 2
57 osname = "solaris"
58 release = "%d.%s" % (int(release[0]) - 3, release[2:])
59 # fall through to standard osname-release-machine representation
60 elif osname[:4] == "irix": # could be "irix64"!
61 return "%s-%s" % (osname, release)
62 elif osname[:3] == "aix":
63 return "%s-%s.%s" % (osname, version, release)
64 elif osname[:6] == "cygwin":
65 osname = "cygwin"
66 rel_re = re.compile (r'[\d.]+')
67 m = rel_re.match(release)
68 if m:
69 release = m.group()
70 elif osname[:6] == "darwin":
71 #
72 # For our purposes, we'll assume that the system version from
73 # distutils' perspective is what MACOSX_DEPLOYMENT_TARGET is set
74 # to. This makes the compatibility story a bit more sane because the
75 # machine is going to compile and link as if it were
76 # MACOSX_DEPLOYMENT_TARGET.
77 from distutils.sysconfig import get_config_vars
78 cfgvars = get_config_vars()
79
80 macver = os.environ.get('MACOSX_DEPLOYMENT_TARGET')
81 if not macver:
82 macver = cfgvars.get('MACOSX_DEPLOYMENT_TARGET')
83
84 if not macver:
85 # Get the system version. Reading this plist is a documented
86 # way to get the system version (see the documentation for
87 # the Gestalt Manager)
88 try:
89 f = open('/System/Library/CoreServices/SystemVersion.plist')
90 except IOError:
91 # We're on a plain darwin box, fall back to the default
92 # behaviour.
93 pass
94 else:
95 m = re.search(
96 r'<key>ProductUserVisibleVersion</key>\s*' +
97 r'<string>(.*?)</string>', f.read())
98 f.close()
99 if m is not None:
100 macver = '.'.join(m.group(1).split('.')[:2])
101 # else: fall back to the default behaviour
102
103 if macver:
104 from distutils.sysconfig import get_config_vars
105 release = macver
106 osname = "macosx"
107
108
109 if (release + '.') >= '10.4.' and \
110 get_config_vars().get('UNIVERSALSDK', '').strip():
111 # The universal build will build fat binaries, but not on
112 # systems before 10.4
113 machine = 'fat'
114
115 elif machine in ('PowerPC', 'Power_Macintosh'):
116 # Pick a sane name for the PPC architecture.
117 machine = 'ppc'
118
119 return "%s-%s-%s" % (osname, release, machine)
120
121# get_platform ()
122
123
124def convert_path (pathname):
125 """Return 'pathname' as a name that will work on the native filesystem,
126 i.e. split it on '/' and put it back together again using the current
127 directory separator. Needed because filenames in the setup script are
128 always supplied in Unix style, and have to be converted to the local
129 convention before we can actually use them in the filesystem. Raises
130 ValueError on non-Unix-ish systems if 'pathname' either starts or
131 ends with a slash.
132 """
133 if os.sep == '/':
134 return pathname
135 if not pathname:
136 return pathname
137 if pathname[0] == '/':
138 raise ValueError, "path '%s' cannot be absolute" % pathname
139 if pathname[-1] == '/':
140 raise ValueError, "path '%s' cannot end with '/'" % pathname
141
142 paths = string.split(pathname, '/')
143 while '.' in paths:
144 paths.remove('.')
145 if not paths:
146 return os.curdir
147 return apply(os.path.join, paths)
148
149# convert_path ()
150
151
152def change_root (new_root, pathname):
153 """Return 'pathname' with 'new_root' prepended. If 'pathname' is
154 relative, this is equivalent to "os.path.join(new_root,pathname)".
155 Otherwise, it requires making 'pathname' relative and then joining the
156 two, which is tricky on DOS/Windows and Mac OS.
157 """
158 os_name = os._name if sys.platform.startswith('java') else os.name
159 if os_name == 'posix':
160 if not os.path.isabs(pathname):
161 return os.path.join(new_root, pathname)
162 else:
163 return os.path.join(new_root, pathname[1:])
164
165 elif os_name == 'nt':
166 (drive, path) = os.path.splitdrive(pathname)
167 if path[0] == '\\':
168 path = path[1:]
169 return os.path.join(new_root, path)
170
171 elif os_name == 'os2':
172 (drive, path) = os.path.splitdrive(pathname)
173 if path[0] == os.sep:
174 path = path[1:]
175 return os.path.join(new_root, path)
176
177 elif os_name == 'mac':
178 if not os.path.isabs(pathname):
179 return os.path.join(new_root, pathname)
180 else:
181 # Chop off volume name from start of path
182 elements = string.split(pathname, ":", 1)
183 pathname = ":" + elements[1]
184 return os.path.join(new_root, pathname)
185
186 else:
187 raise DistutilsPlatformError, \
188 "nothing known about platform '%s'" % os_name
189
190
191_environ_checked = 0
192def check_environ ():
193 """Ensure that 'os.environ' has all the environment variables we
194 guarantee that users can use in config files, command-line options,
195 etc. Currently this includes:
196 HOME - user's home directory (Unix only)
197 PLAT - description of the current platform, including hardware
198 and OS (see 'get_platform()')
199 """
200 global _environ_checked
201 if _environ_checked:
202 return
203
204 if os.name == 'posix' and not os.environ.has_key('HOME'):
205 import pwd
206 os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
207
208 if not os.environ.has_key('PLAT'):
209 os.environ['PLAT'] = get_platform()
210
211 _environ_checked = 1
212
213
214def subst_vars (s, local_vars):
215 """Perform shell/Perl-style variable substitution on 'string'. Every
216 occurrence of '$' followed by a name is considered a variable, and
217 variable is substituted by the value found in the 'local_vars'
218 dictionary, or in 'os.environ' if it's not in 'local_vars'.
219 'os.environ' is first checked/augmented to guarantee that it contains
220 certain values: see 'check_environ()'. Raise ValueError for any
221 variables not found in either 'local_vars' or 'os.environ'.
222 """
223 check_environ()
224 def _subst (match, local_vars=local_vars):
225 var_name = match.group(1)
226 if local_vars.has_key(var_name):
227 return str(local_vars[var_name])
228 else:
229 return os.environ[var_name]
230
231 try:
232 return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
233 except KeyError, var:
234 raise ValueError, "invalid variable '$%s'" % var
235
236# subst_vars ()
237
238
239def grok_environment_error (exc, prefix="error: "):
240 """Generate a useful error message from an EnvironmentError (IOError or
241 OSError) exception object. Handles Python 1.5.1 and 1.5.2 styles, and
242 does what it can to deal with exception objects that don't have a
243 filename (which happens when the error is due to a two-file operation,
244 such as 'rename()' or 'link()'. Returns the error message as a string
245 prefixed with 'prefix'.
246 """
247 # check for Python 1.5.2-style {IO,OS}Error exception objects
248 if hasattr(exc, 'filename') and hasattr(exc, 'strerror'):
249 if exc.filename:
250 error = prefix + "%s: %s" % (exc.filename, exc.strerror)
251 else:
252 # two-argument functions in posix module don't
253 # include the filename in the exception object!
254 error = prefix + "%s" % exc.strerror
255 else:
256 error = prefix + str(exc[-1])
257
258 return error
259
260
261# Needed by 'split_quoted()'
262_wordchars_re = _squote_re = _dquote_re = None
263def _init_regex():
264 global _wordchars_re, _squote_re, _dquote_re
265 _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
266 _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
267 _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')
268
269def split_quoted (s):
270 """Split a string up according to Unix shell-like rules for quotes and
271 backslashes. In short: words are delimited by spaces, as long as those
272 spaces are not escaped by a backslash, or inside a quoted string.
273 Single and double quotes are equivalent, and the quote characters can
274 be backslash-escaped. The backslash is stripped from any two-character
275 escape sequence, leaving only the escaped character. The quote
276 characters are stripped from any quoted string. Returns a list of
277 words.
278 """
279
280 # This is a nice algorithm for splitting up a single string, since it
281 # doesn't require character-by-character examination. It was a little
282 # bit of a brain-bender to get it working right, though...
283 if _wordchars_re is None: _init_regex()
284
285 s = string.strip(s)
286 words = []
287 pos = 0
288
289 while s:
290 m = _wordchars_re.match(s, pos)
291 end = m.end()
292 if end == len(s):
293 words.append(s[:end])
294 break
295
296 if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
297 words.append(s[:end]) # we definitely have a word delimiter
298 s = string.lstrip(s[end:])
299 pos = 0
300
301 elif s[end] == '\\': # preserve whatever is being escaped;
302 # will become part of the current word
303 s = s[:end] + s[end+1:]
304 pos = end+1
305
306 else:
307 if s[end] == "'": # slurp singly-quoted string
308 m = _squote_re.match(s, end)
309 elif s[end] == '"': # slurp doubly-quoted string
310 m = _dquote_re.match(s, end)
311 else:
312 raise RuntimeError, \
313 "this can't happen (bad char '%c')" % s[end]
314
315 if m is None:
316 raise ValueError, \
317 "bad string (mismatched %s quotes?)" % s[end]
318
319 (beg, end) = m.span()
320 s = s[:beg] + s[beg+1:end-1] + s[end:]
321 pos = m.end() - 2
322
323 if pos >= len(s):
324 words.append(s)
325 break
326
327 return words
328
329# split_quoted ()
330
331
332def execute (func, args, msg=None, verbose=0, dry_run=0):
333 """Perform some action that affects the outside world (eg. by
334 writing to the filesystem). Such actions are special because they
335 are disabled by the 'dry_run' flag. This method takes care of all
336 that bureaucracy for you; all you have to do is supply the
337 function to call and an argument tuple for it (to embody the
338 "external action" being performed), and an optional message to
339 print.
340 """
341 if msg is None:
342 msg = "%s%r" % (func.__name__, args)
343 if msg[-2:] == ',)': # correct for singleton tuple
344 msg = msg[0:-2] + ')'
345
346 log.info(msg)
347 if not dry_run:
348 apply(func, args)
349
350
351def strtobool (val):
352 """Convert a string representation of truth to true (1) or false (0).
353
354 True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
355 are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if
356 'val' is anything else.
357 """
358 val = string.lower(val)
359 if val in ('y', 'yes', 't', 'true', 'on', '1'):
360 return 1
361 elif val in ('n', 'no', 'f', 'false', 'off', '0'):
362 return 0
363 else:
364 raise ValueError, "invalid truth value %r" % (val,)
365
366
367def byte_compile (py_files,
368 optimize=0, force=0,
369 prefix=None, base_dir=None,
370 verbose=1, dry_run=0,
371 direct=None):
372 """Byte-compile a collection of Python source files to either .pyc
373 or .pyo files in the same directory. 'py_files' is a list of files
374 to compile; any files that don't end in ".py" are silently skipped.
375 'optimize' must be one of the following:
376 0 - don't optimize (generate .pyc)
377 1 - normal optimization (like "python -O")
378 2 - extra optimization (like "python -OO")
379 If 'force' is true, all files are recompiled regardless of
380 timestamps.
381
382 The source filename encoded in each bytecode file defaults to the
383 filenames listed in 'py_files'; you can modify these with 'prefix' and
384 'basedir'. 'prefix' is a string that will be stripped off of each
385 source filename, and 'base_dir' is a directory name that will be
386 prepended (after 'prefix' is stripped). You can supply either or both
387 (or neither) of 'prefix' and 'base_dir', as you wish.
388
389 If 'dry_run' is true, doesn't actually do anything that would
390 affect the filesystem.
391
392 Byte-compilation is either done directly in this interpreter process
393 with the standard py_compile module, or indirectly by writing a
394 temporary script and executing it. Normally, you should let
395 'byte_compile()' figure out to use direct compilation or not (see
396 the source for details). The 'direct' flag is used by the script
397 generated in indirect mode; unless you know what you're doing, leave
398 it set to None.
399 """
400
401 # First, if the caller didn't force us into direct or indirect mode,
402 # figure out which mode we should be in. We take a conservative
403 # approach: choose direct mode *only* if the current interpreter is
404 # in debug mode and optimize is 0. If we're not in debug mode (-O
405 # or -OO), we don't know which level of optimization this
406 # interpreter is running with, so we can't do direct
407 # byte-compilation and be certain that it's the right thing. Thus,
408 # always compile indirectly if the current interpreter is in either
409 # optimize mode, or if either optimization level was requested by
410 # the caller.
411 if direct is None:
412 direct = (__debug__ and optimize == 0)
413
414 # "Indirect" byte-compilation: write a temporary script and then
415 # run it with the appropriate flags.
416 if not direct:
417 try:
418 from tempfile import mkstemp
419 (script_fd, script_name) = mkstemp(".py")
420 except ImportError:
421 from tempfile import mktemp
422 (script_fd, script_name) = None, mktemp(".py")
423 log.info("writing byte-compilation script '%s'", script_name)
424 if not dry_run:
425 if script_fd is not None:
426 script = os.fdopen(script_fd, "w")
427 else:
428 script = open(script_name, "w")
429
430 script.write("""\
431from distutils.util import byte_compile
432files = [
433""")
434
435 # XXX would be nice to write absolute filenames, just for
436 # safety's sake (script should be more robust in the face of
437 # chdir'ing before running it). But this requires abspath'ing
438 # 'prefix' as well, and that breaks the hack in build_lib's
439 # 'byte_compile()' method that carefully tacks on a trailing
440 # slash (os.sep really) to make sure the prefix here is "just
441 # right". This whole prefix business is rather delicate -- the
442 # problem is that it's really a directory, but I'm treating it
443 # as a dumb string, so trailing slashes and so forth matter.
444
445 #py_files = map(os.path.abspath, py_files)
446 #if prefix:
447 # prefix = os.path.abspath(prefix)
448
449 script.write(string.join(map(repr, py_files), ",\n") + "]\n")
450 script.write("""
451byte_compile(files, optimize=%r, force=%r,
452 prefix=%r, base_dir=%r,
453 verbose=%r, dry_run=0,
454 direct=1)
455""" % (optimize, force, prefix, base_dir, verbose))
456
457 script.close()
458
459 cmd = [sys.executable, script_name]
460 if optimize == 1:
461 cmd.insert(1, "-O")
462 elif optimize == 2:
463 cmd.insert(1, "-OO")
464 spawn(cmd, dry_run=dry_run)
465 execute(os.remove, (script_name,), "removing %s" % script_name,
466 dry_run=dry_run)
467
468 # "Direct" byte-compilation: use the py_compile module to compile
469 # right here, right now. Note that the script generated in indirect
470 # mode simply calls 'byte_compile()' in direct mode, a weird sort of
471 # cross-process recursion. Hey, it works!
472 else:
473 from py_compile import compile
474
475 for file in py_files:
476 if file[-3:] != ".py":
477 # This lets us be lazy and not filter filenames in
478 # the "install_lib" command.
479 continue
480
481 # Terminology from the py_compile module:
482 # cfile - byte-compiled file
483 # dfile - purported source filename (same as 'file' by default)
484 if sys.platform.startswith('java'):
485 cfile = file[:-3] + '$py.class'
486 else:
487 cfile = file + (__debug__ and "c" or "o")
488 dfile = file
489 if prefix:
490 if file[:len(prefix)] != prefix:
491 raise ValueError, \
492 ("invalid prefix: filename %r doesn't start with %r"
493 % (file, prefix))
494 dfile = dfile[len(prefix):]
495 if base_dir:
496 dfile = os.path.join(base_dir, dfile)
497
498 cfile_base = os.path.basename(cfile)
499 if direct:
500 if force or newer(file, cfile):
501 log.info("byte-compiling %s to %s", file, cfile_base)
502 if not dry_run:
503 compile(file, cfile, dfile)
504 else:
505 log.debug("skipping byte-compilation of %s to %s",
506 file, cfile_base)
507
508# byte_compile ()
509
510def rfc822_escape (header):
511 """Return a version of the string escaped for inclusion in an
512 RFC-822 header, by ensuring there are 8 spaces space after each newline.
513 """
514 lines = string.split(header, '\n')
515 lines = map(string.strip, lines)
516 header = string.join(lines, '\n' + 8*' ')
517 return header