Blame - python/lib/Lib/distutils/util.py - platform/tools/idea

blob: 6024911464ae2e3d5dfeb0cc194bdb969bbdb33c [file] [log] [blame]

Tor Norbye	3a2425a	2013-11-04 10:16:08 -0800	[diff] [blame^]	1	"""distutils.util
				2
				3	Miscellaneous utility functions -- anything that doesn't fit into
				4	one of the other *util.py modules.
				5	"""
				6
				7	__revision__ = "$Id: util.py 59116 2007-11-22 10:14:26Z ronald.oussoren $"
				8
				9	import sys, os, string, re
				10	from distutils.errors import DistutilsPlatformError
				11	from distutils.dep_util import newer
				12	from distutils.spawn import spawn
				13	from distutils import log
				14
				15	def get_platform ():
				16	"""Return a string that identifies the current platform. This is used
				17	mainly to distinguish platform-specific build directories and
				18	platform-specific built distributions. Typically includes the OS name
				19	and version and the architecture (as supplied by 'os.uname()'),
				20	although the exact information included depends on the OS; eg. for IRIX
				21	the architecture isn't particularly important (IRIX only runs on SGI
				22	hardware), but for Linux the kernel version isn't particularly
				23	important.
				24
				25	Examples of returned values:
				26	linux-i586
				27	linux-alpha (?)
				28	solaris-2.6-sun4u
				29	irix-5.3
				30	irix64-6.2
				31
				32	For non-POSIX platforms, currently just returns 'sys.platform'.
				33	"""
				34	if os.name != "posix" or not hasattr(os, 'uname'):
				35	# XXX what about the architecture? NT is Intel or Alpha,
				36	# Mac OS is M68k or PPC, etc.
				37	return sys.platform
				38
				39	# Try to distinguish various flavours of Unix
				40
				41	(osname, host, release, version, machine) = os.uname()
				42
				43	# Convert the OS name to lowercase, remove '/' characters
				44	# (to accommodate BSD/OS), and translate spaces (for "Power Macintosh")
				45	osname = string.lower(osname)
				46	osname = string.replace(osname, '/', '')
				47	machine = string.replace(machine, ' ', '_')
				48	machine = string.replace(machine, '/', '-')
				49
				50	if osname[:5] == "linux":
				51	# At least on Linux/Intel, 'machine' is the processor --
				52	# i386, etc.
				53	# XXX what about Alpha, SPARC, etc?
				54	return "%s-%s" % (osname, machine)
				55	elif osname[:5] == "sunos":
				56	if release[0] >= "5": # SunOS 5 == Solaris 2
				57	osname = "solaris"
				58	release = "%d.%s" % (int(release[0]) - 3, release[2:])
				59	# fall through to standard osname-release-machine representation
				60	elif osname[:4] == "irix": # could be "irix64"!
				61	return "%s-%s" % (osname, release)
				62	elif osname[:3] == "aix":
				63	return "%s-%s.%s" % (osname, version, release)
				64	elif osname[:6] == "cygwin":
				65	osname = "cygwin"
				66	rel_re = re.compile (r'[\d.]+')
				67	m = rel_re.match(release)
				68	if m:
				69	release = m.group()
				70	elif osname[:6] == "darwin":
				71	#
				72	# For our purposes, we'll assume that the system version from
				73	# distutils' perspective is what MACOSX_DEPLOYMENT_TARGET is set
				74	# to. This makes the compatibility story a bit more sane because the
				75	# machine is going to compile and link as if it were
				76	# MACOSX_DEPLOYMENT_TARGET.
				77	from distutils.sysconfig import get_config_vars
				78	cfgvars = get_config_vars()
				79
				80	macver = os.environ.get('MACOSX_DEPLOYMENT_TARGET')
				81	if not macver:
				82	macver = cfgvars.get('MACOSX_DEPLOYMENT_TARGET')
				83
				84	if not macver:
				85	# Get the system version. Reading this plist is a documented
				86	# way to get the system version (see the documentation for
				87	# the Gestalt Manager)
				88	try:
				89	f = open('/System/Library/CoreServices/SystemVersion.plist')
				90	except IOError:
				91	# We're on a plain darwin box, fall back to the default
				92	# behaviour.
				93	pass
				94	else:
				95	m = re.search(
				96	r'<key>ProductUserVisibleVersion</key>\s*' +
				97	r'<string>(.*?)</string>', f.read())
				98	f.close()
				99	if m is not None:
				100	macver = '.'.join(m.group(1).split('.')[:2])
				101	# else: fall back to the default behaviour
				102
				103	if macver:
				104	from distutils.sysconfig import get_config_vars
				105	release = macver
				106	osname = "macosx"
				107
				108
				109	if (release + '.') >= '10.4.' and \
				110	get_config_vars().get('UNIVERSALSDK', '').strip():
				111	# The universal build will build fat binaries, but not on
				112	# systems before 10.4
				113	machine = 'fat'
				114
				115	elif machine in ('PowerPC', 'Power_Macintosh'):
				116	# Pick a sane name for the PPC architecture.
				117	machine = 'ppc'
				118
				119	return "%s-%s-%s" % (osname, release, machine)
				120
				121	# get_platform ()
				122
				123
				124	def convert_path (pathname):
				125	"""Return 'pathname' as a name that will work on the native filesystem,
				126	i.e. split it on '/' and put it back together again using the current
				127	directory separator. Needed because filenames in the setup script are
				128	always supplied in Unix style, and have to be converted to the local
				129	convention before we can actually use them in the filesystem. Raises
				130	ValueError on non-Unix-ish systems if 'pathname' either starts or
				131	ends with a slash.
				132	"""
				133	if os.sep == '/':
				134	return pathname
				135	if not pathname:
				136	return pathname
				137	if pathname[0] == '/':
				138	raise ValueError, "path '%s' cannot be absolute" % pathname
				139	if pathname[-1] == '/':
				140	raise ValueError, "path '%s' cannot end with '/'" % pathname
				141
				142	paths = string.split(pathname, '/')
				143	while '.' in paths:
				144	paths.remove('.')
				145	if not paths:
				146	return os.curdir
				147	return apply(os.path.join, paths)
				148
				149	# convert_path ()
				150
				151
				152	def change_root (new_root, pathname):
				153	"""Return 'pathname' with 'new_root' prepended. If 'pathname' is
				154	relative, this is equivalent to "os.path.join(new_root,pathname)".
				155	Otherwise, it requires making 'pathname' relative and then joining the
				156	two, which is tricky on DOS/Windows and Mac OS.
				157	"""
				158	os_name = os._name if sys.platform.startswith('java') else os.name
				159	if os_name == 'posix':
				160	if not os.path.isabs(pathname):
				161	return os.path.join(new_root, pathname)
				162	else:
				163	return os.path.join(new_root, pathname[1:])
				164
				165	elif os_name == 'nt':
				166	(drive, path) = os.path.splitdrive(pathname)
				167	if path[0] == '\\':
				168	path = path[1:]
				169	return os.path.join(new_root, path)
				170
				171	elif os_name == 'os2':
				172	(drive, path) = os.path.splitdrive(pathname)
				173	if path[0] == os.sep:
				174	path = path[1:]
				175	return os.path.join(new_root, path)
				176
				177	elif os_name == 'mac':
				178	if not os.path.isabs(pathname):
				179	return os.path.join(new_root, pathname)
				180	else:
				181	# Chop off volume name from start of path
				182	elements = string.split(pathname, ":", 1)
				183	pathname = ":" + elements[1]
				184	return os.path.join(new_root, pathname)
				185
				186	else:
				187	raise DistutilsPlatformError, \
				188	"nothing known about platform '%s'" % os_name
				189
				190
				191	_environ_checked = 0
				192	def check_environ ():
				193	"""Ensure that 'os.environ' has all the environment variables we
				194	guarantee that users can use in config files, command-line options,
				195	etc. Currently this includes:
				196	HOME - user's home directory (Unix only)
				197	PLAT - description of the current platform, including hardware
				198	and OS (see 'get_platform()')
				199	"""
				200	global _environ_checked
				201	if _environ_checked:
				202	return
				203
				204	if os.name == 'posix' and not os.environ.has_key('HOME'):
				205	import pwd
				206	os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
				207
				208	if not os.environ.has_key('PLAT'):
				209	os.environ['PLAT'] = get_platform()
				210
				211	_environ_checked = 1
				212
				213
				214	def subst_vars (s, local_vars):
				215	"""Perform shell/Perl-style variable substitution on 'string'. Every
				216	occurrence of '$' followed by a name is considered a variable, and
				217	variable is substituted by the value found in the 'local_vars'
				218	dictionary, or in 'os.environ' if it's not in 'local_vars'.
				219	'os.environ' is first checked/augmented to guarantee that it contains
				220	certain values: see 'check_environ()'. Raise ValueError for any
				221	variables not found in either 'local_vars' or 'os.environ'.
				222	"""
				223	check_environ()
				224	def _subst (match, local_vars=local_vars):
				225	var_name = match.group(1)
				226	if local_vars.has_key(var_name):
				227	return str(local_vars[var_name])
				228	else:
				229	return os.environ[var_name]
				230
				231	try:
				232	return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
				233	except KeyError, var:
				234	raise ValueError, "invalid variable '$%s'" % var
				235
				236	# subst_vars ()
				237
				238
				239	def grok_environment_error (exc, prefix="error: "):
				240	"""Generate a useful error message from an EnvironmentError (IOError or
				241	OSError) exception object. Handles Python 1.5.1 and 1.5.2 styles, and
				242	does what it can to deal with exception objects that don't have a
				243	filename (which happens when the error is due to a two-file operation,
				244	such as 'rename()' or 'link()'. Returns the error message as a string
				245	prefixed with 'prefix'.
				246	"""
				247	# check for Python 1.5.2-style {IO,OS}Error exception objects
				248	if hasattr(exc, 'filename') and hasattr(exc, 'strerror'):
				249	if exc.filename:
				250	error = prefix + "%s: %s" % (exc.filename, exc.strerror)
				251	else:
				252	# two-argument functions in posix module don't
				253	# include the filename in the exception object!
				254	error = prefix + "%s" % exc.strerror
				255	else:
				256	error = prefix + str(exc[-1])
				257
				258	return error
				259
				260
				261	# Needed by 'split_quoted()'
				262	_wordchars_re = _squote_re = _dquote_re = None
				263	def _init_regex():
				264	global _wordchars_re, _squote_re, _dquote_re
				265	_wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
				266	_squote_re = re.compile(r"'(?:[^'\\]\|\\.)*'")
				267	_dquote_re = re.compile(r'"(?:[^"\\]\|\\.)*"')
				268
				269	def split_quoted (s):
				270	"""Split a string up according to Unix shell-like rules for quotes and
				271	backslashes. In short: words are delimited by spaces, as long as those
				272	spaces are not escaped by a backslash, or inside a quoted string.
				273	Single and double quotes are equivalent, and the quote characters can
				274	be backslash-escaped. The backslash is stripped from any two-character
				275	escape sequence, leaving only the escaped character. The quote
				276	characters are stripped from any quoted string. Returns a list of
				277	words.
				278	"""
				279
				280	# This is a nice algorithm for splitting up a single string, since it
				281	# doesn't require character-by-character examination. It was a little
				282	# bit of a brain-bender to get it working right, though...
				283	if _wordchars_re is None: _init_regex()
				284
				285	s = string.strip(s)
				286	words = []
				287	pos = 0
				288
				289	while s:
				290	m = _wordchars_re.match(s, pos)
				291	end = m.end()
				292	if end == len(s):
				293	words.append(s[:end])
				294	break
				295
				296	if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
				297	words.append(s[:end]) # we definitely have a word delimiter
				298	s = string.lstrip(s[end:])
				299	pos = 0
				300
				301	elif s[end] == '\\': # preserve whatever is being escaped;
				302	# will become part of the current word
				303	s = s[:end] + s[end+1:]
				304	pos = end+1
				305
				306	else:
				307	if s[end] == "'": # slurp singly-quoted string
				308	m = _squote_re.match(s, end)
				309	elif s[end] == '"': # slurp doubly-quoted string
				310	m = _dquote_re.match(s, end)
				311	else:
				312	raise RuntimeError, \
				313	"this can't happen (bad char '%c')" % s[end]
				314
				315	if m is None:
				316	raise ValueError, \
				317	"bad string (mismatched %s quotes?)" % s[end]
				318
				319	(beg, end) = m.span()
				320	s = s[:beg] + s[beg+1:end-1] + s[end:]
				321	pos = m.end() - 2
				322
				323	if pos >= len(s):
				324	words.append(s)
				325	break
				326
				327	return words
				328
				329	# split_quoted ()
				330
				331
				332	def execute (func, args, msg=None, verbose=0, dry_run=0):
				333	"""Perform some action that affects the outside world (eg. by
				334	writing to the filesystem). Such actions are special because they
				335	are disabled by the 'dry_run' flag. This method takes care of all
				336	that bureaucracy for you; all you have to do is supply the
				337	function to call and an argument tuple for it (to embody the
				338	"external action" being performed), and an optional message to
				339	print.
				340	"""
				341	if msg is None:
				342	msg = "%s%r" % (func.__name__, args)
				343	if msg[-2:] == ',)': # correct for singleton tuple
				344	msg = msg[0:-2] + ')'
				345
				346	log.info(msg)
				347	if not dry_run:
				348	apply(func, args)
				349
				350
				351	def strtobool (val):
				352	"""Convert a string representation of truth to true (1) or false (0).
				353
				354	True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
				355	are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if
				356	'val' is anything else.
				357	"""
				358	val = string.lower(val)
				359	if val in ('y', 'yes', 't', 'true', 'on', '1'):
				360	return 1
				361	elif val in ('n', 'no', 'f', 'false', 'off', '0'):
				362	return 0
				363	else:
				364	raise ValueError, "invalid truth value %r" % (val,)
				365
				366
				367	def byte_compile (py_files,
				368	optimize=0, force=0,
				369	prefix=None, base_dir=None,
				370	verbose=1, dry_run=0,
				371	direct=None):
				372	"""Byte-compile a collection of Python source files to either .pyc
				373	or .pyo files in the same directory. 'py_files' is a list of files
				374	to compile; any files that don't end in ".py" are silently skipped.
				375	'optimize' must be one of the following:
				376	0 - don't optimize (generate .pyc)
				377	1 - normal optimization (like "python -O")
				378	2 - extra optimization (like "python -OO")
				379	If 'force' is true, all files are recompiled regardless of
				380	timestamps.
				381
				382	The source filename encoded in each bytecode file defaults to the
				383	filenames listed in 'py_files'; you can modify these with 'prefix' and
				384	'basedir'. 'prefix' is a string that will be stripped off of each
				385	source filename, and 'base_dir' is a directory name that will be
				386	prepended (after 'prefix' is stripped). You can supply either or both
				387	(or neither) of 'prefix' and 'base_dir', as you wish.
				388
				389	If 'dry_run' is true, doesn't actually do anything that would
				390	affect the filesystem.
				391
				392	Byte-compilation is either done directly in this interpreter process
				393	with the standard py_compile module, or indirectly by writing a
				394	temporary script and executing it. Normally, you should let
				395	'byte_compile()' figure out to use direct compilation or not (see
				396	the source for details). The 'direct' flag is used by the script
				397	generated in indirect mode; unless you know what you're doing, leave
				398	it set to None.
				399	"""
				400
				401	# First, if the caller didn't force us into direct or indirect mode,
				402	# figure out which mode we should be in. We take a conservative
				403	# approach: choose direct mode only if the current interpreter is
				404	# in debug mode and optimize is 0. If we're not in debug mode (-O
				405	# or -OO), we don't know which level of optimization this
				406	# interpreter is running with, so we can't do direct
				407	# byte-compilation and be certain that it's the right thing. Thus,
				408	# always compile indirectly if the current interpreter is in either
				409	# optimize mode, or if either optimization level was requested by
				410	# the caller.
				411	if direct is None:
				412	direct = (__debug__ and optimize == 0)
				413
				414	# "Indirect" byte-compilation: write a temporary script and then
				415	# run it with the appropriate flags.
				416	if not direct:
				417	try:
				418	from tempfile import mkstemp
				419	(script_fd, script_name) = mkstemp(".py")
				420	except ImportError:
				421	from tempfile import mktemp
				422	(script_fd, script_name) = None, mktemp(".py")
				423	log.info("writing byte-compilation script '%s'", script_name)
				424	if not dry_run:
				425	if script_fd is not None:
				426	script = os.fdopen(script_fd, "w")
				427	else:
				428	script = open(script_name, "w")
				429
				430	script.write("""\
				431	from distutils.util import byte_compile
				432	files = [
				433	""")
				434
				435	# XXX would be nice to write absolute filenames, just for
				436	# safety's sake (script should be more robust in the face of
				437	# chdir'ing before running it). But this requires abspath'ing
				438	# 'prefix' as well, and that breaks the hack in build_lib's
				439	# 'byte_compile()' method that carefully tacks on a trailing
				440	# slash (os.sep really) to make sure the prefix here is "just
				441	# right". This whole prefix business is rather delicate -- the
				442	# problem is that it's really a directory, but I'm treating it
				443	# as a dumb string, so trailing slashes and so forth matter.
				444
				445	#py_files = map(os.path.abspath, py_files)
				446	#if prefix:
				447	# prefix = os.path.abspath(prefix)
				448
				449	script.write(string.join(map(repr, py_files), ",\n") + "]\n")
				450	script.write("""
				451	byte_compile(files, optimize=%r, force=%r,
				452	prefix=%r, base_dir=%r,
				453	verbose=%r, dry_run=0,
				454	direct=1)
				455	""" % (optimize, force, prefix, base_dir, verbose))
				456
				457	script.close()
				458
				459	cmd = [sys.executable, script_name]
				460	if optimize == 1:
				461	cmd.insert(1, "-O")
				462	elif optimize == 2:
				463	cmd.insert(1, "-OO")
				464	spawn(cmd, dry_run=dry_run)
				465	execute(os.remove, (script_name,), "removing %s" % script_name,
				466	dry_run=dry_run)
				467
				468	# "Direct" byte-compilation: use the py_compile module to compile
				469	# right here, right now. Note that the script generated in indirect
				470	# mode simply calls 'byte_compile()' in direct mode, a weird sort of
				471	# cross-process recursion. Hey, it works!
				472	else:
				473	from py_compile import compile
				474
				475	for file in py_files:
				476	if file[-3:] != ".py":
				477	# This lets us be lazy and not filter filenames in
				478	# the "install_lib" command.
				479	continue
				480
				481	# Terminology from the py_compile module:
				482	# cfile - byte-compiled file
				483	# dfile - purported source filename (same as 'file' by default)
				484	if sys.platform.startswith('java'):
				485	cfile = file[:-3] + '$py.class'
				486	else:
				487	cfile = file + (__debug__ and "c" or "o")
				488	dfile = file
				489	if prefix:
				490	if file[:len(prefix)] != prefix:
				491	raise ValueError, \
				492	("invalid prefix: filename %r doesn't start with %r"
				493	% (file, prefix))
				494	dfile = dfile[len(prefix):]
				495	if base_dir:
				496	dfile = os.path.join(base_dir, dfile)
				497
				498	cfile_base = os.path.basename(cfile)
				499	if direct:
				500	if force or newer(file, cfile):
				501	log.info("byte-compiling %s to %s", file, cfile_base)
				502	if not dry_run:
				503	compile(file, cfile, dfile)
				504	else:
				505	log.debug("skipping byte-compilation of %s to %s",
				506	file, cfile_base)
				507
				508	# byte_compile ()
				509
				510	def rfc822_escape (header):
				511	"""Return a version of the string escaped for inclusion in an
				512	RFC-822 header, by ensuring there are 8 spaces space after each newline.
				513	"""
				514	lines = string.split(header, '\n')
				515	lines = map(string.strip, lines)
				516	header = string.join(lines, '\n' + 8*' ')
				517	return header