Blame - linux-x64/clang/python3/lib/python3.9/distutils/util.py - hafnium/prebuilts

blob: 4b002ecef1df8ffd79a9aa067640eb43027a9bf2 [file] [log] [blame]

Olivier Deprez	f4ef2d0	2021-04-20 13:36:24 +0200	[diff] [blame]	1	"""distutils.util
				2
				3	Miscellaneous utility functions -- anything that doesn't fit into
				4	one of the other *util.py modules.
				5	"""
				6
				7	import os
				8	import re
				9	import importlib.util
				10	import string
				11	import sys
				12	from distutils.errors import DistutilsPlatformError
				13	from distutils.dep_util import newer
				14	from distutils.spawn import spawn
				15	from distutils import log
				16	from distutils.errors import DistutilsByteCompileError
				17
				18	def get_host_platform():
				19	"""Return a string that identifies the current platform. This is used mainly to
				20	distinguish platform-specific build directories and platform-specific built
				21	distributions. Typically includes the OS name and version and the
				22	architecture (as supplied by 'os.uname()'), although the exact information
				23	included depends on the OS; eg. on Linux, the kernel version isn't
				24	particularly important.
				25
				26	Examples of returned values:
				27	linux-i586
				28	linux-alpha (?)
				29	solaris-2.6-sun4u
				30
				31	Windows will return one of:
				32	win-amd64 (64bit Windows on AMD64 (aka x86_64, Intel64, EM64T, etc)
				33	win32 (all others - specifically, sys.platform is returned)
				34
				35	For other non-POSIX platforms, currently just returns 'sys.platform'.
				36
				37	"""
				38	if os.name == 'nt':
				39	if 'amd64' in sys.version.lower():
				40	return 'win-amd64'
				41	if '(arm)' in sys.version.lower():
				42	return 'win-arm32'
				43	if '(arm64)' in sys.version.lower():
				44	return 'win-arm64'
				45	return sys.platform
				46
				47	# Set for cross builds explicitly
				48	if "_PYTHON_HOST_PLATFORM" in os.environ:
				49	return os.environ["_PYTHON_HOST_PLATFORM"]
				50
				51	if os.name != "posix" or not hasattr(os, 'uname'):
				52	# XXX what about the architecture? NT is Intel or Alpha,
				53	# Mac OS is M68k or PPC, etc.
				54	return sys.platform
				55
				56	# Try to distinguish various flavours of Unix
				57
				58	(osname, host, release, version, machine) = os.uname()
				59
				60	# Convert the OS name to lowercase, remove '/' characters, and translate
				61	# spaces (for "Power Macintosh")
				62	osname = osname.lower().replace('/', '')
				63	machine = machine.replace(' ', '_')
				64	machine = machine.replace('/', '-')
				65
				66	if osname[:5] == "linux":
				67	# At least on Linux/Intel, 'machine' is the processor --
				68	# i386, etc.
				69	# XXX what about Alpha, SPARC, etc?
				70	return "%s-%s" % (osname, machine)
				71	elif osname[:5] == "sunos":
				72	if release[0] >= "5": # SunOS 5 == Solaris 2
				73	osname = "solaris"
				74	release = "%d.%s" % (int(release[0]) - 3, release[2:])
				75	# We can't use "platform.architecture()[0]" because a
				76	# bootstrap problem. We use a dict to get an error
				77	# if some suspicious happens.
				78	bitness = {2147483647:"32bit", 9223372036854775807:"64bit"}
				79	machine += ".%s" % bitness[sys.maxsize]
				80	# fall through to standard osname-release-machine representation
				81	elif osname[:3] == "aix":
				82	from _aix_support import aix_platform
				83	return aix_platform()
				84	elif osname[:6] == "cygwin":
				85	osname = "cygwin"
				86	rel_re = re.compile (r'[\d.]+', re.ASCII)
				87	m = rel_re.match(release)
				88	if m:
				89	release = m.group()
				90	elif osname[:6] == "darwin":
				91	import _osx_support, distutils.sysconfig
				92	osname, release, machine = _osx_support.get_platform_osx(
				93	distutils.sysconfig.get_config_vars(),
				94	osname, release, machine)
				95
				96	return "%s-%s-%s" % (osname, release, machine)
				97
				98	def get_platform():
				99	if os.name == 'nt':
				100	TARGET_TO_PLAT = {
				101	'x86' : 'win32',
				102	'x64' : 'win-amd64',
				103	'arm' : 'win-arm32',
				104	}
				105	return TARGET_TO_PLAT.get(os.environ.get('VSCMD_ARG_TGT_ARCH')) or get_host_platform()
				106	else:
				107	return get_host_platform()
				108
				109	def convert_path (pathname):
				110	"""Return 'pathname' as a name that will work on the native filesystem,
				111	i.e. split it on '/' and put it back together again using the current
				112	directory separator. Needed because filenames in the setup script are
				113	always supplied in Unix style, and have to be converted to the local
				114	convention before we can actually use them in the filesystem. Raises
				115	ValueError on non-Unix-ish systems if 'pathname' either starts or
				116	ends with a slash.
				117	"""
				118	if os.sep == '/':
				119	return pathname
				120	if not pathname:
				121	return pathname
				122	if pathname[0] == '/':
				123	raise ValueError("path '%s' cannot be absolute" % pathname)
				124	if pathname[-1] == '/':
				125	raise ValueError("path '%s' cannot end with '/'" % pathname)
				126
				127	paths = pathname.split('/')
				128	while '.' in paths:
				129	paths.remove('.')
				130	if not paths:
				131	return os.curdir
				132	return os.path.join(*paths)
				133
				134	# convert_path ()
				135
				136
				137	def change_root (new_root, pathname):
				138	"""Return 'pathname' with 'new_root' prepended. If 'pathname' is
				139	relative, this is equivalent to "os.path.join(new_root,pathname)".
				140	Otherwise, it requires making 'pathname' relative and then joining the
				141	two, which is tricky on DOS/Windows and Mac OS.
				142	"""
				143	if os.name == 'posix':
				144	if not os.path.isabs(pathname):
				145	return os.path.join(new_root, pathname)
				146	else:
				147	return os.path.join(new_root, pathname[1:])
				148
				149	elif os.name == 'nt':
				150	(drive, path) = os.path.splitdrive(pathname)
				151	if path[0] == '\\':
				152	path = path[1:]
				153	return os.path.join(new_root, path)
				154
				155	else:
				156	raise DistutilsPlatformError("nothing known about platform '%s'" % os.name)
				157
				158
				159	_environ_checked = 0
				160	def check_environ ():
				161	"""Ensure that 'os.environ' has all the environment variables we
				162	guarantee that users can use in config files, command-line options,
				163	etc. Currently this includes:
				164	HOME - user's home directory (Unix only)
				165	PLAT - description of the current platform, including hardware
				166	and OS (see 'get_platform()')
				167	"""
				168	global _environ_checked
				169	if _environ_checked:
				170	return
				171
				172	if os.name == 'posix' and 'HOME' not in os.environ:
				173	try:
				174	import pwd
				175	os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
				176	except (ImportError, KeyError):
				177	# bpo-10496: if the current user identifier doesn't exist in the
				178	# password database, do nothing
				179	pass
				180
				181	if 'PLAT' not in os.environ:
				182	os.environ['PLAT'] = get_platform()
				183
				184	_environ_checked = 1
				185
				186
				187	def subst_vars (s, local_vars):
				188	"""Perform shell/Perl-style variable substitution on 'string'. Every
				189	occurrence of '$' followed by a name is considered a variable, and
				190	variable is substituted by the value found in the 'local_vars'
				191	dictionary, or in 'os.environ' if it's not in 'local_vars'.
				192	'os.environ' is first checked/augmented to guarantee that it contains
				193	certain values: see 'check_environ()'. Raise ValueError for any
				194	variables not found in either 'local_vars' or 'os.environ'.
				195	"""
				196	check_environ()
				197	def _subst (match, local_vars=local_vars):
				198	var_name = match.group(1)
				199	if var_name in local_vars:
				200	return str(local_vars[var_name])
				201	else:
				202	return os.environ[var_name]
				203
				204	try:
				205	return re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
				206	except KeyError as var:
				207	raise ValueError("invalid variable '$%s'" % var)
				208
				209	# subst_vars ()
				210
				211
				212	def grok_environment_error (exc, prefix="error: "):
				213	# Function kept for backward compatibility.
				214	# Used to try clever things with EnvironmentErrors,
				215	# but nowadays str(exception) produces good messages.
				216	return prefix + str(exc)
				217
				218
				219	# Needed by 'split_quoted()'
				220	_wordchars_re = _squote_re = _dquote_re = None
				221	def _init_regex():
				222	global _wordchars_re, _squote_re, _dquote_re
				223	_wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
				224	_squote_re = re.compile(r"'(?:[^'\\]\|\\.)*'")
				225	_dquote_re = re.compile(r'"(?:[^"\\]\|\\.)*"')
				226
				227	def split_quoted (s):
				228	"""Split a string up according to Unix shell-like rules for quotes and
				229	backslashes. In short: words are delimited by spaces, as long as those
				230	spaces are not escaped by a backslash, or inside a quoted string.
				231	Single and double quotes are equivalent, and the quote characters can
				232	be backslash-escaped. The backslash is stripped from any two-character
				233	escape sequence, leaving only the escaped character. The quote
				234	characters are stripped from any quoted string. Returns a list of
				235	words.
				236	"""
				237
				238	# This is a nice algorithm for splitting up a single string, since it
				239	# doesn't require character-by-character examination. It was a little
				240	# bit of a brain-bender to get it working right, though...
				241	if _wordchars_re is None: _init_regex()
				242
				243	s = s.strip()
				244	words = []
				245	pos = 0
				246
				247	while s:
				248	m = _wordchars_re.match(s, pos)
				249	end = m.end()
				250	if end == len(s):
				251	words.append(s[:end])
				252	break
				253
				254	if s[end] in string.whitespace: # unescaped, unquoted whitespace: now
				255	words.append(s[:end]) # we definitely have a word delimiter
				256	s = s[end:].lstrip()
				257	pos = 0
				258
				259	elif s[end] == '\\': # preserve whatever is being escaped;
				260	# will become part of the current word
				261	s = s[:end] + s[end+1:]
				262	pos = end+1
				263
				264	else:
				265	if s[end] == "'": # slurp singly-quoted string
				266	m = _squote_re.match(s, end)
				267	elif s[end] == '"': # slurp doubly-quoted string
				268	m = _dquote_re.match(s, end)
				269	else:
				270	raise RuntimeError("this can't happen (bad char '%c')" % s[end])
				271
				272	if m is None:
				273	raise ValueError("bad string (mismatched %s quotes?)" % s[end])
				274
				275	(beg, end) = m.span()
				276	s = s[:beg] + s[beg+1:end-1] + s[end:]
				277	pos = m.end() - 2
				278
				279	if pos >= len(s):
				280	words.append(s)
				281	break
				282
				283	return words
				284
				285	# split_quoted ()
				286
				287
				288	def execute (func, args, msg=None, verbose=0, dry_run=0):
				289	"""Perform some action that affects the outside world (eg. by
				290	writing to the filesystem). Such actions are special because they
				291	are disabled by the 'dry_run' flag. This method takes care of all
				292	that bureaucracy for you; all you have to do is supply the
				293	function to call and an argument tuple for it (to embody the
				294	"external action" being performed), and an optional message to
				295	print.
				296	"""
				297	if msg is None:
				298	msg = "%s%r" % (func.__name__, args)
				299	if msg[-2:] == ',)': # correct for singleton tuple
				300	msg = msg[0:-2] + ')'
				301
				302	log.info(msg)
				303	if not dry_run:
				304	func(*args)
				305
				306
				307	def strtobool (val):
				308	"""Convert a string representation of truth to true (1) or false (0).
				309
				310	True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
				311	are 'n', 'no', 'f', 'false', 'off', and '0'. Raises ValueError if
				312	'val' is anything else.
				313	"""
				314	val = val.lower()
				315	if val in ('y', 'yes', 't', 'true', 'on', '1'):
				316	return 1
				317	elif val in ('n', 'no', 'f', 'false', 'off', '0'):
				318	return 0
				319	else:
				320	raise ValueError("invalid truth value %r" % (val,))
				321
				322
				323	def byte_compile (py_files,
				324	optimize=0, force=0,
				325	prefix=None, base_dir=None,
				326	verbose=1, dry_run=0,
				327	direct=None):
				328	"""Byte-compile a collection of Python source files to .pyc
				329	files in a __pycache__ subdirectory. 'py_files' is a list
				330	of files to compile; any files that don't end in ".py" are silently
				331	skipped. 'optimize' must be one of the following:
				332	0 - don't optimize
				333	1 - normal optimization (like "python -O")
				334	2 - extra optimization (like "python -OO")
				335	If 'force' is true, all files are recompiled regardless of
				336	timestamps.
				337
				338	The source filename encoded in each bytecode file defaults to the
				339	filenames listed in 'py_files'; you can modify these with 'prefix' and
				340	'basedir'. 'prefix' is a string that will be stripped off of each
				341	source filename, and 'base_dir' is a directory name that will be
				342	prepended (after 'prefix' is stripped). You can supply either or both
				343	(or neither) of 'prefix' and 'base_dir', as you wish.
				344
				345	If 'dry_run' is true, doesn't actually do anything that would
				346	affect the filesystem.
				347
				348	Byte-compilation is either done directly in this interpreter process
				349	with the standard py_compile module, or indirectly by writing a
				350	temporary script and executing it. Normally, you should let
				351	'byte_compile()' figure out to use direct compilation or not (see
				352	the source for details). The 'direct' flag is used by the script
				353	generated in indirect mode; unless you know what you're doing, leave
				354	it set to None.
				355	"""
				356
				357	# Late import to fix a bootstrap issue: _posixsubprocess is built by
				358	# setup.py, but setup.py uses distutils.
				359	import subprocess
				360
				361	# nothing is done if sys.dont_write_bytecode is True
				362	if sys.dont_write_bytecode:
				363	raise DistutilsByteCompileError('byte-compiling is disabled.')
				364
				365	# First, if the caller didn't force us into direct or indirect mode,
				366	# figure out which mode we should be in. We take a conservative
				367	# approach: choose direct mode only if the current interpreter is
				368	# in debug mode and optimize is 0. If we're not in debug mode (-O
				369	# or -OO), we don't know which level of optimization this
				370	# interpreter is running with, so we can't do direct
				371	# byte-compilation and be certain that it's the right thing. Thus,
				372	# always compile indirectly if the current interpreter is in either
				373	# optimize mode, or if either optimization level was requested by
				374	# the caller.
				375	if direct is None:
				376	direct = (__debug__ and optimize == 0)
				377
				378	# "Indirect" byte-compilation: write a temporary script and then
				379	# run it with the appropriate flags.
				380	if not direct:
				381	try:
				382	from tempfile import mkstemp
				383	(script_fd, script_name) = mkstemp(".py")
				384	except ImportError:
				385	from tempfile import mktemp
				386	(script_fd, script_name) = None, mktemp(".py")
				387	log.info("writing byte-compilation script '%s'", script_name)
				388	if not dry_run:
				389	if script_fd is not None:
				390	script = os.fdopen(script_fd, "w")
				391	else:
				392	script = open(script_name, "w")
				393
				394	with script:
				395	script.write("""\
				396	from distutils.util import byte_compile
				397	files = [
				398	""")
				399
				400	# XXX would be nice to write absolute filenames, just for
				401	# safety's sake (script should be more robust in the face of
				402	# chdir'ing before running it). But this requires abspath'ing
				403	# 'prefix' as well, and that breaks the hack in build_lib's
				404	# 'byte_compile()' method that carefully tacks on a trailing
				405	# slash (os.sep really) to make sure the prefix here is "just
				406	# right". This whole prefix business is rather delicate -- the
				407	# problem is that it's really a directory, but I'm treating it
				408	# as a dumb string, so trailing slashes and so forth matter.
				409
				410	#py_files = map(os.path.abspath, py_files)
				411	#if prefix:
				412	# prefix = os.path.abspath(prefix)
				413
				414	script.write(",\n".join(map(repr, py_files)) + "]\n")
				415	script.write("""
				416	byte_compile(files, optimize=%r, force=%r,
				417	prefix=%r, base_dir=%r,
				418	verbose=%r, dry_run=0,
				419	direct=1)
				420	""" % (optimize, force, prefix, base_dir, verbose))
				421
				422	cmd = [sys.executable]
				423	cmd.extend(subprocess._optim_args_from_interpreter_flags())
				424	cmd.append(script_name)
				425	spawn(cmd, dry_run=dry_run)
				426	execute(os.remove, (script_name,), "removing %s" % script_name,
				427	dry_run=dry_run)
				428
				429	# "Direct" byte-compilation: use the py_compile module to compile
				430	# right here, right now. Note that the script generated in indirect
				431	# mode simply calls 'byte_compile()' in direct mode, a weird sort of
				432	# cross-process recursion. Hey, it works!
				433	else:
				434	from py_compile import compile
				435
				436	for file in py_files:
				437	if file[-3:] != ".py":
				438	# This lets us be lazy and not filter filenames in
				439	# the "install_lib" command.
				440	continue
				441
				442	# Terminology from the py_compile module:
				443	# cfile - byte-compiled file
				444	# dfile - purported source filename (same as 'file' by default)
				445	if optimize >= 0:
				446	opt = '' if optimize == 0 else optimize
				447	cfile = importlib.util.cache_from_source(
				448	file, optimization=opt)
				449	else:
				450	cfile = importlib.util.cache_from_source(file)
				451	dfile = file
				452	if prefix:
				453	if file[:len(prefix)] != prefix:
				454	raise ValueError("invalid prefix: filename %r doesn't start with %r"
				455	% (file, prefix))
				456	dfile = dfile[len(prefix):]
				457	if base_dir:
				458	dfile = os.path.join(base_dir, dfile)
				459
				460	cfile_base = os.path.basename(cfile)
				461	if direct:
				462	if force or newer(file, cfile):
				463	log.info("byte-compiling %s to %s", file, cfile_base)
				464	if not dry_run:
				465	compile(file, cfile, dfile)
				466	else:
				467	log.debug("skipping byte-compilation of %s to %s",
				468	file, cfile_base)
				469
				470	# byte_compile ()
				471
				472	def rfc822_escape (header):
				473	"""Return a version of the string escaped for inclusion in an
				474	RFC-822 header, by ensuring there are 8 spaces space after each newline.
				475	"""
				476	lines = header.split('\n')
				477	sep = '\n' + 8 * ' '
				478	return sep.join(lines)
				479
				480	# 2to3 support
				481
				482	def run_2to3(files, fixer_names=None, options=None, explicit=None):
				483	"""Invoke 2to3 on a list of Python files.
				484	The files should all come from the build area, as the
				485	modification is done in-place. To reduce the build time,
				486	only files modified since the last invocation of this
				487	function should be passed in the files argument."""
				488
				489	if not files:
				490	return
				491
				492	# Make this class local, to delay import of 2to3
				493	from lib2to3.refactor import RefactoringTool, get_fixers_from_package
				494	class DistutilsRefactoringTool(RefactoringTool):
				495	def log_error(self, msg, args, *kw):
				496	log.error(msg, *args)
				497
				498	def log_message(self, msg, *args):
				499	log.info(msg, *args)
				500
				501	def log_debug(self, msg, *args):
				502	log.debug(msg, *args)
				503
				504	if fixer_names is None:
				505	fixer_names = get_fixers_from_package('lib2to3.fixes')
				506	r = DistutilsRefactoringTool(fixer_names, options=options)
				507	r.refactor(files, write=True)
				508
				509	def copydir_run_2to3(src, dest, template=None, fixer_names=None,
				510	options=None, explicit=None):
				511	"""Recursively copy a directory, only copying new and changed files,
				512	running run_2to3 over all newly copied Python modules afterward.
				513
				514	If you give a template string, it's parsed like a MANIFEST.in.
				515	"""
				516	from distutils.dir_util import mkpath
				517	from distutils.file_util import copy_file
				518	from distutils.filelist import FileList
				519	filelist = FileList()
				520	curdir = os.getcwd()
				521	os.chdir(src)
				522	try:
				523	filelist.findall()
				524	finally:
				525	os.chdir(curdir)
				526	filelist.files[:] = filelist.allfiles
				527	if template:
				528	for line in template.splitlines():
				529	line = line.strip()
				530	if not line: continue
				531	filelist.process_template_line(line)
				532	copied = []
				533	for filename in filelist.files:
				534	outname = os.path.join(dest, filename)
				535	mkpath(os.path.dirname(outname))
				536	res = copy_file(os.path.join(src, filename), outname, update=1)
				537	if res[1]: copied.append(outname)
				538	run_2to3([fn for fn in copied if fn.lower().endswith('.py')],
				539	fixer_names=fixer_names, options=options, explicit=explicit)
				540	return copied
				541
				542	class Mixin2to3:
				543	'''Mixin class for commands that run 2to3.
				544	To configure 2to3, setup scripts may either change
				545	the class variables, or inherit from individual commands
				546	to override how 2to3 is invoked.'''
				547
				548	# provide list of fixers to run;
				549	# defaults to all from lib2to3.fixers
				550	fixer_names = None
				551
				552	# options dictionary
				553	options = None
				554
				555	# list of fixers to invoke even though they are marked as explicit
				556	explicit = None
				557
				558	def run_2to3(self, files):
				559	return run_2to3(files, self.fixer_names, self.options, self.explicit)