514 lines
		
	
	
		
			18 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			514 lines
		
	
	
		
			18 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| """distutils.util
 | |
| 
 | |
| Miscellaneous utility functions -- anything that doesn't fit into
 | |
| one of the other *util.py modules.
 | |
| """
 | |
| 
 | |
| import importlib.util
 | |
| import os
 | |
| import re
 | |
| import string
 | |
| import subprocess
 | |
| import sys
 | |
| import sysconfig
 | |
| import functools
 | |
| 
 | |
| from .errors import DistutilsPlatformError, DistutilsByteCompileError
 | |
| from .dep_util import newer
 | |
| from .spawn import spawn
 | |
| from ._log import log
 | |
| 
 | |
| 
 | |
| def get_host_platform():
 | |
|     """
 | |
|     Return a string that identifies the current platform. Use this
 | |
|     function to distinguish platform-specific build directories and
 | |
|     platform-specific built distributions.
 | |
|     """
 | |
| 
 | |
|     # This function initially exposed platforms as defined in Python 3.9
 | |
|     # even with older Python versions when distutils was split out.
 | |
|     # Now it delegates to stdlib sysconfig, but maintains compatibility.
 | |
| 
 | |
|     if sys.version_info < (3, 8):
 | |
|         if os.name == 'nt':
 | |
|             if '(arm)' in sys.version.lower():
 | |
|                 return 'win-arm32'
 | |
|             if '(arm64)' in sys.version.lower():
 | |
|                 return 'win-arm64'
 | |
| 
 | |
|     if sys.version_info < (3, 9):
 | |
|         if os.name == "posix" and hasattr(os, 'uname'):
 | |
|             osname, host, release, version, machine = os.uname()
 | |
|             if osname[:3] == "aix":
 | |
|                 from .py38compat import aix_platform
 | |
| 
 | |
|                 return aix_platform(osname, version, release)
 | |
| 
 | |
|     return sysconfig.get_platform()
 | |
| 
 | |
| 
 | |
| def get_platform():
 | |
|     if os.name == 'nt':
 | |
|         TARGET_TO_PLAT = {
 | |
|             'x86': 'win32',
 | |
|             'x64': 'win-amd64',
 | |
|             'arm': 'win-arm32',
 | |
|             'arm64': 'win-arm64',
 | |
|         }
 | |
|         target = os.environ.get('VSCMD_ARG_TGT_ARCH')
 | |
|         return TARGET_TO_PLAT.get(target) or get_host_platform()
 | |
|     return get_host_platform()
 | |
| 
 | |
| 
 | |
| if sys.platform == 'darwin':
 | |
|     _syscfg_macosx_ver = None  # cache the version pulled from sysconfig
 | |
| MACOSX_VERSION_VAR = 'MACOSX_DEPLOYMENT_TARGET'
 | |
| 
 | |
| 
 | |
| def _clear_cached_macosx_ver():
 | |
|     """For testing only. Do not call."""
 | |
|     global _syscfg_macosx_ver
 | |
|     _syscfg_macosx_ver = None
 | |
| 
 | |
| 
 | |
| def get_macosx_target_ver_from_syscfg():
 | |
|     """Get the version of macOS latched in the Python interpreter configuration.
 | |
|     Returns the version as a string or None if can't obtain one. Cached."""
 | |
|     global _syscfg_macosx_ver
 | |
|     if _syscfg_macosx_ver is None:
 | |
|         from distutils import sysconfig
 | |
| 
 | |
|         ver = sysconfig.get_config_var(MACOSX_VERSION_VAR) or ''
 | |
|         if ver:
 | |
|             _syscfg_macosx_ver = ver
 | |
|     return _syscfg_macosx_ver
 | |
| 
 | |
| 
 | |
| def get_macosx_target_ver():
 | |
|     """Return the version of macOS for which we are building.
 | |
| 
 | |
|     The target version defaults to the version in sysconfig latched at time
 | |
|     the Python interpreter was built, unless overridden by an environment
 | |
|     variable. If neither source has a value, then None is returned"""
 | |
| 
 | |
|     syscfg_ver = get_macosx_target_ver_from_syscfg()
 | |
|     env_ver = os.environ.get(MACOSX_VERSION_VAR)
 | |
| 
 | |
|     if env_ver:
 | |
|         # Validate overridden version against sysconfig version, if have both.
 | |
|         # Ensure that the deployment target of the build process is not less
 | |
|         # than 10.3 if the interpreter was built for 10.3 or later.  This
 | |
|         # ensures extension modules are built with correct compatibility
 | |
|         # values, specifically LDSHARED which can use
 | |
|         # '-undefined dynamic_lookup' which only works on >= 10.3.
 | |
|         if (
 | |
|             syscfg_ver
 | |
|             and split_version(syscfg_ver) >= [10, 3]
 | |
|             and split_version(env_ver) < [10, 3]
 | |
|         ):
 | |
|             my_msg = (
 | |
|                 '$' + MACOSX_VERSION_VAR + ' mismatch: '
 | |
|                 'now "%s" but "%s" during configure; '
 | |
|                 'must use 10.3 or later' % (env_ver, syscfg_ver)
 | |
|             )
 | |
|             raise DistutilsPlatformError(my_msg)
 | |
|         return env_ver
 | |
|     return syscfg_ver
 | |
| 
 | |
| 
 | |
| def split_version(s):
 | |
|     """Convert a dot-separated string into a list of numbers for comparisons"""
 | |
|     return [int(n) for n in s.split('.')]
 | |
| 
 | |
| 
 | |
| def convert_path(pathname):
 | |
|     """Return 'pathname' as a name that will work on the native filesystem,
 | |
|     i.e. split it on '/' and put it back together again using the current
 | |
|     directory separator.  Needed because filenames in the setup script are
 | |
|     always supplied in Unix style, and have to be converted to the local
 | |
|     convention before we can actually use them in the filesystem.  Raises
 | |
|     ValueError on non-Unix-ish systems if 'pathname' either starts or
 | |
|     ends with a slash.
 | |
|     """
 | |
|     if os.sep == '/':
 | |
|         return pathname
 | |
|     if not pathname:
 | |
|         return pathname
 | |
|     if pathname[0] == '/':
 | |
|         raise ValueError("path '%s' cannot be absolute" % pathname)
 | |
|     if pathname[-1] == '/':
 | |
|         raise ValueError("path '%s' cannot end with '/'" % pathname)
 | |
| 
 | |
|     paths = pathname.split('/')
 | |
|     while '.' in paths:
 | |
|         paths.remove('.')
 | |
|     if not paths:
 | |
|         return os.curdir
 | |
|     return os.path.join(*paths)
 | |
| 
 | |
| 
 | |
| # convert_path ()
 | |
| 
 | |
| 
 | |
| def change_root(new_root, pathname):
 | |
|     """Return 'pathname' with 'new_root' prepended.  If 'pathname' is
 | |
|     relative, this is equivalent to "os.path.join(new_root,pathname)".
 | |
|     Otherwise, it requires making 'pathname' relative and then joining the
 | |
|     two, which is tricky on DOS/Windows and Mac OS.
 | |
|     """
 | |
|     if os.name == 'posix':
 | |
|         if not os.path.isabs(pathname):
 | |
|             return os.path.join(new_root, pathname)
 | |
|         else:
 | |
|             return os.path.join(new_root, pathname[1:])
 | |
| 
 | |
|     elif os.name == 'nt':
 | |
|         (drive, path) = os.path.splitdrive(pathname)
 | |
|         if path[0] == '\\':
 | |
|             path = path[1:]
 | |
|         return os.path.join(new_root, path)
 | |
| 
 | |
|     raise DistutilsPlatformError(f"nothing known about platform '{os.name}'")
 | |
| 
 | |
| 
 | |
| @functools.lru_cache()
 | |
| def check_environ():
 | |
|     """Ensure that 'os.environ' has all the environment variables we
 | |
|     guarantee that users can use in config files, command-line options,
 | |
|     etc.  Currently this includes:
 | |
|       HOME - user's home directory (Unix only)
 | |
|       PLAT - description of the current platform, including hardware
 | |
|              and OS (see 'get_platform()')
 | |
|     """
 | |
|     if os.name == 'posix' and 'HOME' not in os.environ:
 | |
|         try:
 | |
|             import pwd
 | |
| 
 | |
|             os.environ['HOME'] = pwd.getpwuid(os.getuid())[5]
 | |
|         except (ImportError, KeyError):
 | |
|             # bpo-10496: if the current user identifier doesn't exist in the
 | |
|             # password database, do nothing
 | |
|             pass
 | |
| 
 | |
|     if 'PLAT' not in os.environ:
 | |
|         os.environ['PLAT'] = get_platform()
 | |
| 
 | |
| 
 | |
| def subst_vars(s, local_vars):
 | |
|     """
 | |
|     Perform variable substitution on 'string'.
 | |
|     Variables are indicated by format-style braces ("{var}").
 | |
|     Variable is substituted by the value found in the 'local_vars'
 | |
|     dictionary or in 'os.environ' if it's not in 'local_vars'.
 | |
|     'os.environ' is first checked/augmented to guarantee that it contains
 | |
|     certain values: see 'check_environ()'.  Raise ValueError for any
 | |
|     variables not found in either 'local_vars' or 'os.environ'.
 | |
|     """
 | |
|     check_environ()
 | |
|     lookup = dict(os.environ)
 | |
|     lookup.update((name, str(value)) for name, value in local_vars.items())
 | |
|     try:
 | |
|         return _subst_compat(s).format_map(lookup)
 | |
|     except KeyError as var:
 | |
|         raise ValueError(f"invalid variable {var}")
 | |
| 
 | |
| 
 | |
| def _subst_compat(s):
 | |
|     """
 | |
|     Replace shell/Perl-style variable substitution with
 | |
|     format-style. For compatibility.
 | |
|     """
 | |
| 
 | |
|     def _subst(match):
 | |
|         return f'{{{match.group(1)}}}'
 | |
| 
 | |
|     repl = re.sub(r'\$([a-zA-Z_][a-zA-Z_0-9]*)', _subst, s)
 | |
|     if repl != s:
 | |
|         import warnings
 | |
| 
 | |
|         warnings.warn(
 | |
|             "shell/Perl-style substitions are deprecated",
 | |
|             DeprecationWarning,
 | |
|         )
 | |
|     return repl
 | |
| 
 | |
| 
 | |
| def grok_environment_error(exc, prefix="error: "):
 | |
|     # Function kept for backward compatibility.
 | |
|     # Used to try clever things with EnvironmentErrors,
 | |
|     # but nowadays str(exception) produces good messages.
 | |
|     return prefix + str(exc)
 | |
| 
 | |
| 
 | |
| # Needed by 'split_quoted()'
 | |
| _wordchars_re = _squote_re = _dquote_re = None
 | |
| 
 | |
| 
 | |
| def _init_regex():
 | |
|     global _wordchars_re, _squote_re, _dquote_re
 | |
|     _wordchars_re = re.compile(r'[^\\\'\"%s ]*' % string.whitespace)
 | |
|     _squote_re = re.compile(r"'(?:[^'\\]|\\.)*'")
 | |
|     _dquote_re = re.compile(r'"(?:[^"\\]|\\.)*"')
 | |
| 
 | |
| 
 | |
| def split_quoted(s):
 | |
|     """Split a string up according to Unix shell-like rules for quotes and
 | |
|     backslashes.  In short: words are delimited by spaces, as long as those
 | |
|     spaces are not escaped by a backslash, or inside a quoted string.
 | |
|     Single and double quotes are equivalent, and the quote characters can
 | |
|     be backslash-escaped.  The backslash is stripped from any two-character
 | |
|     escape sequence, leaving only the escaped character.  The quote
 | |
|     characters are stripped from any quoted string.  Returns a list of
 | |
|     words.
 | |
|     """
 | |
| 
 | |
|     # This is a nice algorithm for splitting up a single string, since it
 | |
|     # doesn't require character-by-character examination.  It was a little
 | |
|     # bit of a brain-bender to get it working right, though...
 | |
|     if _wordchars_re is None:
 | |
|         _init_regex()
 | |
| 
 | |
|     s = s.strip()
 | |
|     words = []
 | |
|     pos = 0
 | |
| 
 | |
|     while s:
 | |
|         m = _wordchars_re.match(s, pos)
 | |
|         end = m.end()
 | |
|         if end == len(s):
 | |
|             words.append(s[:end])
 | |
|             break
 | |
| 
 | |
|         if s[end] in string.whitespace:
 | |
|             # unescaped, unquoted whitespace: now
 | |
|             # we definitely have a word delimiter
 | |
|             words.append(s[:end])
 | |
|             s = s[end:].lstrip()
 | |
|             pos = 0
 | |
| 
 | |
|         elif s[end] == '\\':
 | |
|             # preserve whatever is being escaped;
 | |
|             # will become part of the current word
 | |
|             s = s[:end] + s[end + 1 :]
 | |
|             pos = end + 1
 | |
| 
 | |
|         else:
 | |
|             if s[end] == "'":  # slurp singly-quoted string
 | |
|                 m = _squote_re.match(s, end)
 | |
|             elif s[end] == '"':  # slurp doubly-quoted string
 | |
|                 m = _dquote_re.match(s, end)
 | |
|             else:
 | |
|                 raise RuntimeError("this can't happen (bad char '%c')" % s[end])
 | |
| 
 | |
|             if m is None:
 | |
|                 raise ValueError("bad string (mismatched %s quotes?)" % s[end])
 | |
| 
 | |
|             (beg, end) = m.span()
 | |
|             s = s[:beg] + s[beg + 1 : end - 1] + s[end:]
 | |
|             pos = m.end() - 2
 | |
| 
 | |
|         if pos >= len(s):
 | |
|             words.append(s)
 | |
|             break
 | |
| 
 | |
|     return words
 | |
| 
 | |
| 
 | |
| # split_quoted ()
 | |
| 
 | |
| 
 | |
| def execute(func, args, msg=None, verbose=0, dry_run=0):
 | |
|     """Perform some action that affects the outside world (eg.  by
 | |
|     writing to the filesystem).  Such actions are special because they
 | |
|     are disabled by the 'dry_run' flag.  This method takes care of all
 | |
|     that bureaucracy for you; all you have to do is supply the
 | |
|     function to call and an argument tuple for it (to embody the
 | |
|     "external action" being performed), and an optional message to
 | |
|     print.
 | |
|     """
 | |
|     if msg is None:
 | |
|         msg = "{}{!r}".format(func.__name__, args)
 | |
|         if msg[-2:] == ',)':  # correct for singleton tuple
 | |
|             msg = msg[0:-2] + ')'
 | |
| 
 | |
|     log.info(msg)
 | |
|     if not dry_run:
 | |
|         func(*args)
 | |
| 
 | |
| 
 | |
| def strtobool(val):
 | |
|     """Convert a string representation of truth to true (1) or false (0).
 | |
| 
 | |
|     True values are 'y', 'yes', 't', 'true', 'on', and '1'; false values
 | |
|     are 'n', 'no', 'f', 'false', 'off', and '0'.  Raises ValueError if
 | |
|     'val' is anything else.
 | |
|     """
 | |
|     val = val.lower()
 | |
|     if val in ('y', 'yes', 't', 'true', 'on', '1'):
 | |
|         return 1
 | |
|     elif val in ('n', 'no', 'f', 'false', 'off', '0'):
 | |
|         return 0
 | |
|     else:
 | |
|         raise ValueError("invalid truth value {!r}".format(val))
 | |
| 
 | |
| 
 | |
| def byte_compile(  # noqa: C901
 | |
|     py_files,
 | |
|     optimize=0,
 | |
|     force=0,
 | |
|     prefix=None,
 | |
|     base_dir=None,
 | |
|     verbose=1,
 | |
|     dry_run=0,
 | |
|     direct=None,
 | |
| ):
 | |
|     """Byte-compile a collection of Python source files to .pyc
 | |
|     files in a __pycache__ subdirectory.  'py_files' is a list
 | |
|     of files to compile; any files that don't end in ".py" are silently
 | |
|     skipped.  'optimize' must be one of the following:
 | |
|       0 - don't optimize
 | |
|       1 - normal optimization (like "python -O")
 | |
|       2 - extra optimization (like "python -OO")
 | |
|     If 'force' is true, all files are recompiled regardless of
 | |
|     timestamps.
 | |
| 
 | |
|     The source filename encoded in each bytecode file defaults to the
 | |
|     filenames listed in 'py_files'; you can modify these with 'prefix' and
 | |
|     'basedir'.  'prefix' is a string that will be stripped off of each
 | |
|     source filename, and 'base_dir' is a directory name that will be
 | |
|     prepended (after 'prefix' is stripped).  You can supply either or both
 | |
|     (or neither) of 'prefix' and 'base_dir', as you wish.
 | |
| 
 | |
|     If 'dry_run' is true, doesn't actually do anything that would
 | |
|     affect the filesystem.
 | |
| 
 | |
|     Byte-compilation is either done directly in this interpreter process
 | |
|     with the standard py_compile module, or indirectly by writing a
 | |
|     temporary script and executing it.  Normally, you should let
 | |
|     'byte_compile()' figure out to use direct compilation or not (see
 | |
|     the source for details).  The 'direct' flag is used by the script
 | |
|     generated in indirect mode; unless you know what you're doing, leave
 | |
|     it set to None.
 | |
|     """
 | |
| 
 | |
|     # nothing is done if sys.dont_write_bytecode is True
 | |
|     if sys.dont_write_bytecode:
 | |
|         raise DistutilsByteCompileError('byte-compiling is disabled.')
 | |
| 
 | |
|     # First, if the caller didn't force us into direct or indirect mode,
 | |
|     # figure out which mode we should be in.  We take a conservative
 | |
|     # approach: choose direct mode *only* if the current interpreter is
 | |
|     # in debug mode and optimize is 0.  If we're not in debug mode (-O
 | |
|     # or -OO), we don't know which level of optimization this
 | |
|     # interpreter is running with, so we can't do direct
 | |
|     # byte-compilation and be certain that it's the right thing.  Thus,
 | |
|     # always compile indirectly if the current interpreter is in either
 | |
|     # optimize mode, or if either optimization level was requested by
 | |
|     # the caller.
 | |
|     if direct is None:
 | |
|         direct = __debug__ and optimize == 0
 | |
| 
 | |
|     # "Indirect" byte-compilation: write a temporary script and then
 | |
|     # run it with the appropriate flags.
 | |
|     if not direct:
 | |
|         try:
 | |
|             from tempfile import mkstemp
 | |
| 
 | |
|             (script_fd, script_name) = mkstemp(".py")
 | |
|         except ImportError:
 | |
|             from tempfile import mktemp
 | |
| 
 | |
|             (script_fd, script_name) = None, mktemp(".py")
 | |
|         log.info("writing byte-compilation script '%s'", script_name)
 | |
|         if not dry_run:
 | |
|             if script_fd is not None:
 | |
|                 script = os.fdopen(script_fd, "w")
 | |
|             else:
 | |
|                 script = open(script_name, "w")
 | |
| 
 | |
|             with script:
 | |
|                 script.write(
 | |
|                     """\
 | |
| from distutils.util import byte_compile
 | |
| files = [
 | |
| """
 | |
|                 )
 | |
| 
 | |
|                 # XXX would be nice to write absolute filenames, just for
 | |
|                 # safety's sake (script should be more robust in the face of
 | |
|                 # chdir'ing before running it).  But this requires abspath'ing
 | |
|                 # 'prefix' as well, and that breaks the hack in build_lib's
 | |
|                 # 'byte_compile()' method that carefully tacks on a trailing
 | |
|                 # slash (os.sep really) to make sure the prefix here is "just
 | |
|                 # right".  This whole prefix business is rather delicate -- the
 | |
|                 # problem is that it's really a directory, but I'm treating it
 | |
|                 # as a dumb string, so trailing slashes and so forth matter.
 | |
| 
 | |
|                 script.write(",\n".join(map(repr, py_files)) + "]\n")
 | |
|                 script.write(
 | |
|                     """
 | |
| byte_compile(files, optimize=%r, force=%r,
 | |
|              prefix=%r, base_dir=%r,
 | |
|              verbose=%r, dry_run=0,
 | |
|              direct=1)
 | |
| """
 | |
|                     % (optimize, force, prefix, base_dir, verbose)
 | |
|                 )
 | |
| 
 | |
|         cmd = [sys.executable]
 | |
|         cmd.extend(subprocess._optim_args_from_interpreter_flags())
 | |
|         cmd.append(script_name)
 | |
|         spawn(cmd, dry_run=dry_run)
 | |
|         execute(os.remove, (script_name,), "removing %s" % script_name, dry_run=dry_run)
 | |
| 
 | |
|     # "Direct" byte-compilation: use the py_compile module to compile
 | |
|     # right here, right now.  Note that the script generated in indirect
 | |
|     # mode simply calls 'byte_compile()' in direct mode, a weird sort of
 | |
|     # cross-process recursion.  Hey, it works!
 | |
|     else:
 | |
|         from py_compile import compile
 | |
| 
 | |
|         for file in py_files:
 | |
|             if file[-3:] != ".py":
 | |
|                 # This lets us be lazy and not filter filenames in
 | |
|                 # the "install_lib" command.
 | |
|                 continue
 | |
| 
 | |
|             # Terminology from the py_compile module:
 | |
|             #   cfile - byte-compiled file
 | |
|             #   dfile - purported source filename (same as 'file' by default)
 | |
|             if optimize >= 0:
 | |
|                 opt = '' if optimize == 0 else optimize
 | |
|                 cfile = importlib.util.cache_from_source(file, optimization=opt)
 | |
|             else:
 | |
|                 cfile = importlib.util.cache_from_source(file)
 | |
|             dfile = file
 | |
|             if prefix:
 | |
|                 if file[: len(prefix)] != prefix:
 | |
|                     raise ValueError(
 | |
|                         "invalid prefix: filename %r doesn't start with %r"
 | |
|                         % (file, prefix)
 | |
|                     )
 | |
|                 dfile = dfile[len(prefix) :]
 | |
|             if base_dir:
 | |
|                 dfile = os.path.join(base_dir, dfile)
 | |
| 
 | |
|             cfile_base = os.path.basename(cfile)
 | |
|             if direct:
 | |
|                 if force or newer(file, cfile):
 | |
|                     log.info("byte-compiling %s to %s", file, cfile_base)
 | |
|                     if not dry_run:
 | |
|                         compile(file, cfile, dfile)
 | |
|                 else:
 | |
|                     log.debug("skipping byte-compilation of %s to %s", file, cfile_base)
 | |
| 
 | |
| 
 | |
| def rfc822_escape(header):
 | |
|     """Return a version of the string escaped for inclusion in an
 | |
|     RFC-822 header, by ensuring there are 8 spaces space after each newline.
 | |
|     """
 | |
|     lines = header.split('\n')
 | |
|     sep = '\n' + 8 * ' '
 | |
|     return sep.join(lines)
 | 
