# Copyright 2014 Pants project contributors (see CONTRIBUTORS.md).
# Licensed under the Apache License, Version 2.0 (see LICENSE).
from __future__ import absolute_import
import json
import os
from pex import pex_warnings
from pex.common import can_write_dir, open_zip, safe_mkdtemp
from pex.compatibility import PY2
from pex.compatibility import string as compatibility_string
from pex.inherit_path import InheritPath
from pex.orderedset import OrderedSet
from pex.typing import TYPE_CHECKING
from pex.variables import ENV, Variables
from pex.version import __version__ as pex_version
if TYPE_CHECKING:
from pex.interpreter import PythonInterpreter
from typing import Any, Mapping, Optional, Text, Union
# TODO(wickman) Split this into a PexInfoBuilder/PexInfo to ensure immutability.
# Issue #92.
class PexInfo(object):
"""PEX metadata.
# Build metadata:
build_properties: BuildProperties # (key-value information about the build system)
code_hash: str # sha1 hash of all names/code in the archive
distributions: {dist_name: str} # map from distribution name (i.e. path in
# the internal cache) to its cache key (sha1)
requirements: list # list of requirements for this environment
# Environment options
pex_root: string # root of all pex-related files eg: ~/.pex
entry_point: string # entry point into this pex
script: string # script to execute in this pex environment
# at most one of script/entry_point can be specified
zip_safe: bool, default True # is this pex zip safe?
unzip: bool, default False # should this pex be unzipped and re-executed from there?
inherit_path: false/fallback/prefer # should this pex inherit site-packages + user site-packages
# + PYTHONPATH?
ignore_errors: bool, default False # should we ignore inability to resolve dependencies?
always_write_cache: bool, default False # should we always write the internal cache to disk first?
# this is useful if you have very large dependencies that
# do not fit in RAM constrained environments
.. versionchanged:: 0.8
Removed the ``repositories`` and ``indices`` information, as they were never
implemented.
"""
PATH = "PEX-INFO"
INSTALL_CACHE = "installed_wheels"
@classmethod
def make_build_properties(cls, interpreter=None):
    """Describe the interpreter and Pex version used to build a PEX.

    :param interpreter: The interpreter to describe. When it is not given (or is falsy), the
      result of ``PythonInterpreter.get()`` is described instead.
    :returns: A dict with the keys ``pex_version``, ``class``, ``version`` and ``platform``.
    """
    # The import is deliberately local. PexInfo is read by the PEX bootstrap at runtime to decide
    # whether to re-exec in `--unzip` mode, while this method is only used at PEX buildtime.
    # PythonInterpreter's transitive imports are large and slow, so runtime-only users should not
    # pay for them.
    #
    # See: https://github.com/pantsbuild/pex/issues/1054
    from pex.interpreter import PythonInterpreter

    chosen = interpreter or PythonInterpreter.get()
    platform_name = chosen.platform.platform
    identity = chosen.identity
    return {
        "pex_version": pex_version,
        "class": identity.interpreter,
        "version": identity.version,
        "platform": platform_name,
    }
@classmethod
def default(cls, interpreter=None):
    # type: (Optional[PythonInterpreter]) -> PexInfo
    """Create a PexInfo with no requirements or distributions and fresh build properties.

    :param interpreter: Forwarded to :meth:`make_build_properties`.
    :returns: A new instance seeded with empty ``requirements`` and ``distributions``.
    """
    build_properties = cls.make_build_properties(interpreter)
    seed = {"requirements": [], "distributions": {}}
    seed["build_properties"] = build_properties
    return cls(info=seed)
@classmethod
def from_pex(cls, pex):
    # type: (str) -> PexInfo
    """Load the PexInfo stored inside a PEX.

    :param pex: Path to the PEX. A regular file is opened as a zip archive; any other path is
      treated as a directory that directly contains the ``PEX-INFO`` file.
    :returns: The PexInfo parsed from the PEX's ``PEX-INFO`` content.
    """
    if os.path.isfile(pex):
        with open_zip(pex) as zf:
            pex_info = zf.read(cls.PATH)
    else:
        # Read raw bytes so that, exactly like the zip branch above, the content is decoded as
        # UTF-8 by `from_json` instead of with the platform's default text encoding.
        with open(os.path.join(pex, cls.PATH), "rb") as fp:
            pex_info = fp.read()
    return cls.from_json(pex_info)
@classmethod
def from_json(cls, content):
    # type: (Union[bytes, Text]) -> PexInfo
    """Build a PexInfo from its JSON serialization.

    :param content: The JSON document, either as text or as UTF-8 encoded bytes.
    :returns: A new instance seeded with the decoded JSON value.
    """
    text = content.decode("utf-8") if isinstance(content, bytes) else content
    parsed = json.loads(text)
    return cls(info=parsed)
@classmethod
def from_env(cls, env=ENV):
    # type: (Variables) -> PexInfo
    """Build a PexInfo holding only the settings explicitly present in the environment.

    :param env: The variables to read the ``PEX_*`` settings from.
    :returns: A new instance seeded with every setting whose value is not ``None``.
    """
    force_local = Variables.PEX_FORCE_LOCAL.strip_default(env)
    if force_local is None:
        zip_safe = None
    else:
        # Forcing local (unpacked) execution is the opposite of being zip safe.
        zip_safe = not force_local

    inherit_setting = Variables.PEX_INHERIT_PATH.strip_default(env)
    if inherit_setting is None:
        inherit_path = None
    else:
        inherit_path = inherit_setting.value

    candidates = {
        "pex_root": Variables.PEX_ROOT.strip_default(env),
        "entry_point": env.PEX_MODULE,
        "script": env.PEX_SCRIPT,
        "zip_safe": zip_safe,
        "unzip": Variables.PEX_UNZIP.strip_default(env),
        "inherit_path": inherit_path,
        "ignore_errors": Variables.PEX_IGNORE_ERRORS.strip_default(env),
        "always_write_cache": Variables.PEX_ALWAYS_CACHE.strip_default(env),
    }
    # Drop the entries that were not explicitly set in the environment.
    explicit = {key: value for key, value in candidates.items() if value is not None}
    return cls(info=explicit)
@classmethod
def _parse_requirement_tuple(cls, requirement_tuple):
    """Normalize one stored requirement entry to its requirement string.

    :param requirement_tuple: Either a requirement string, or a 3 item tuple/list in the
      pre 0.8.x format whose first item is the requirement string.
    :returns: The requirement string.
    :raises ValueError: If the entry is neither a string nor a 3 item tuple/list.
    """
    if isinstance(requirement_tuple, compatibility_string):
        return requirement_tuple

    is_legacy_entry = isinstance(requirement_tuple, (tuple, list))
    if not is_legacy_entry or len(requirement_tuple) != 3:
        raise ValueError("Malformed PEX requirement: %r" % (requirement_tuple,))

    # pre 0.8.x requirement type:
    pex_warnings.warn("Attempting to use deprecated PEX feature. Please upgrade past PEX 0.8.x.")
    return requirement_tuple[0]
def __init__(self, info=None):
    # type: (Optional[Mapping[str, Any]]) -> None
    """Construct a new PexInfo.

    This should not be used directly.

    :param info: An optional dict of PEX-INFO values to seed this instance with.
    :raises ValueError: If ``info`` is not a dict, if its ``requirements`` entry is not a list or
      tuple, or if any individual requirement entry is malformed.
    """
    if not (info is None or isinstance(info, dict)):
        raise ValueError(
            "PexInfo can only be seeded with a dict, got: %s of type %s" % (info, type(info))
        )

    # Shallow copy of the seed; nested values are still shared with the caller's dict.
    seed = {}
    if info:
        seed = dict(info)
    self._pex_info = seed
    self._distributions = seed.get("distributions", {})

    # Stored as a set: pex info loaded from json carries interpreter_constraints as a list.
    self._interpreter_constraints = set(seed.get("interpreter_constraints", set()))

    raw_requirements = seed.get("requirements", [])
    if not isinstance(raw_requirements, (list, tuple)):
        raise ValueError("Expected requirements to be a list, got %s" % type(raw_requirements))
    self._requirements = OrderedSet(
        self._parse_requirement_tuple(entry) for entry in raw_requirements
    )
def _get_safe(self, key):
    """Return the stored value for ``key``, encoded as UTF-8 bytes under Python 2.

    :param key: The PEX-INFO key to look up.
    :returns: ``None`` when the key is absent or its stored value is ``None``; otherwise the
      stored value (UTF-8 encoded when running under Python 2).
    """
    value = self._pex_info.get(key)
    if value is None:
        # The key may be present with an explicit None (the setters accept any value); there is
        # nothing to encode in that case.
        return None
    return value.encode("utf-8") if PY2 else value
@property
def build_properties(self):
    """Information about the system on which this PEX was generated.

    :returns: A dictionary containing metadata about the environment used to build this PEX;
      an empty dictionary when none has been recorded.
    """
    info = self._pex_info
    return info["build_properties"] if "build_properties" in info else {}

@build_properties.setter
def build_properties(self, value):
    """Store freshly computed build properties overlaid with the entries in ``value``.

    :raises TypeError: If ``value`` is not a dictionary.
    """
    if not isinstance(value, dict):
        raise TypeError("build_properties must be a dictionary!")
    merged = self.make_build_properties()
    merged.update(value)
    self._pex_info["build_properties"] = merged
@property
def zip_safe(self):
    """Whether or not this PEX should be treated as zip-safe.

    If set to false and the PEX is zipped, the contents of the PEX will be unpacked into a
    directory within the PEX_ROOT prior to execution. This allows code and frameworks depending
    upon __file__ existing on disk to operate normally.

    By default zip_safe is True. May be overridden at runtime by the $PEX_FORCE_LOCAL
    environment variable.
    """
    info = self._pex_info
    return info["zip_safe"] if "zip_safe" in info else True

@zip_safe.setter
def zip_safe(self, value):
    """Record the zip-safe flag, coerced to a bool."""
    self._pex_info["zip_safe"] = True if value else False
@property
def unzip(self):
    """Whether or not PEX should be unzipped before it's executed.

    Unzipping a PEX is an operation that can be cached on the 1st run of a given PEX file which
    can result in lower startup latency in subsequent runs.

    Defaults to False.
    """
    try:
        return self._pex_info["unzip"]
    except KeyError:
        return False

@unzip.setter
def unzip(self, value):
    """Record the unzip flag, coerced to a bool."""
    flag = bool(value)
    self._pex_info["unzip"] = flag
@property
def strip_pex_env(self):
    """Whether or not this PEX should strip `PEX_*` env vars before executing its entrypoint.

    You might want to set this to `False` if this PEX executes other PEXes or the Pex CLI itself
    and you want the executed PEX to be controlled via PEX environment variables.

    Defaults to True.
    """
    info = self._pex_info
    if "strip_pex_env" in info:
        return info["strip_pex_env"]
    return True

@strip_pex_env.setter
def strip_pex_env(self, value):
    """Record the strip flag, coerced to a bool."""
    self._pex_info["strip_pex_env"] = True if value else False
@property
def pex_path(self):
    """A colon separated list of other pex files to merge into the runtime environment.

    This pex info property is used to persist the PEX_PATH environment variable into the pex
    info metadata for reuse within a built pex.

    :returns: The stored value, or ``None`` when none has been recorded.
    """
    info = self._pex_info
    return info["pex_path"] if "pex_path" in info else None

@pex_path.setter
def pex_path(self, value):
    """Store ``value`` as the pex path without any validation or conversion."""
    self._pex_info.update({"pex_path": value})
@property
def inherit_path(self):
    # type: () -> InheritPath.Value
    """Whether or not this PEX should be allowed to inherit system dependencies.

    By default, PEX environments are scrubbed of all system distributions prior to execution.
    This means that PEX files cannot rely upon preexisting system libraries.

    By default inherit_path is false. This may be overridden at runtime by the $PEX_INHERIT_PATH
    environment variable.
    """
    stored = self._pex_info.get("inherit_path")
    if not stored:
        # Missing and falsy stored values both mean "do not inherit".
        return InheritPath.FALSE
    return InheritPath.for_value(stored)

@inherit_path.setter
def inherit_path(self, value):
    # type: (InheritPath.Value) -> None
    """Store the underlying ``value`` attribute of the given inherit path setting."""
    raw = value.value
    self._pex_info["inherit_path"] = raw
@property
def interpreter_constraints(self):
    """A list of constraints that determine the interpreter compatibility for this pex, using
    the Requirement-style format, e.g. ``'CPython>=3', or just '>=2.7,<3'`` for requirements
    agnostic to interpreter class.

    This property will be used at exec time when bootstrapping a pex to search PEX_PYTHON_PATH
    for a list of compatible interpreters.

    :returns: A new list on every access; mutating it does not affect this PexInfo.
    """
    constraints = self._interpreter_constraints
    return list(constraints)
def add_interpreter_constraint(self, value):
    """Add an interpreter constraint, stored as its ``str()`` form.

    :param value: The constraint to add; duplicates are collapsed.
    """
    constraint = str(value)
    self._interpreter_constraints.add(constraint)
@property
def ignore_errors(self):
    """Whether the inability to resolve dependencies should be ignored; defaults to False."""
    try:
        return self._pex_info["ignore_errors"]
    except KeyError:
        return False

@ignore_errors.setter
def ignore_errors(self, value):
    """Record the ignore-errors flag, coerced to a bool."""
    self._pex_info["ignore_errors"] = True if value else False
@property
def emit_warnings(self):
    """The stored ``emit_warnings`` flag; defaults to True when it has not been set."""
    info = self._pex_info
    return info["emit_warnings"] if "emit_warnings" in info else True

@emit_warnings.setter
def emit_warnings(self, value):
    """Record the emit-warnings flag, coerced to a bool."""
    flag = bool(value)
    self._pex_info["emit_warnings"] = flag
@property
def code_hash(self):
    """The stored ``code_hash`` value, or ``None`` when it has not been set."""
    info = self._pex_info
    return info["code_hash"] if "code_hash" in info else None

@code_hash.setter
def code_hash(self, value):
    """Store ``value`` as the code hash without any validation or conversion."""
    self._pex_info.update({"code_hash": value})
@property
def entry_point(self):
    """The entry point into this pex, looked up through ``_get_safe``."""
    key = "entry_point"
    return self._get_safe(key)

@entry_point.setter
def entry_point(self, value):
    """Store ``value`` as the entry point without any validation or conversion."""
    self._pex_info.update({"entry_point": value})
@property
def script(self):
    """The script to execute in this pex environment, looked up through ``_get_safe``."""
    key = "script"
    return self._get_safe(key)

@script.setter
def script(self, value):
    """Store ``value`` as the script without any validation or conversion."""
    self._pex_info.update({"script": value})
def add_requirement(self, requirement):
    """Add a requirement, stored as its ``str()`` form.

    :param requirement: The requirement to record for this environment.
    """
    requirement_string = str(requirement)
    self._requirements.add(requirement_string)
@property
def requirements(self):
    """The requirements recorded for this environment.

    :returns: The internal collection itself, not a copy.
    """
    recorded = self._requirements
    return recorded
def add_distribution(self, location, sha):
    """Record a distribution, replacing any existing entry for the same location.

    :param location: The distribution name (i.e. its path in the internal cache).
    :param sha: The cache key to associate with the distribution.
    """
    self._distributions.update({location: sha})
@property
def distributions(self):
    """The map from distribution name to its cache key.

    :returns: The internal dictionary itself, not a copy.
    """
    recorded = self._distributions
    return recorded
@property
def always_write_cache(self):
    """Whether the internal cache should always be written to disk first; defaults to False."""
    info = self._pex_info
    if "always_write_cache" in info:
        return info["always_write_cache"]
    return False

@always_write_cache.setter
def always_write_cache(self, value):
    """Record the always-write-cache flag, coerced to a bool."""
    self._pex_info["always_write_cache"] = True if value else False
@property
def pex_root(self):
    """The root directory of all pex-related files, with ``~`` expanded.

    Defaults to ``~/.pex``. When the configured directory cannot be written, a warning is
    emitted and a temporary directory is created, stored as the new ``pex_root`` and returned
    instead.
    """
    configured = self._pex_info.get("pex_root", os.path.join("~", ".pex"))
    root = os.path.expanduser(configured)
    if can_write_dir(root):
        return root

    fallback = safe_mkdtemp()
    pex_warnings.warn(
        "PEX_ROOT is configured as {pex_root} but that path is un-writeable, "
        "falling back to a temporary PEX_ROOT of {tmp_root} which will hurt "
        "performance.".format(pex_root=root, tmp_root=fallback)
    )
    # Remember the fallback so later accesses reuse it.
    self._pex_info["pex_root"] = fallback
    return fallback

@pex_root.setter
def pex_root(self, value):
    """Store ``value`` as the pex root; ``None`` removes any stored value instead."""
    if value is not None:
        self._pex_info["pex_root"] = value
        return
    self._pex_info.pop("pex_root", None)
@property
def internal_cache(self):
    """The name of the internal cache directory; always ``.deps``."""
    return ".deps"
@property
def install_cache(self):
    """The ``INSTALL_CACHE`` directory path underneath :attr:`pex_root`."""
    root = self.pex_root
    return os.path.join(root, self.INSTALL_CACHE)
@property
def zip_unsafe_cache(self):
    """The ``code`` directory path underneath :attr:`pex_root`."""
    root = self.pex_root
    return os.path.join(root, "code")
def update(self, other):
    """Merge another PexInfo into this one, in place.

    The raw info values, distributions, interpreter constraints and requirements of ``other``
    are each merged into their counterpart on this instance.

    :param other: The PexInfo to merge in.
    :raises TypeError: If ``other`` is not a PexInfo.
    """
    if not isinstance(other, PexInfo):
        raise TypeError("Cannot merge a %r with PexInfo" % type(other))

    merges = (
        (self._pex_info, other._pex_info),
        (self._distributions, other.distributions),
        (self._interpreter_constraints, other.interpreter_constraints),
        (self._requirements, other.requirements),
    )
    for target, incoming in merges:
        target.update(incoming)
def dump(self, sort_keys=False):
    # type: (bool) -> str
    """Serialize this PexInfo to a JSON string.

    The stored info is copied and then overlaid with the current inherit path value, the sorted
    requirements, the sorted interpreter constraints and a copy of the distributions.

    :param sort_keys: Passed through to ``json.dumps``.
    :returns: The JSON document.
    """
    serializable = dict(self._pex_info)
    serializable.update(
        inherit_path=self.inherit_path.value,
        requirements=sorted(self._requirements),
        interpreter_constraints=sorted(self._interpreter_constraints),
        distributions=self._distributions.copy(),
    )
    return json.dumps(serializable, sort_keys=sort_keys)
def copy(self):
    """Return a new instance built by passing the output of ``dump`` to ``from_json``."""
    serialized = self.dump()
    return type(self).from_json(serialized)
@staticmethod
def _merge_split(*paths):
    """Flatten colon separated path strings into a single list of non-empty entries.

    :param paths: Colon separated path strings; falsy items (``None``, ``""``) are skipped.
    :returns: Every non-empty entry, in the order given.
    """
    joined = ":".join(path for path in paths if path)
    return [entry for entry in joined.split(":") if entry]
def merge_pex_path(self, pex_path):
    """Merges a new PEX_PATH definition into the existing one (if any).

    The existing and new values are split on ``:``, empty entries are dropped, and the result is
    stored back as a single ``:`` joined string. A falsy ``pex_path`` leaves this PexInfo
    untouched.

    :param str pex_path: The PEX_PATH to merge.
    """
    if not pex_path:
        return
    self.pex_path = ":".join(self._merge_split(self.pex_path, pex_path))
def __repr__(self):
    """Render as ``<class name>(<repr of the stored info dict>)``."""
    class_name = type(self).__name__
    return "%s(%r)" % (class_name, self._pex_info)