Spaces:
Runtime error
Runtime error
"""Prepares a distribution for installation | |
""" | |
# The following comment should be removed at some point in the future. | |
# mypy: strict-optional=False | |
import logging | |
import mimetypes | |
import os | |
import shutil | |
from typing import Dict, Iterable, List, Optional, Tuple | |
from pip._vendor.packaging.utils import canonicalize_name | |
from pip._vendor.pkg_resources import Distribution | |
from pip._internal.distributions import make_distribution_for_install_requirement | |
from pip._internal.distributions.installed import InstalledDistribution | |
from pip._internal.exceptions import ( | |
DirectoryUrlHashUnsupported, | |
HashMismatch, | |
HashUnpinned, | |
InstallationError, | |
NetworkConnectionError, | |
PreviousBuildDirError, | |
VcsHashUnsupported, | |
) | |
from pip._internal.index.package_finder import PackageFinder | |
from pip._internal.models.link import Link | |
from pip._internal.models.wheel import Wheel | |
from pip._internal.network.download import BatchDownloader, Downloader | |
from pip._internal.network.lazy_wheel import ( | |
HTTPRangeRequestUnsupported, | |
dist_from_wheel_url, | |
) | |
from pip._internal.network.session import PipSession | |
from pip._internal.req.req_install import InstallRequirement | |
from pip._internal.req.req_tracker import RequirementTracker | |
from pip._internal.utils.deprecation import deprecated | |
from pip._internal.utils.filesystem import copy2_fixed | |
from pip._internal.utils.hashes import Hashes, MissingHashes | |
from pip._internal.utils.logging import indent_log | |
from pip._internal.utils.misc import display_path, hide_url, is_installable_dir, rmtree | |
from pip._internal.utils.temp_dir import TempDirectory | |
from pip._internal.utils.unpacking import unpack_file | |
from pip._internal.vcs import vcs | |
logger = logging.getLogger(__name__) | |
def _get_prepared_distribution( | |
req, # type: InstallRequirement | |
req_tracker, # type: RequirementTracker | |
finder, # type: PackageFinder | |
build_isolation, # type: bool | |
): | |
# type: (...) -> Distribution | |
"""Prepare a distribution for installation.""" | |
abstract_dist = make_distribution_for_install_requirement(req) | |
with req_tracker.track(req): | |
abstract_dist.prepare_distribution_metadata(finder, build_isolation) | |
return abstract_dist.get_pkg_resources_distribution() | |
def unpack_vcs_link(link, location): | |
# type: (Link, str) -> None | |
vcs_backend = vcs.get_backend_for_scheme(link.scheme) | |
assert vcs_backend is not None | |
vcs_backend.unpack(location, url=hide_url(link.url)) | |
class File: | |
def __init__(self, path, content_type): | |
# type: (str, Optional[str]) -> None | |
self.path = path | |
if content_type is None: | |
self.content_type = mimetypes.guess_type(path)[0] | |
else: | |
self.content_type = content_type | |
def get_http_url( | |
link, # type: Link | |
download, # type: Downloader | |
download_dir=None, # type: Optional[str] | |
hashes=None, # type: Optional[Hashes] | |
): | |
# type: (...) -> File | |
temp_dir = TempDirectory(kind="unpack", globally_managed=True) | |
# If a download dir is specified, is the file already downloaded there? | |
already_downloaded_path = None | |
if download_dir: | |
already_downloaded_path = _check_download_dir( | |
link, download_dir, hashes | |
) | |
if already_downloaded_path: | |
from_path = already_downloaded_path | |
content_type = None | |
else: | |
# let's download to a tmp dir | |
from_path, content_type = download(link, temp_dir.path) | |
if hashes: | |
hashes.check_against_path(from_path) | |
return File(from_path, content_type) | |
def _copy2_ignoring_special_files(src, dest): | |
# type: (str, str) -> None | |
"""Copying special files is not supported, but as a convenience to users | |
we skip errors copying them. This supports tools that may create e.g. | |
socket files in the project source directory. | |
""" | |
try: | |
copy2_fixed(src, dest) | |
except shutil.SpecialFileError as e: | |
# SpecialFileError may be raised due to either the source or | |
# destination. If the destination was the cause then we would actually | |
# care, but since the destination directory is deleted prior to | |
# copy we ignore all of them assuming it is caused by the source. | |
logger.warning( | |
"Ignoring special file error '%s' encountered copying %s to %s.", | |
str(e), | |
src, | |
dest, | |
) | |
def _copy_source_tree(source, target): | |
# type: (str, str) -> None | |
target_abspath = os.path.abspath(target) | |
target_basename = os.path.basename(target_abspath) | |
target_dirname = os.path.dirname(target_abspath) | |
def ignore(d, names): | |
# type: (str, List[str]) -> List[str] | |
skipped = [] # type: List[str] | |
if d == source: | |
# Pulling in those directories can potentially be very slow, | |
# exclude the following directories if they appear in the top | |
# level dir (and only it). | |
# See discussion at https://github.com/pypa/pip/pull/6770 | |
skipped += ['.tox', '.nox'] | |
if os.path.abspath(d) == target_dirname: | |
# Prevent an infinite recursion if the target is in source. | |
# This can happen when TMPDIR is set to ${PWD}/... | |
# and we copy PWD to TMPDIR. | |
skipped += [target_basename] | |
return skipped | |
shutil.copytree( | |
source, | |
target, | |
ignore=ignore, | |
symlinks=True, | |
copy_function=_copy2_ignoring_special_files, | |
) | |
def get_file_url( | |
link, # type: Link | |
download_dir=None, # type: Optional[str] | |
hashes=None # type: Optional[Hashes] | |
): | |
# type: (...) -> File | |
"""Get file and optionally check its hash. | |
""" | |
# If a download dir is specified, is the file already there and valid? | |
already_downloaded_path = None | |
if download_dir: | |
already_downloaded_path = _check_download_dir( | |
link, download_dir, hashes | |
) | |
if already_downloaded_path: | |
from_path = already_downloaded_path | |
else: | |
from_path = link.file_path | |
# If --require-hashes is off, `hashes` is either empty, the | |
# link's embedded hash, or MissingHashes; it is required to | |
# match. If --require-hashes is on, we are satisfied by any | |
# hash in `hashes` matching: a URL-based or an option-based | |
# one; no internet-sourced hash will be in `hashes`. | |
if hashes: | |
hashes.check_against_path(from_path) | |
return File(from_path, None) | |
def unpack_url( | |
link, # type: Link | |
location, # type: str | |
download, # type: Downloader | |
download_dir=None, # type: Optional[str] | |
hashes=None, # type: Optional[Hashes] | |
): | |
# type: (...) -> Optional[File] | |
"""Unpack link into location, downloading if required. | |
:param hashes: A Hashes object, one of whose embedded hashes must match, | |
or HashMismatch will be raised. If the Hashes is empty, no matches are | |
required, and unhashable types of requirements (like VCS ones, which | |
would ordinarily raise HashUnsupported) are allowed. | |
""" | |
# non-editable vcs urls | |
if link.is_vcs: | |
unpack_vcs_link(link, location) | |
return None | |
# Once out-of-tree-builds are no longer supported, could potentially | |
# replace the below condition with `assert not link.is_existing_dir` | |
# - unpack_url does not need to be called for in-tree-builds. | |
# | |
# As further cleanup, _copy_source_tree and accompanying tests can | |
# be removed. | |
if link.is_existing_dir(): | |
deprecated( | |
"A future pip version will change local packages to be built " | |
"in-place without first copying to a temporary directory. " | |
"We recommend you use --use-feature=in-tree-build to test " | |
"your packages with this new behavior before it becomes the " | |
"default.\n", | |
replacement=None, | |
gone_in="21.3", | |
issue=7555 | |
) | |
if os.path.isdir(location): | |
rmtree(location) | |
_copy_source_tree(link.file_path, location) | |
return None | |
# file urls | |
if link.is_file: | |
file = get_file_url(link, download_dir, hashes=hashes) | |
# http urls | |
else: | |
file = get_http_url( | |
link, | |
download, | |
download_dir, | |
hashes=hashes, | |
) | |
# unpack the archive to the build dir location. even when only downloading | |
# archives, they have to be unpacked to parse dependencies, except wheels | |
if not link.is_wheel: | |
unpack_file(file.path, location, file.content_type) | |
return file | |
def _check_download_dir(link, download_dir, hashes): | |
# type: (Link, str, Optional[Hashes]) -> Optional[str] | |
""" Check download_dir for previously downloaded file with correct hash | |
If a correct file is found return its path else None | |
""" | |
download_path = os.path.join(download_dir, link.filename) | |
if not os.path.exists(download_path): | |
return None | |
# If already downloaded, does its hash match? | |
logger.info('File was already downloaded %s', download_path) | |
if hashes: | |
try: | |
hashes.check_against_path(download_path) | |
except HashMismatch: | |
logger.warning( | |
'Previously-downloaded file %s has bad hash. ' | |
'Re-downloading.', | |
download_path | |
) | |
os.unlink(download_path) | |
return None | |
return download_path | |
class RequirementPreparer: | |
"""Prepares a Requirement | |
""" | |
def __init__( | |
self, | |
build_dir, # type: str | |
download_dir, # type: Optional[str] | |
src_dir, # type: str | |
build_isolation, # type: bool | |
req_tracker, # type: RequirementTracker | |
session, # type: PipSession | |
progress_bar, # type: str | |
finder, # type: PackageFinder | |
require_hashes, # type: bool | |
use_user_site, # type: bool | |
lazy_wheel, # type: bool | |
in_tree_build, # type: bool | |
): | |
# type: (...) -> None | |
super().__init__() | |
self.src_dir = src_dir | |
self.build_dir = build_dir | |
self.req_tracker = req_tracker | |
self._session = session | |
self._download = Downloader(session, progress_bar) | |
self._batch_download = BatchDownloader(session, progress_bar) | |
self.finder = finder | |
# Where still-packed archives should be written to. If None, they are | |
# not saved, and are deleted immediately after unpacking. | |
self.download_dir = download_dir | |
# Is build isolation allowed? | |
self.build_isolation = build_isolation | |
# Should hash-checking be required? | |
self.require_hashes = require_hashes | |
# Should install in user site-packages? | |
self.use_user_site = use_user_site | |
# Should wheels be downloaded lazily? | |
self.use_lazy_wheel = lazy_wheel | |
# Should in-tree builds be used for local paths? | |
self.in_tree_build = in_tree_build | |
# Memoized downloaded files, as mapping of url: (path, mime type) | |
self._downloaded = {} # type: Dict[str, Tuple[str, str]] | |
# Previous "header" printed for a link-based InstallRequirement | |
self._previous_requirement_header = ("", "") | |
def _log_preparing_link(self, req): | |
# type: (InstallRequirement) -> None | |
"""Provide context for the requirement being prepared.""" | |
if req.link.is_file and not req.original_link_is_in_wheel_cache: | |
message = "Processing %s" | |
information = str(display_path(req.link.file_path)) | |
else: | |
message = "Collecting %s" | |
information = str(req.req or req) | |
if (message, information) != self._previous_requirement_header: | |
self._previous_requirement_header = (message, information) | |
logger.info(message, information) | |
if req.original_link_is_in_wheel_cache: | |
with indent_log(): | |
logger.info("Using cached %s", req.link.filename) | |
def _ensure_link_req_src_dir(self, req, parallel_builds): | |
# type: (InstallRequirement, bool) -> None | |
"""Ensure source_dir of a linked InstallRequirement.""" | |
# Since source_dir is only set for editable requirements. | |
if req.link.is_wheel: | |
# We don't need to unpack wheels, so no need for a source | |
# directory. | |
return | |
assert req.source_dir is None | |
if req.link.is_existing_dir() and self.in_tree_build: | |
# build local directories in-tree | |
req.source_dir = req.link.file_path | |
return | |
# We always delete unpacked sdists after pip runs. | |
req.ensure_has_source_dir( | |
self.build_dir, | |
autodelete=True, | |
parallel_builds=parallel_builds, | |
) | |
# If a checkout exists, it's unwise to keep going. version | |
# inconsistencies are logged later, but do not fail the | |
# installation. | |
# FIXME: this won't upgrade when there's an existing | |
# package unpacked in `req.source_dir` | |
if is_installable_dir(req.source_dir): | |
raise PreviousBuildDirError( | |
"pip can't proceed with requirements '{}' due to a" | |
"pre-existing build directory ({}). This is likely " | |
"due to a previous installation that failed . pip is " | |
"being responsible and not assuming it can delete this. " | |
"Please delete it and try again.".format(req, req.source_dir) | |
) | |
def _get_linked_req_hashes(self, req): | |
# type: (InstallRequirement) -> Hashes | |
# By the time this is called, the requirement's link should have | |
# been checked so we can tell what kind of requirements req is | |
# and raise some more informative errors than otherwise. | |
# (For example, we can raise VcsHashUnsupported for a VCS URL | |
# rather than HashMissing.) | |
if not self.require_hashes: | |
return req.hashes(trust_internet=True) | |
# We could check these first 2 conditions inside unpack_url | |
# and save repetition of conditions, but then we would | |
# report less-useful error messages for unhashable | |
# requirements, complaining that there's no hash provided. | |
if req.link.is_vcs: | |
raise VcsHashUnsupported() | |
if req.link.is_existing_dir(): | |
raise DirectoryUrlHashUnsupported() | |
# Unpinned packages are asking for trouble when a new version | |
# is uploaded. This isn't a security check, but it saves users | |
# a surprising hash mismatch in the future. | |
# file:/// URLs aren't pinnable, so don't complain about them | |
# not being pinned. | |
if req.original_link is None and not req.is_pinned: | |
raise HashUnpinned() | |
# If known-good hashes are missing for this requirement, | |
# shim it with a facade object that will provoke hash | |
# computation and then raise a HashMissing exception | |
# showing the user what the hash should be. | |
return req.hashes(trust_internet=False) or MissingHashes() | |
def _fetch_metadata_using_lazy_wheel(self, link): | |
# type: (Link) -> Optional[Distribution] | |
"""Fetch metadata using lazy wheel, if possible.""" | |
if not self.use_lazy_wheel: | |
return None | |
if self.require_hashes: | |
logger.debug('Lazy wheel is not used as hash checking is required') | |
return None | |
if link.is_file or not link.is_wheel: | |
logger.debug( | |
'Lazy wheel is not used as ' | |
'%r does not points to a remote wheel', | |
link, | |
) | |
return None | |
wheel = Wheel(link.filename) | |
name = canonicalize_name(wheel.name) | |
logger.info( | |
'Obtaining dependency information from %s %s', | |
name, wheel.version, | |
) | |
url = link.url.split('#', 1)[0] | |
try: | |
return dist_from_wheel_url(name, url, self._session) | |
except HTTPRangeRequestUnsupported: | |
logger.debug('%s does not support range requests', url) | |
return None | |
def _complete_partial_requirements( | |
self, | |
partially_downloaded_reqs, # type: Iterable[InstallRequirement] | |
parallel_builds=False, # type: bool | |
): | |
# type: (...) -> None | |
"""Download any requirements which were only fetched by metadata.""" | |
# Download to a temporary directory. These will be copied over as | |
# needed for downstream 'download', 'wheel', and 'install' commands. | |
temp_dir = TempDirectory(kind="unpack", globally_managed=True).path | |
# Map each link to the requirement that owns it. This allows us to set | |
# `req.local_file_path` on the appropriate requirement after passing | |
# all the links at once into BatchDownloader. | |
links_to_fully_download = {} # type: Dict[Link, InstallRequirement] | |
for req in partially_downloaded_reqs: | |
assert req.link | |
links_to_fully_download[req.link] = req | |
batch_download = self._batch_download( | |
links_to_fully_download.keys(), | |
temp_dir, | |
) | |
for link, (filepath, _) in batch_download: | |
logger.debug("Downloading link %s to %s", link, filepath) | |
req = links_to_fully_download[link] | |
req.local_file_path = filepath | |
# This step is necessary to ensure all lazy wheels are processed | |
# successfully by the 'download', 'wheel', and 'install' commands. | |
for req in partially_downloaded_reqs: | |
self._prepare_linked_requirement(req, parallel_builds) | |
def prepare_linked_requirement(self, req, parallel_builds=False): | |
# type: (InstallRequirement, bool) -> Distribution | |
"""Prepare a requirement to be obtained from req.link.""" | |
assert req.link | |
link = req.link | |
self._log_preparing_link(req) | |
with indent_log(): | |
# Check if the relevant file is already available | |
# in the download directory | |
file_path = None | |
if self.download_dir is not None and link.is_wheel: | |
hashes = self._get_linked_req_hashes(req) | |
file_path = _check_download_dir(req.link, self.download_dir, hashes) | |
if file_path is not None: | |
# The file is already available, so mark it as downloaded | |
self._downloaded[req.link.url] = file_path, None | |
else: | |
# The file is not available, attempt to fetch only metadata | |
wheel_dist = self._fetch_metadata_using_lazy_wheel(link) | |
if wheel_dist is not None: | |
req.needs_more_preparation = True | |
return wheel_dist | |
# None of the optimizations worked, fully prepare the requirement | |
return self._prepare_linked_requirement(req, parallel_builds) | |
def prepare_linked_requirements_more(self, reqs, parallel_builds=False): | |
# type: (Iterable[InstallRequirement], bool) -> None | |
"""Prepare linked requirements more, if needed.""" | |
reqs = [req for req in reqs if req.needs_more_preparation] | |
for req in reqs: | |
# Determine if any of these requirements were already downloaded. | |
if self.download_dir is not None and req.link.is_wheel: | |
hashes = self._get_linked_req_hashes(req) | |
file_path = _check_download_dir(req.link, self.download_dir, hashes) | |
if file_path is not None: | |
self._downloaded[req.link.url] = file_path, None | |
req.needs_more_preparation = False | |
# Prepare requirements we found were already downloaded for some | |
# reason. The other downloads will be completed separately. | |
partially_downloaded_reqs = [] # type: List[InstallRequirement] | |
for req in reqs: | |
if req.needs_more_preparation: | |
partially_downloaded_reqs.append(req) | |
else: | |
self._prepare_linked_requirement(req, parallel_builds) | |
# TODO: separate this part out from RequirementPreparer when the v1 | |
# resolver can be removed! | |
self._complete_partial_requirements( | |
partially_downloaded_reqs, parallel_builds=parallel_builds, | |
) | |
def _prepare_linked_requirement(self, req, parallel_builds): | |
# type: (InstallRequirement, bool) -> Distribution | |
assert req.link | |
link = req.link | |
self._ensure_link_req_src_dir(req, parallel_builds) | |
hashes = self._get_linked_req_hashes(req) | |
if link.is_existing_dir() and self.in_tree_build: | |
local_file = None | |
elif link.url not in self._downloaded: | |
try: | |
local_file = unpack_url( | |
link, req.source_dir, self._download, | |
self.download_dir, hashes | |
) | |
except NetworkConnectionError as exc: | |
raise InstallationError( | |
'Could not install requirement {} because of HTTP ' | |
'error {} for URL {}'.format(req, exc, link) | |
) | |
else: | |
file_path, content_type = self._downloaded[link.url] | |
if hashes: | |
hashes.check_against_path(file_path) | |
local_file = File(file_path, content_type) | |
# For use in later processing, | |
# preserve the file path on the requirement. | |
if local_file: | |
req.local_file_path = local_file.path | |
dist = _get_prepared_distribution( | |
req, self.req_tracker, self.finder, self.build_isolation, | |
) | |
return dist | |
def save_linked_requirement(self, req): | |
# type: (InstallRequirement) -> None | |
assert self.download_dir is not None | |
assert req.link is not None | |
link = req.link | |
if link.is_vcs or (link.is_existing_dir() and req.editable): | |
# Make a .zip of the source_dir we already created. | |
req.archive(self.download_dir) | |
return | |
if link.is_existing_dir(): | |
logger.debug( | |
'Not copying link to destination directory ' | |
'since it is a directory: %s', link, | |
) | |
return | |
if req.local_file_path is None: | |
# No distribution was downloaded for this requirement. | |
return | |
download_location = os.path.join(self.download_dir, link.filename) | |
if not os.path.exists(download_location): | |
shutil.copy(req.local_file_path, download_location) | |
download_path = display_path(download_location) | |
logger.info('Saved %s', download_path) | |
def prepare_editable_requirement( | |
self, | |
req, # type: InstallRequirement | |
): | |
# type: (...) -> Distribution | |
"""Prepare an editable requirement | |
""" | |
assert req.editable, "cannot prepare a non-editable req as editable" | |
logger.info('Obtaining %s', req) | |
with indent_log(): | |
if self.require_hashes: | |
raise InstallationError( | |
'The editable requirement {} cannot be installed when ' | |
'requiring hashes, because there is no single file to ' | |
'hash.'.format(req) | |
) | |
req.ensure_has_source_dir(self.src_dir) | |
req.update_editable() | |
dist = _get_prepared_distribution( | |
req, self.req_tracker, self.finder, self.build_isolation, | |
) | |
req.check_if_exists(self.use_user_site) | |
return dist | |
def prepare_installed_requirement( | |
self, | |
req, # type: InstallRequirement | |
skip_reason # type: str | |
): | |
# type: (...) -> Distribution | |
"""Prepare an already-installed requirement | |
""" | |
assert req.satisfied_by, "req should have been satisfied but isn't" | |
assert skip_reason is not None, ( | |
"did not get skip reason skipped but req.satisfied_by " | |
"is set to {}".format(req.satisfied_by) | |
) | |
logger.info( | |
'Requirement %s: %s (%s)', | |
skip_reason, req, req.satisfied_by.version | |
) | |
with indent_log(): | |
if self.require_hashes: | |
logger.debug( | |
'Since it is already installed, we are trusting this ' | |
'package without checking its hash. To ensure a ' | |
'completely repeatable environment, install into an ' | |
'empty virtualenv.' | |
) | |
return InstalledDistribution(req).get_pkg_resources_distribution() | |