Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Isolate, reuse PackageFinder best candidate logic #5971

Merged
merged 5 commits into from
Apr 16, 2019
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions news/5175.bugfix
Original file line number Diff line number Diff line change
@@ -0,0 +1 @@
Make pip's self version check avoid recommending upgrades to prereleases if the currently-installed version is stable.
138 changes: 97 additions & 41 deletions src/pip/_internal/index.py
Original file line number Diff line number Diff line change
Expand Up @@ -55,7 +55,8 @@
BuildTag = Tuple[Any, ...] # either empty tuple or Tuple[int, str]
CandidateSortingKey = Tuple[int, _BaseVersion, BuildTag, Optional[int]]

__all__ = ['FormatControl', 'PackageFinder']

__all__ = ['FormatControl', 'FoundCandidates', 'PackageFinder']


SECURE_ORIGINS = [
Expand Down Expand Up @@ -254,6 +255,67 @@ def _get_html_page(link, session=None):
return None


class FoundCandidates(object):
"""A collection of candidates, returned by `PackageFinder.find_candidates`.

Arguments:

* `candidates`: A sequence of all available candidates found.
* `specifier`: Specifier to filter applicable versions.
* `prereleases`: Whether prereleases should be accounted for. Pass None
to infer from the specifier.
* `sort_key`: A callable used as the key function when choosing the best
candidate.
"""
def __init__(
self,
candidates, # type: List[InstallationCandidate]
specifier, # type: specifiers.BaseSpecifier
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

Again, I think specifier should be optional (defaulting to the empty SpecifierSet).

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

I made the specifier argument optional in finder.find_candidates(), but kept it required in FoundCandidates constructor.

prereleases, # type: Optional[bool]
sort_key, # type: Callable[[InstallationCandidate], Any]
):
# type: (...) -> None
self._candidates = candidates
self._specifier = specifier
self._prereleases = prereleases
self._sort_key = sort_key

def iter_all(self):
    # type: () -> Iterable[InstallationCandidate]
    """Return a fresh iterator over every candidate that was found.

    No specifier or prerelease filtering is applied here.
    """
    every_candidate = self._candidates
    return iter(every_candidate)

def iter_applicable(self):
    # type: () -> Iterable[InstallationCandidate]
    """Lazily yield the candidates whose version the specifier accepts.

    The stored specifier's ``filter`` is applied to the candidates'
    version strings, using the stored prerelease setting. Matching
    candidates are yielded in their original order.
    """
    found = self._candidates
    # Versions are exchanged as str because, when pip is debundled but
    # setuptools isn't, Python sees packaging.version.Version and
    # pkg_resources._vendor.packaging.version.Version as different
    # types. If we stop using the pkg_resources provided specifier and
    # start using our own, the str() casts can be dropped.
    version_strings = [str(cand.version) for cand in found]
    accepted = set(self._specifier.filter(
        version_strings,
        prereleases=self._prereleases,
    ))
    # Compare as str here as well, for the same debundling reason.
    return (cand for cand in found if str(cand.version) in accepted)

def get_best(self):
    # type: () -> Optional[InstallationCandidate]
    """Pick the highest-ranked applicable candidate.

    Ranking uses the stored sort key as the ``key`` function for
    ``max``. Returns None when no candidate is applicable.
    """
    applicable = list(self.iter_applicable())
    if applicable:
        return max(applicable, key=self._sort_key)
    return None


class PackageFinder(object):
"""This finds packages.

Expand Down Expand Up @@ -628,6 +690,25 @@ def find_all_candidates(self, project_name):
# This is an intentional priority ordering
return file_versions + find_links_versions + page_versions

def find_candidates(
    self,
    project_name,  # type: str
    specifier=None,  # type: Optional[specifiers.BaseSpecifier]
):
    # type: (...) -> FoundCandidates
    """Find matches for the given project and specifier.

    Arguments:

    * `project_name`: Name of the project to look up candidates for.
    * `specifier`: Optional version specifier. If given, it should
        implement `filter` to allow version filtering (e.g.
        ``packaging.specifiers.SpecifierSet``). When omitted or None, a
        new empty ``SpecifierSet`` is used.

    Returns a `FoundCandidates` instance.
    """
    if specifier is None:
        # Build the default per call: a default created in the signature
        # would be one instance shared by every call of this method.
        specifier = specifiers.SpecifierSet()
    return FoundCandidates(
        self.find_all_candidates(project_name),
        specifier=specifier,
        # A falsy allow_all_prereleases is passed on as None rather
        # than False.
        prereleases=(self.allow_all_prereleases or None),
        sort_key=self._candidate_sort_key,
    )

def find_requirement(self, req, upgrade):
# type: (InstallRequirement, bool) -> Optional[Link]
"""Try to find a Link matching req
Expand All @@ -636,52 +717,28 @@ def find_requirement(self, req, upgrade):
Returns a Link if found,
Raises DistributionNotFound or BestVersionAlreadyInstalled otherwise
"""
all_candidates = self.find_all_candidates(req.name)

# Filter out anything which doesn't match our specifier
compatible_versions = set(
req.specifier.filter(
# We turn the version object into a str here because otherwise
# when we're debundled but setuptools isn't, Python will see
# packaging.version.Version and
# pkg_resources._vendor.packaging.version.Version as different
# types. This way we'll use a str as a common data interchange
# format. If we stop using the pkg_resources provided specifier
# and start using our own, we can drop the cast to str().
[str(c.version) for c in all_candidates],
prereleases=(
self.allow_all_prereleases
if self.allow_all_prereleases else None
),
)
)
applicable_candidates = [
# Again, converting to str to deal with debundling.
c for c in all_candidates if str(c.version) in compatible_versions
]

if applicable_candidates:
best_candidate = max(applicable_candidates,
key=self._candidate_sort_key)
else:
best_candidate = None
candidates = self.find_candidates(req.name, req.specifier)
best_candidate = candidates.get_best()

installed_version = None # type: Optional[_BaseVersion]
if req.satisfied_by is not None:
installed_version = parse_version(req.satisfied_by.version)
else:
installed_version = None

def _format_versions(cand_iter):
# This repeated parse_version and str() conversion is needed to
# handle different vendoring sources from pip and pkg_resources.
# If we stop using the pkg_resources provided specifier and start
# using our own, we can drop the cast to str().
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

PS - also, here's a code comment that got chopped off that can be fixed in a subsequent commit.

return ", ".join(sorted(
{str(c.version) for c in cand_iter},
key=parse_version,
)) or "none"

if installed_version is None and best_candidate is None:
logger.critical(
'Could not find a version that satisfies the requirement %s '
'(from versions: %s)',
req,
', '.join(
sorted(
{str(c.version) for c in all_candidates},
key=parse_version,
)
)
_format_versions(candidates.iter_all()),
)

raise DistributionNotFound(
Expand Down Expand Up @@ -716,15 +773,14 @@ def find_requirement(self, req, upgrade):
'Installed version (%s) is most up-to-date (past versions: '
'%s)',
installed_version,
', '.join(sorted(compatible_versions, key=parse_version)) or
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

It looks like parse_version got dropped in the new code.

Copy link
Member Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is merged into the above variable. I have made this into a function instead, with additional comments to make the usage clearer (hopefully).

"none",
_format_versions(candidates.iter_applicable()),
)
raise BestVersionAlreadyInstalled

logger.debug(
'Using version %s (newest of versions: %s)',
best_candidate.version,
', '.join(sorted(compatible_versions, key=parse_version))
_format_versions(candidates.iter_applicable()),
)
return best_candidate.location

Expand Down
8 changes: 3 additions & 5 deletions src/pip/_internal/utils/outdated.py
Original file line number Diff line number Diff line change
Expand Up @@ -129,12 +129,10 @@ def pip_version_check(session, options):
trusted_hosts=options.trusted_hosts,
session=session,
)
all_candidates = finder.find_all_candidates("pip")
if not all_candidates:
candidate = finder.find_candidates("pip").get_best()
if candidate is None:
return
pypi_version = str(
max(all_candidates, key=lambda c: c.version).version
)
pypi_version = str(candidate.version)

# save that we've performed a check
state.save(pypi_version, current_time)
Expand Down
12 changes: 10 additions & 2 deletions tests/unit/test_unit_outdated.py
Original file line number Diff line number Diff line change
Expand Up @@ -12,6 +12,14 @@
from pip._internal.utils import outdated


class MockFoundCandidates(object):
    """Test double that hands back one pre-selected best candidate."""

    def __init__(self, best):
        """Remember the candidate that `get_best` should hand back."""
        self._best = best

    def get_best(self):
        """Return the candidate supplied at construction."""
        best_candidate = self._best
        return best_candidate


class MockPackageFinder(object):

BASE_URL = 'https://pypi.org/simple/pip-{0}.tar.gz'
Expand All @@ -28,8 +36,8 @@ class MockPackageFinder(object):
def __init__(self, *args, **kwargs):
pass

def find_all_candidates(self, project_name):
return self.INSTALLATION_CANDIDATES
def find_candidates(self, project_name):
return MockFoundCandidates(self.INSTALLATION_CANDIDATES[0])


class MockDistribution(object):
Expand Down