更改enroll命名，添加了注释，向get_error_msg中添加了一些错误代码

2022-05-05 22:59:35 +08:00
parent 51b5e374a3
commit ece69eaf57
4637 changed files with 7699 additions and 608140 deletions
@@ -12,19 +12,15 @@ import re
 import urllib.parse
 import urllib.request
 import xml.etree.ElementTree
-from html.parser import HTMLParser
 from optparse import Values
 from typing import (
-    TYPE_CHECKING,
    Callable,
-    Dict,
    Iterable,
    List,
    MutableMapping,
    NamedTuple,
    Optional,
    Sequence,
-    Tuple,
    Union,
 )

@@ -43,11 +39,6 @@ from pip._internal.vcs import vcs

 from .sources import CandidatesFromPage, LinkSource, build_source

-if TYPE_CHECKING:
-    from typing import Protocol
-else:
-    Protocol = object
-
 logger = logging.getLogger(__name__)

 HTMLElement = xml.etree.ElementTree.Element
@@ -172,8 +163,6 @@ def _determine_base_url(document: HTMLElement, page_url: str) -> str:
    :param document: An HTML document representation. The current
        implementation expects the result of ``html5lib.parse()``.
    :param page_url: The URL of the HTML document.
-
-    TODO: Remove when `html5lib` is dropped.
    """
    for base in document.findall(".//base"):
        href = base.get("href")
@@ -245,20 +234,20 @@ def _clean_link(url: str) -> str:


 def _create_link_from_element(
-    element_attribs: Dict[str, Optional[str]],
+    anchor: HTMLElement,
    page_url: str,
    base_url: str,
 ) -> Optional[Link]:
    """
-    Convert an anchor element's attributes in a simple repository page to a Link.
+    Convert an anchor element in a simple repository page to a Link.
    """
-    href = element_attribs.get("href")
+    href = anchor.get("href")
    if not href:
        return None

    url = _clean_link(urllib.parse.urljoin(base_url, href))
-    pyrequire = element_attribs.get("data-requires-python")
-    yanked_reason = element_attribs.get("data-yanked")
+    pyrequire = anchor.get("data-requires-python")
+    yanked_reason = anchor.get("data-yanked")

    link = Link(
        url,
@@ -282,14 +271,9 @@ class CacheablePageContent:
        return hash(self.page.url)


-class ParseLinks(Protocol):
-    def __call__(
-        self, page: "HTMLPage", use_deprecated_html5lib: bool
-    ) -> Iterable[Link]:
-        ...
-
-
-def with_cached_html_pages(fn: ParseLinks) -> ParseLinks:
+def with_cached_html_pages(
+    fn: Callable[["HTMLPage"], Iterable[Link]],
+) -> Callable[["HTMLPage"], List[Link]]:
    """
    Given a function that parses an Iterable[Link] from an HTMLPage, cache the
    function's result (keyed by CacheablePageContent), unless the HTMLPage
@@ -297,25 +281,22 @@ def with_cached_html_pages(fn: ParseLinks) -> ParseLinks:
    """

    @functools.lru_cache(maxsize=None)
-    def wrapper(
-        cacheable_page: CacheablePageContent, use_deprecated_html5lib: bool
-    ) -> List[Link]:
-        return list(fn(cacheable_page.page, use_deprecated_html5lib))
+    def wrapper(cacheable_page: CacheablePageContent) -> List[Link]:
+        return list(fn(cacheable_page.page))

    @functools.wraps(fn)
-    def wrapper_wrapper(page: "HTMLPage", use_deprecated_html5lib: bool) -> List[Link]:
+    def wrapper_wrapper(page: "HTMLPage") -> List[Link]:
        if page.cache_link_parsing:
-            return wrapper(CacheablePageContent(page), use_deprecated_html5lib)
-        return list(fn(page, use_deprecated_html5lib))
+            return wrapper(CacheablePageContent(page))
+        return list(fn(page))

    return wrapper_wrapper


-def _parse_links_html5lib(page: "HTMLPage") -> Iterable[Link]:
+@with_cached_html_pages
+def parse_links(page: "HTMLPage") -> Iterable[Link]:
    """
    Parse an HTML document, and yield its anchor elements as Link objects.
-
-    TODO: Remove when `html5lib` is dropped.
    """
    document = html5lib.parse(
        page.content,
@@ -326,33 +307,6 @@ def _parse_links_html5lib(page: "HTMLPage") -> Iterable[Link]:
    url = page.url
    base_url = _determine_base_url(document, url)
    for anchor in document.findall(".//a"):
-        link = _create_link_from_element(
-            anchor.attrib,
-            page_url=url,
-            base_url=base_url,
-        )
-        if link is None:
-            continue
-        yield link
-
-
-@with_cached_html_pages
-def parse_links(page: "HTMLPage", use_deprecated_html5lib: bool) -> Iterable[Link]:
-    """
-    Parse an HTML document, and yield its anchor elements as Link objects.
-    """
-
-    if use_deprecated_html5lib:
-        yield from _parse_links_html5lib(page)
-        return
-
-    parser = HTMLLinkParser(page.url)
-    encoding = page.encoding or "utf-8"
-    parser.feed(page.content.decode(encoding))
-
-    url = page.url
-    base_url = parser.base_url or url
-    for anchor in parser.anchors:
        link = _create_link_from_element(
            anchor,
            page_url=url,
@@ -389,34 +343,6 @@ class HTMLPage:
        return redact_auth_from_url(self.url)


-class HTMLLinkParser(HTMLParser):
-    """
-    HTMLParser that keeps the first base HREF and a list of all anchor
-    elements' attributes.
-    """
-
-    def __init__(self, url: str) -> None:
-        super().__init__(convert_charrefs=True)
-
-        self.url: str = url
-        self.base_url: Optional[str] = None
-        self.anchors: List[Dict[str, Optional[str]]] = []
-
-    def handle_starttag(self, tag: str, attrs: List[Tuple[str, Optional[str]]]) -> None:
-        if tag == "base" and self.base_url is None:
-            href = self.get_href(attrs)
-            if href is not None:
-                self.base_url = href
-        elif tag == "a":
-            self.anchors.append(dict(attrs))
-
-    def get_href(self, attrs: List[Tuple[str, Optional[str]]]) -> Optional[str]:
-        for name, value in attrs:
-            if name == "href":
-                return value
-        return None
-
-
 def _handle_get_page_fail(
    link: Link,
    reason: Union[str, Exception],
@@ -37,6 +37,7 @@ from pip._internal.utils.logging import indent_log
 from pip._internal.utils.misc import build_netloc
 from pip._internal.utils.packaging import check_requires_python
 from pip._internal.utils.unpacking import SUPPORTED_EXTENSIONS
+from pip._internal.utils.urls import url_to_path

 __all__ = ["FormatControl", "BestCandidateResult", "PackageFinder"]

@@ -580,7 +581,6 @@ class PackageFinder:
        link_collector: LinkCollector,
        target_python: TargetPython,
        allow_yanked: bool,
-        use_deprecated_html5lib: bool,
        format_control: Optional[FormatControl] = None,
        candidate_prefs: Optional[CandidatePreferences] = None,
        ignore_requires_python: Optional[bool] = None,
@@ -605,7 +605,6 @@ class PackageFinder:
        self._ignore_requires_python = ignore_requires_python
        self._link_collector = link_collector
        self._target_python = target_python
-        self._use_deprecated_html5lib = use_deprecated_html5lib

        self.format_control = format_control

@@ -622,8 +621,6 @@ class PackageFinder:
        link_collector: LinkCollector,
        selection_prefs: SelectionPreferences,
        target_python: Optional[TargetPython] = None,
-        *,
-        use_deprecated_html5lib: bool,
    ) -> "PackageFinder":
        """Create a PackageFinder.

@@ -648,7 +645,6 @@ class PackageFinder:
            allow_yanked=selection_prefs.allow_yanked,
            format_control=selection_prefs.format_control,
            ignore_requires_python=selection_prefs.ignore_requires_python,
-            use_deprecated_html5lib=use_deprecated_html5lib,
        )

    @property
@@ -770,7 +766,7 @@ class PackageFinder:
        if html_page is None:
            return []

-        page_links = list(parse_links(html_page, self._use_deprecated_html5lib))
+        page_links = list(parse_links(html_page))

        with indent_log():
            package_links = self.evaluate_links(
@@ -820,14 +816,7 @@ class PackageFinder:
        )

        if logger.isEnabledFor(logging.DEBUG) and file_candidates:
-            paths = []
-            for candidate in file_candidates:
-                assert candidate.link.url  # we need to have a URL
-                try:
-                    paths.append(candidate.link.file_path)
-                except Exception:
-                    paths.append(candidate.link.url)  # it's not a local file
-
+            paths = [url_to_path(c.link.url) for c in file_candidates]
            logger.debug("Local files found: %s", ", ".join(paths))

        # This is an intentional priority ordering
@@ -892,7 +881,7 @@ class PackageFinder:

        installed_version: Optional[_BaseVersion] = None
        if req.satisfied_by is not None:
-            installed_version = req.satisfied_by.version
+            installed_version = parse_version(req.satisfied_by.version)

        def _format_versions(cand_iter: Iterable[InstallationCandidate]) -> str:
            # This repeated parse_version and str() conversion is needed to