pip/src/pip/_internal/models/link.py

import posixpath
import re

from pip._vendor.six.moves.urllib import parse as urllib_parse

from pip._internal.utils.misc import (
    WHEEL_EXTENSION, path_to_url, redact_password_from_url,
    split_auth_from_netloc, splitext,
)
from pip._internal.utils.models import KeyBasedCompareMixin
from pip._internal.utils.typing import MYPY_CHECK_RUNNING

if MYPY_CHECK_RUNNING:
    from typing import Optional, Tuple, Union
    from pip._internal.index import HTMLPage


class Link(KeyBasedCompareMixin):
    """Represents a parsed link from a Package Index's simple URL

    The URL is split once in ``__init__``; the properties below are
    read-only views over either that split result or the raw URL string.
    """

    def __init__(self, url, comes_from=None, requires_python=None):
        # type: (str, Optional[Union[str, HTMLPage]], Optional[str]) -> None
        """
        url:
            url of the resource pointed to (href of the link)
        comes_from:
            instance of HTMLPage where the link was found, or string.
        requires_python:
            String containing the `Requires-Python` metadata field, specified
            in PEP 345. This may be specified by a data-requires-python
            attribute in the HTML link tag, as described in PEP 503.
            Any falsy value (e.g. an empty string) is stored as None.
        """

        # url can be a UNC windows share
        if url.startswith('\\\\'):
            url = path_to_url(url)

        self._parsed_url = urllib_parse.urlsplit(url)
        # Store the url as a private attribute to prevent accidentally
        # trying to set a new value.
        self._url = url

        self.comes_from = comes_from
        self.requires_python = requires_python or None

        # The (possibly UNC-converted) url is the key handed to the mixin.
        # NOTE(review): presumably this drives equality/ordering/hashing --
        # confirm against KeyBasedCompareMixin.
        super(Link, self).__init__(key=url, defining_class=Link)

    def __str__(self):
        # type: () -> str
        """Return the password-redacted url, plus origin and
        requires-python details when ``comes_from`` is set.
        """
        redacted_url = redact_password_from_url(self._url)
        if not self.comes_from:
            # The requires-python suffix is only shown together with the
            # origin, never on its own.
            return redacted_url

        if self.requires_python:
            rp = ' (requires-python:%s)' % self.requires_python
        else:
            rp = ''
        return '%s (from %s)%s' % (redacted_url, self.comes_from, rp)

    def __repr__(self):
        # type: () -> str
        return '<Link %s>' % self

    @property
    def url(self):
        # type: () -> str
        """The url this link was built from (read-only)."""
        return self._url

    @property
    def filename(self):
        # type: () -> str
        """
        The last segment of the percent-decoded url path, ignoring trailing
        slashes. When the path has no such segment, the netloc with any
        auth information stripped is returned instead.
        """
        # self.path is already percent-decoded. Decoding the basename a
        # second time would corrupt names containing an escaped '%'
        # ('%2520' -> ' ') and could turn '%252F' into a '/' inside the
        # returned "filename", so the segment is used as-is. This also keeps
        # filename in agreement with splitext()/ext, which decode once.
        name = posixpath.basename(self.path.rstrip('/'))
        if name:
            return name

        # Make sure we don't leak auth information if the netloc
        # includes a username and password.
        netloc, _ = split_auth_from_netloc(self.netloc)
        return netloc

    @property
    def scheme(self):
        # type: () -> str
        """The scheme component of the parsed url."""
        return self._parsed_url.scheme

    @property
    def netloc(self):
        # type: () -> str
        """
        This can contain auth information.
        """
        return self._parsed_url.netloc

    @property
    def path(self):
        # type: () -> str
        """The path component of the parsed url, percent-decoded."""
        return urllib_parse.unquote(self._parsed_url.path)

    def splitext(self):
        # type: () -> Tuple[str, str]
        """Apply the ``splitext`` helper to the last segment of the decoded
        path (trailing slashes ignored) and return its two-item result.
        """
        return splitext(posixpath.basename(self.path.rstrip('/')))

    @property
    def ext(self):
        # type: () -> str
        """The second item of ``splitext()``, i.e. the extension part."""
        return self.splitext()[1]

    @property
    def url_without_fragment(self):
        # type: () -> str
        """The url rebuilt from its parsed components, minus the fragment."""
        scheme, netloc, path, query, _ = self._parsed_url
        return urllib_parse.urlunsplit((scheme, netloc, path, query, None))

    _egg_fragment_re = re.compile(r'[#&]egg=([^&]*)')

    @property
    def egg_fragment(self):
        # type: () -> Optional[str]
        """The value of the first ``egg=`` item introduced by '#' or '&' in
        the raw url, or None when there is none.
        """
        match = self._egg_fragment_re.search(self._url)
        return match.group(1) if match else None

    _subdirectory_fragment_re = re.compile(r'[#&]subdirectory=([^&]*)')

    @property
    def subdirectory_fragment(self):
        # type: () -> Optional[str]
        """The value of the first ``subdirectory=`` item introduced by '#'
        or '&' in the raw url, or None when there is none.
        """
        match = self._subdirectory_fragment_re.search(self._url)
        return match.group(1) if match else None

    # NOTE(review): unlike the two patterns above, this one is not anchored
    # to '#' or '&', so it matches the first "<algorithm>=<lowercase hex>"
    # pair found anywhere in the raw url.
    _hash_re = re.compile(
        r'(sha1|sha224|sha384|sha256|sha512|md5)=([a-f0-9]+)'
    )

    @property
    def hash(self):
        # type: () -> Optional[str]
        """The hex digest of the first hash found in the raw url, or None."""
        match = self._hash_re.search(self._url)
        return match.group(2) if match else None

    @property
    def hash_name(self):
        # type: () -> Optional[str]
        """The algorithm name of the first hash found in the raw url, or
        None.
        """
        match = self._hash_re.search(self._url)
        return match.group(1) if match else None

    @property
    def show_url(self):
        # type: () -> str
        """The last path segment of the raw url with the fragment and query
        string cut off. Unlike ``filename``, this is not percent-decoded.
        """
        without_fragment = self._url.split('#', 1)[0]
        without_query = without_fragment.split('?', 1)[0]
        return posixpath.basename(without_query)

    @property
    def is_wheel(self):
        # type: () -> bool
        """True when the link's extension equals WHEEL_EXTENSION."""
        return self.ext == WHEEL_EXTENSION

    @property
    def is_artifact(self):
        # type: () -> bool
        """
        Determines if this points to an actual artifact (e.g. a tarball) or if
        it points to an "abstract" thing like a path or a VCS location.
        """
        # Imported at call time rather than at module level.
        # NOTE(review): presumably to avoid an import cycle -- confirm.
        from pip._internal.vcs import vcs

        return self.scheme not in vcs.all_schemes
Move Link to models 2018-06-18 12:59:56 +02:00			`import posixpath`
			`import re`

			`from pip._vendor.six.moves.urllib import parse as urllib_parse`

Move wheel extension information to remove cycle imports 2018-11-30 08:14:07 +01:00			`from pip._internal.utils.misc import (`
Fix an edge case where Link.filename can leak auth information. 2019-06-23 01:34:51 +02:00			`WHEEL_EXTENSION, path_to_url, redact_password_from_url,`
			`split_auth_from_netloc, splitext,`
Move wheel extension information to remove cycle imports 2018-11-30 08:14:07 +01:00			`)`
Add a utility for comparision logic and switch to it It uses the operator module, instead of inline-lambdas 2018-06-18 13:10:05 +02:00			`from pip._internal.utils.models import KeyBasedCompareMixin`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`from pip._internal.utils.typing import MYPY_CHECK_RUNNING`

			`if MYPY_CHECK_RUNNING:`
remove unused imports 2019-02-22 12:18:46 +01:00			`from typing import Optional, Tuple, Union`
remove #noqa: F401 2019-02-22 12:17:07 +01:00			`from pip._internal.index import HTMLPage`
Move Link to models 2018-06-18 12:59:56 +02:00

Add a utility for comparision logic and switch to it It uses the operator module, instead of inline-lambdas 2018-06-18 13:10:05 +02:00			`class Link(KeyBasedCompareMixin):`
Move Link to models 2018-06-18 12:59:56 +02:00			`"""Represents a parsed link from a Package Index's simple URL`
			`"""`

			`def __init__(self, url, comes_from=None, requires_python=None):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: (str, Optional[Union[str, HTMLPage]], Optional[str]) -> None`
Move Link to models 2018-06-18 12:59:56 +02:00			`"""`
			`url:`
			`url of the resource pointed to (href of the link)`
			`comes_from:`
			`instance of HTMLPage where the link was found, or string.`
			`requires_python:`
			String containing the `Requires-Python` metadata field, specified
			`in PEP 345. This may be specified by a data-requires-python`
			`attribute in the HTML link tag, as described in PEP 503.`
			`"""`

			`# url can be a UNC windows share`
			`if url.startswith('\\\\'):`
			`url = path_to_url(url)`

Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`self._parsed_url = urllib_parse.urlsplit(url)`
			`# Store the url as a private attribute to prevent accidentally`
			`# trying to set a new value.`
			`self._url = url`

Move Link to models 2018-06-18 12:59:56 +02:00			`self.comes_from = comes_from`
			`self.requires_python = requires_python if requires_python else None`

Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`super(Link, self).__init__(key=url, defining_class=Link)`
Add a utility for comparision logic and switch to it It uses the operator module, instead of inline-lambdas 2018-06-18 13:10:05 +02:00
Move Link to models 2018-06-18 12:59:56 +02:00			`def __str__(self):`
			`if self.requires_python:`
			`rp = ' (requires-python:%s)' % self.requires_python`
			`else:`
			`rp = ''`
			`if self.comes_from:`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`return '%s (from %s)%s' % (redact_password_from_url(self._url),`
Redact basic authentication passwords from log messages (#5773) Redact basic authentication passwords from URLs. 2018-10-19 11:06:10 +02:00			`self.comes_from, rp)`
Move Link to models 2018-06-18 12:59:56 +02:00			`else:`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`return redact_password_from_url(str(self._url))`
Move Link to models 2018-06-18 12:59:56 +02:00
			`def __repr__(self):`
			`return '<Link %s>' % self`

Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`@property`
			`def url(self):`
			`# type: () -> str`
			`return self._url`

Move Link to models 2018-06-18 12:59:56 +02:00			`@property`
			`def filename(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> str`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`path = self.path.rstrip('/')`
Fix an edge case where Link.filename can leak auth information. 2019-06-23 01:34:51 +02:00			`name = posixpath.basename(path)`
			`if not name:`
			`# Make sure we don't leak auth information if the netloc`
			`# includes a username and password.`
			`netloc, user_pass = split_auth_from_netloc(self.netloc)`
			`return netloc`

Move Link to models 2018-06-18 12:59:56 +02:00			`name = urllib_parse.unquote(name)`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`assert name, ('URL %r produced no filename' % self._url)`
Move Link to models 2018-06-18 12:59:56 +02:00			`return name`

			`@property`
			`def scheme(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> str`
models.link: use named attribute 2019-06-24 11:26:14 +02:00			`return self._parsed_url.scheme`
Move Link to models 2018-06-18 12:59:56 +02:00
			`@property`
			`def netloc(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> str`
Fix an edge case where Link.filename can leak auth information. 2019-06-23 01:34:51 +02:00			`"""`
			`This can contain auth information.`
			`"""`
models.link: use named attribute 2019-06-24 11:26:14 +02:00			`return self._parsed_url.netloc`
Move Link to models 2018-06-18 12:59:56 +02:00
			`@property`
			`def path(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> str`
models.link: use named attribute 2019-06-24 11:26:14 +02:00			`return urllib_parse.unquote(self._parsed_url.path)`
Move Link to models 2018-06-18 12:59:56 +02:00
			`def splitext(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> Tuple[str, str]`
Move Link to models 2018-06-18 12:59:56 +02:00			`return splitext(posixpath.basename(self.path.rstrip('/')))`

			`@property`
			`def ext(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> str`
Move Link to models 2018-06-18 12:59:56 +02:00			`return self.splitext()[1]`

			`@property`
			`def url_without_fragment(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> str`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`scheme, netloc, path, query, fragment = self._parsed_url`
Move Link to models 2018-06-18 12:59:56 +02:00			`return urllib_parse.urlunsplit((scheme, netloc, path, query, None))`

			`_egg_fragment_re = re.compile(r'[#&]egg=([^&]*)')`

			`@property`
			`def egg_fragment(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> Optional[str]`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`match = self._egg_fragment_re.search(self._url)`
Move Link to models 2018-06-18 12:59:56 +02:00			`if not match:`
			`return None`
			`return match.group(1)`

			`_subdirectory_fragment_re = re.compile(r'[#&]subdirectory=([^&]*)')`

			`@property`
			`def subdirectory_fragment(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> Optional[str]`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`match = self._subdirectory_fragment_re.search(self._url)`
Move Link to models 2018-06-18 12:59:56 +02:00			`if not match:`
			`return None`
			`return match.group(1)`

			`_hash_re = re.compile(`
			`r'(sha1\|sha224\|sha384\|sha256\|sha512\|md5)=([a-f0-9]+)'`
			`)`

			`@property`
			`def hash(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> Optional[str]`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`match = self._hash_re.search(self._url)`
Move Link to models 2018-06-18 12:59:56 +02:00			`if match:`
			`return match.group(2)`
			`return None`

			`@property`
			`def hash_name(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> Optional[str]`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`match = self._hash_re.search(self._url)`
Move Link to models 2018-06-18 12:59:56 +02:00			`if match:`
			`return match.group(1)`
			`return None`

			`@property`
			`def show_url(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> Optional[str]`
Parse the url when creating a Link object. 2019-06-23 01:02:42 +02:00			`return posixpath.basename(self._url.split('#', 1)[0].split('?', 1)[0])`
Move Link to models 2018-06-18 12:59:56 +02:00
			`@property`
			`def is_wheel(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> bool`
Move wheel extension information to remove cycle imports 2018-11-30 08:14:07 +01:00			`return self.ext == WHEEL_EXTENSION`
Move Link to models 2018-06-18 12:59:56 +02:00
			`@property`
			`def is_artifact(self):`
add type annotations for pip._internal.models (#6065) 2018-12-17 12:12:36 +01:00			`# type: () -> bool`
Move Link to models 2018-06-18 12:59:56 +02:00			`"""`
			`Determines if this points to an actual artifact (e.g. a tarball) or if`
			`it points to an "abstract" thing like a path or a VCS location.`
			`"""`
			`from pip._internal.vcs import vcs`

			`if self.scheme in vcs.all_schemes:`
			`return False`

			`return True`