123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163 |
- import posixpath
- import re
-
- from pip._vendor.six.moves.urllib import parse as urllib_parse
-
- from pip._internal.download import path_to_url
- from pip._internal.utils.misc import (
- WHEEL_EXTENSION, redact_password_from_url, splitext,
- )
- from pip._internal.utils.models import KeyBasedCompareMixin
- from pip._internal.utils.typing import MYPY_CHECK_RUNNING
-
- if MYPY_CHECK_RUNNING:
- from typing import Optional, Tuple, Union, Text # noqa: F401
- from pip._internal.index import HTMLPage # noqa: F401
-
-
- class Link(KeyBasedCompareMixin):
- """Represents a parsed link from a Package Index's simple URL
- """
-
- def __init__(self, url, comes_from=None, requires_python=None):
- # type: (str, Optional[Union[str, HTMLPage]], Optional[str]) -> None
- """
- url:
- url of the resource pointed to (href of the link)
- comes_from:
- instance of HTMLPage where the link was found, or string.
- requires_python:
- String containing the `Requires-Python` metadata field, specified
- in PEP 345. This may be specified by a data-requires-python
- attribute in the HTML link tag, as described in PEP 503.
- """
-
- # url can be a UNC windows share
- if url.startswith('\\\\'):
- url = path_to_url(url)
-
- self.url = url
- self.comes_from = comes_from
- self.requires_python = requires_python if requires_python else None
-
- super(Link, self).__init__(
- key=(self.url),
- defining_class=Link
- )
-
- def __str__(self):
- if self.requires_python:
- rp = ' (requires-python:%s)' % self.requires_python
- else:
- rp = ''
- if self.comes_from:
- return '%s (from %s)%s' % (redact_password_from_url(self.url),
- self.comes_from, rp)
- else:
- return redact_password_from_url(str(self.url))
-
- def __repr__(self):
- return '<Link %s>' % self
-
- @property
- def filename(self):
- # type: () -> str
- _, netloc, path, _, _ = urllib_parse.urlsplit(self.url)
- name = posixpath.basename(path.rstrip('/')) or netloc
- name = urllib_parse.unquote(name)
- assert name, ('URL %r produced no filename' % self.url)
- return name
-
- @property
- def scheme(self):
- # type: () -> str
- return urllib_parse.urlsplit(self.url)[0]
-
- @property
- def netloc(self):
- # type: () -> str
- return urllib_parse.urlsplit(self.url)[1]
-
- @property
- def path(self):
- # type: () -> str
- return urllib_parse.unquote(urllib_parse.urlsplit(self.url)[2])
-
- def splitext(self):
- # type: () -> Tuple[str, str]
- return splitext(posixpath.basename(self.path.rstrip('/')))
-
- @property
- def ext(self):
- # type: () -> str
- return self.splitext()[1]
-
- @property
- def url_without_fragment(self):
- # type: () -> str
- scheme, netloc, path, query, fragment = urllib_parse.urlsplit(self.url)
- return urllib_parse.urlunsplit((scheme, netloc, path, query, None))
-
- _egg_fragment_re = re.compile(r'[#&]egg=([^&]*)')
-
- @property
- def egg_fragment(self):
- # type: () -> Optional[str]
- match = self._egg_fragment_re.search(self.url)
- if not match:
- return None
- return match.group(1)
-
- _subdirectory_fragment_re = re.compile(r'[#&]subdirectory=([^&]*)')
-
- @property
- def subdirectory_fragment(self):
- # type: () -> Optional[str]
- match = self._subdirectory_fragment_re.search(self.url)
- if not match:
- return None
- return match.group(1)
-
- _hash_re = re.compile(
- r'(sha1|sha224|sha384|sha256|sha512|md5)=([a-f0-9]+)'
- )
-
- @property
- def hash(self):
- # type: () -> Optional[str]
- match = self._hash_re.search(self.url)
- if match:
- return match.group(2)
- return None
-
- @property
- def hash_name(self):
- # type: () -> Optional[str]
- match = self._hash_re.search(self.url)
- if match:
- return match.group(1)
- return None
-
- @property
- def show_url(self):
- # type: () -> Optional[str]
- return posixpath.basename(self.url.split('#', 1)[0].split('?', 1)[0])
-
- @property
- def is_wheel(self):
- # type: () -> bool
- return self.ext == WHEEL_EXTENSION
-
- @property
- def is_artifact(self):
- # type: () -> bool
- """
- Determines if this points to an actual artifact (e.g. a tarball) or if
- it points to an "abstract" thing like a path or a VCS location.
- """
- from pip._internal.vcs import vcs
-
- if self.scheme in vcs.all_schemes:
- return False
-
- return True
|