|
| 1 | +import json |
1 | 2 | import logging
|
2 | 3 | import requests
|
3 | 4 |
|
|
23 | 24 | from packaging.utils import canonicalize_name
|
24 | 25 | from urllib.parse import urljoin, urlparse, urlunsplit
|
25 | 26 | from pathlib import PurePath
|
26 |
| -from pypi_simple import parse_links_stream_response |
| 27 | +from pypi_simple import ACCEPT_JSON_PREFERRED, ProjectPage |
27 | 28 |
|
28 | 29 | from pulpcore.plugin.viewsets import OperationPostponedResponse
|
29 | 30 | from pulpcore.plugin.tasking import dispatch
|
|
45 | 46 | python_content_to_json,
|
46 | 47 | PYPI_LAST_SERIAL,
|
47 | 48 | PYPI_SERIAL_CONSTANT,
|
| 49 | + get_remote_package_filter, |
48 | 50 | )
|
49 | 51 |
|
50 | 52 | from pulp_python.app import tasks
|
@@ -232,27 +234,31 @@ def list(self, request, path):
|
232 | 234 |
|
233 | 235 | def pull_through_package_simple(self, package, path, remote):
|
234 | 236 | """Gets the package's simple page from remote."""
|
235 |
| - def parse_url(link): |
236 |
| - parsed = urlparse(link.url) |
237 |
| - digest, _, value = parsed.fragment.partition('=') |
| 237 | + def parse_package(dis_package): |
| 238 | + parsed = urlparse(dis_package.url) |
238 | 239 | stripped_url = urlunsplit(chain(parsed[:3], ("", "")))
|
239 |
| - redirect = f'{path}/{link.text}?redirect={stripped_url}' |
240 |
| - d_url = urljoin(self.base_content_url, redirect) |
241 |
| - return link.text, d_url, value if digest == 'sha256' else '' |
| 240 | + redirect_path = f'{path}/{dis_package.filename}?redirect={stripped_url}' |
| 241 | + d_url = urljoin(self.base_content_url, redirect_path) |
| 242 | + return dis_package.filename, d_url, dis_package.digests.get("sha256", "") |
| 243 | + |
| 244 | + rfilter = get_remote_package_filter(remote) |
| 245 | + if not rfilter.filter_project(package): |
| 246 | + return Http404(f"{package} does not exist.") |
242 | 247 |
|
243 | 248 | url = remote.get_remote_artifact_url(f'simple/{package}/')
|
244 |
| - kwargs = {} |
245 |
| - if proxy_url := remote.proxy_url: |
246 |
| - if remote.proxy_username or remote.proxy_password: |
247 |
| - parsed_proxy = urlparse(proxy_url) |
248 |
| - netloc = f"{remote.proxy_username}:{remote.proxy_password}@{parsed_proxy.netloc}" |
249 |
| - proxy_url = urlunsplit((parsed_proxy.scheme, netloc, "", "", "")) |
250 |
| - kwargs["proxies"] = {"http": proxy_url, "https": proxy_url} |
251 |
| - |
252 |
| - response = requests.get(url, stream=True, **kwargs) |
253 |
| - links = parse_links_stream_response(response) |
254 |
| - packages = (parse_url(link) for link in links) |
255 |
| - return StreamingHttpResponse(write_simple_detail(package, packages, streamed=True)) |
| 249 | + remote.headers.append({"Accept": ACCEPT_JSON_PREFERRED}) |
| 250 | + downloader = remote.get_downloader(url=url, max_retries=1) |
| 251 | + try: |
| 252 | + d = downloader.fetch() |
| 253 | + except Exception: |
| 254 | + return Http404(f"Could not find {package}.") |
| 255 | + |
| 256 | + if d.headers["content-type"] == "application/vnd.pypi.simple.v1+json": |
| 257 | + page = ProjectPage.from_json_data(json.load(open(d.path, "rb"), base_url=remote.url)) |
| 258 | + else: |
| 259 | + page = ProjectPage.from_html(package, open(d.path, "rb").read(), base_url=remote.url) |
| 260 | + packages = [parse_package(p) for p in page.packages if rfilter.filter_release(package, p.version)] |
| 261 | + return Response(write_simple_detail(package, packages)) |
256 | 262 |
|
257 | 263 | @extend_schema(operation_id="pypi_simple_package_read", summary="Get package simple page")
|
258 | 264 | def retrieve(self, request, path, package):
|
|
0 commit comments