From 4dc3c5789f45116bd2ca0e1efb0b39572da102b5 Mon Sep 17 00:00:00 2001 From: Ee Durbin Date: Tue, 18 Jun 2024 12:09:09 -0400 Subject: [PATCH] implement a /digest/{project_name}/{sha256,blake2b_256}:{file_digest} endpoint This is a sketch of an implementation for #23, mostly to consider the ergonomics. --- conveyor/config.py | 22 +++++++++++++++++++++- conveyor/views.py | 45 +++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 66 insertions(+), 1 deletion(-) diff --git a/conveyor/config.py b/conveyor/config.py index d3baa4f..beb047e 100644 --- a/conveyor/config.py +++ b/conveyor/config.py @@ -19,7 +19,7 @@ from aiohttp.web_middlewares import normalize_path_middleware from aiobotocore.session import get_session as aiobotocore_get_session -from .views import not_found, redirect, health, documentation, documentation_top, index +from .views import not_found, redirect, health, documentation, documentation_top, index, content_sha256, content_blake2b_256 from .tasks import redirects_refresh_task @@ -81,6 +81,26 @@ def _cached_aiobotocore_session(): "/packages/{python_version}/{project_l}/{project_name}/{filename}", redirect, ) + app.router.add_route( + "GET", + "/digest/{project_name}/sha256:{file_sha256}", + content_sha256, + ) + app.router.add_route( + "HEAD", + "/digest/{project_name}/sha256:{file_sha256}", + content_sha256, + ) + app.router.add_route( + "GET", + "/digest/{project_name}/blake2b_256:{file_blake2b_256}", + content_blake2b_256, + ) + app.router.add_route( + "HEAD", + "/digest/{project_name}/blake2b_256:{file_blake2b_256}", + content_blake2b_256, + ) app.router.add_route( "GET", "/packages/{tail:.*}", diff --git a/conveyor/views.py b/conveyor/views.py index 9c03865..b64a755 100644 --- a/conveyor/views.py +++ b/conveyor/views.py @@ -74,6 +74,51 @@ async def _normalize_filename(filename): return filename +async def content_by_hash(request, digest=None, file_digest=None): + project_name = request.match_info["project_name"] + json_url = urllib.parse.urljoin( + request.app["settings"]["endpoint"], + "/pypi/{}/json".format(project_name), + ) + + async with request.app["http.session"].get(json_url) as resp: + if 400 <= resp.status < 500: + return web.Response(status=resp.status) + elif 500 <= resp.status < 600: + return web.Response(status=503) + + # It shouldn't be possible to get a status code other than 200 here. + assert resp.status == 200 + + # Get the JSON data from our request. + data = await resp.json() + + # Look at all of the files listed in the JSON response, and see if one + # matches our filename and Python version. If we find one, then return a + # 302 redirect to that URL. + for release in data.get("releases", {}).values(): + for file_ in release: + if file_['digests'][digest] == file_digest: + return web.Response( + status=302, + headers={ + "Location": file_["url"], + "Cache-Control": "max-age=604800, public", + }, + ) + + # If we've gotten to this point, it means that we couldn't locate an url + # to redirect to so we'll jsut 404. + return web.Response(status=404, headers={"Reason": "no file found"}) + + +async def content_sha256(request): + return await content_by_hash(request, digest="sha256", file_digest=request.match_info["file_sha256"]) + +async def content_blake2b_256(request): + return await content_by_hash(request, digest="blake2b_256", file_digest=request.match_info["file_blake2b_256"]) + + async def redirect(request): python_version = request.match_info["python_version"] project_l = request.match_info["project_l"]