From dfa756aa6891c9043b57c24a09d712aa668dd9db Mon Sep 17 00:00:00 2001 From: Andrew Cheng Date: Fri, 29 Mar 2024 15:59:02 -0700 Subject: [PATCH] Allow source files to publish at by-hash paths Closes #1059 --- .github/workflows/scripts/install.sh | 2 +- CHANGES/1059.feature | 1 + pulp_deb/app/tasks/publishing.py | 38 +++++++++++------ .../functional/api/test_download_content.py | 42 +++++++++++++++++++ template_config.yml | 3 +- 5 files changed, 71 insertions(+), 15 deletions(-) create mode 100644 CHANGES/1059.feature diff --git a/.github/workflows/scripts/install.sh b/.github/workflows/scripts/install.sh index 07dae129..00e69e86 100755 --- a/.github/workflows/scripts/install.sh +++ b/.github/workflows/scripts/install.sh @@ -82,7 +82,7 @@ VARSYAML cat >> vars/main.yaml << VARSYAML pulp_env: {} -pulp_settings: {"allowed_content_checksums": ["md5", "sha1", "sha256", "sha512"], "allowed_export_paths": ["/tmp"], "allowed_import_paths": ["/tmp"]} +pulp_settings: {"allowed_content_checksums": ["md5", "sha1", "sha256", "sha512"], "allowed_export_paths": ["/tmp"], "allowed_import_paths": ["/tmp"], "apt_by_hash": true} pulp_scheme: https pulp_default_container: ghcr.io/pulp/pulp-ci-centos9:latest VARSYAML diff --git a/CHANGES/1059.feature b/CHANGES/1059.feature new file mode 100644 index 00000000..b9da22a8 --- /dev/null +++ b/CHANGES/1059.feature @@ -0,0 +1 @@ +Extend publishing at by-hash paths to source files. diff --git a/pulp_deb/app/tasks/publishing.py b/pulp_deb/app/tasks/publishing.py index 7c3d301f..ebd641fc 100644 --- a/pulp_deb/app/tasks/publishing.py +++ b/pulp_deb/app/tasks/publishing.py @@ -365,19 +365,9 @@ def finish(self): # Generating metadata files using checksum if settings.APT_BY_HASH: - for path, index in ( - (package_index_path, package_index), - (gz_package_index_path, gz_package_index), - ): - for checksum in settings.ALLOWED_CONTENT_CHECKSUMS: - if checksum in CHECKSUM_TYPE_MAP: - hashed_index_path = _fetch_file_checksum(path, index, checksum) - hashed_index = PublishedMetadata.create_from_file( - publication=self.parent.publication, - file=File(open(path, "rb")), - relative_path=hashed_index_path, - ) - hashed_index.save() + self.generate_by_hash( + package_index_path, package_index, gz_package_index_path, gz_package_index + ) self.parent.add_metadata(package_index) self.parent.add_metadata(gz_package_index) @@ -394,9 +384,31 @@ def finish(self): publication=self.parent.publication, file=File(open(gz_source_index_path, "rb")) ) gz_source_index.save() + + # Generating metadata files using checksum + if settings.APT_BY_HASH: + self.generate_by_hash( + source_index_path, source_index, gz_source_index_path, gz_source_index + ) + self.parent.add_metadata(source_index) self.parent.add_metadata(gz_source_index) + def generate_by_hash(self, index_path, index, gz_index_path, gz_index): + for path, index in ( + (index_path, index), + (gz_index_path, gz_index), + ): + for checksum in settings.ALLOWED_CONTENT_CHECKSUMS: + if checksum in CHECKSUM_TYPE_MAP: + hashed_index_path = _fetch_file_checksum(path, index, checksum) + hashed_index = PublishedMetadata.create_from_file( + publication=self.parent.publication, + file=File(open(path, "rb")), + relative_path=hashed_index_path, + ) + hashed_index.save() + class _ReleaseHelper: def __init__( diff --git a/pulp_deb/tests/functional/api/test_download_content.py b/pulp_deb/tests/functional/api/test_download_content.py index 0c4290b5..26b52fb8 100644 --- a/pulp_deb/tests/functional/api/test_download_content.py +++ b/pulp_deb/tests/functional/api/test_download_content.py @@ -3,11 +3,13 @@ import os import pytest import hashlib +import re from random import choice from urllib.parse import urljoin from pulp_deb.tests.functional.constants import ( DEB_FIXTURE_STANDARD_REPOSITORY_NAME, + DEB_FIXTURE_SINGLE_DIST, DEB_GENERIC_CONTENT_NAME, DEB_PACKAGE_NAME, DEB_PACKAGE_RELEASE_COMPONENT_NAME, @@ -204,3 +206,43 @@ def test_download_cached_content( content_hash = hashlib.sha256(content).hexdigest() assert package_hash == content_hash + + +@pytest.mark.parallel +def test_apt_by_hash( + deb_init_and_sync, + deb_publication_factory, + deb_distribution_factory, + deb_get_content_types, + download_content_unit, +): + """Verify that deb and deb source content is available in the by-hash path.""" + # Create/sync a repo and then do a publish and create a distro + repo, _ = deb_init_and_sync(remote_args={"sync_sources": True}) + deb_publication_factory(repo, structured=True, simple=True) + distribution = deb_distribution_factory(repository=repo) + + # Obtain the Release file and parse out the sha256 + release_metadata = deb_get_content_types( + "apt_release_file_api", DEB_RELEASE_FILE_NAME, repo, repo.latest_version_href + ) + single_release_metadata = next( + release for release in release_metadata if release.distribution == DEB_FIXTURE_SINGLE_DIST + ) + release_file_path = next( + key for key in single_release_metadata.artifacts.keys() if key.endswith("/Release") + ) + release_file = download_content_unit(distribution.base_path, release_file_path).decode("utf-8") + sha256_section = release_file.split("SHA256:")[1].split("SHA512:")[0].strip() + sha256_pattern = re.compile( + r"([a-fA-F0-9]{64})\s+\d+\s+([^/\s]+/[^/\s]+)/(Packages|Sources)(?:\s|\n)" + ) + matches = sha256_pattern.findall(sha256_section) + sha256_dict = {path: sha for sha, path, _ in matches} + + # Verify that all by-hash files are available + for path, sha256 in sha256_dict.items(): + content_url = f"dists/{DEB_FIXTURE_SINGLE_DIST}/{path}/by-hash/SHA256/{sha256}" + assert "404" not in download_content_unit(distribution.base_path, content_url).decode( + "utf-8" + ) diff --git a/template_config.yml b/template_config.yml index 9e223d18..a3fe2fca 100644 --- a/template_config.yml +++ b/template_config.yml @@ -1,7 +1,7 @@ # This config represents the latest values used when running the plugin-template. Any settings that # were not present before running plugin-template have been added with their default values. -# generated with plugin_template@2021.08.26-354-g82d22de +# generated with plugin_template@2021.08.26-349-gba81617 api_root: /pulp/ black: true @@ -56,6 +56,7 @@ pulp_settings: - /tmp allowed_import_paths: - /tmp + apt_by_hash: true pulp_settings_azure: null pulp_settings_gcp: null pulp_settings_s3: null