From c23740641c5895965c92b9ab8343db250f213a65 Mon Sep 17 00:00:00 2001 From: Michael Kopf Date: Tue, 3 Dec 2024 12:16:57 +0100 Subject: [PATCH 1/4] make oras-py behave the same way as oras-go for deciding whether to unpack a tar layer or not Signed-off-by: Michael Kopf --- CHANGELOG.md | 1 + oras/provider.py | 53 ++++++++++++++++++++++------------------- oras/tests/test_oras.py | 19 +++++++++++++++ 3 files changed, 49 insertions(+), 24 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index f7f7f9d..aa071c9 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -14,6 +14,7 @@ and **Merged pull requests**. Critical items to know are: The versions coincide with releases on pip. Only major versions will be released as tags on Github. ## [0.0.x](https://github.com/oras-project/oras-py/tree/main) (0.0.x) + - use same annotation as oras-go for determining whether to unpack a layer or not - retry on 500 (0.2.25) - align provider config_path type annotations (0.2.24) - add missing prefix property to auth backend (0.2.23) diff --git a/oras/provider.py b/oras/provider.py index 1bb94a7..eaeaee3 100644 --- a/oras/provider.py +++ b/oras/provider.py @@ -760,23 +760,24 @@ def push( f"Blob {blob} is not in the present working directory context." ) - # Save directory or blob name before compressing - blob_name = os.path.basename(blob) - # If it's a directory, we need to compress - cleanup_blob = False - if os.path.isdir(blob): - blob = oras.utils.make_targz(blob) - cleanup_blob = True + is_dir_layer = os.path.isdir(blob) + blob_to_use_for_layer = ( + oras.utils.make_targz(blob) if is_dir_layer else blob + ) # Create a new layer from the blob - layer = oras.oci.NewLayer(blob, is_dir=cleanup_blob, media_type=media_type) + layer = oras.oci.NewLayer( + blob_to_use_for_layer, is_dir=is_dir_layer, media_type=media_type + ) annotations = annotset.get_annotations(blob) # Always strip blob_name of path separator - layer["annotations"] = { - oras.defaults.annotation_title: blob_name.strip(os.sep) - } + layer["annotations"] = {oras.defaults.annotation_title: blob.strip(os.sep)} + + if is_dir_layer: + layer["annotations"][oras.defaults.annotation_unpack] = "True" + if annotations: layer["annotations"].update(annotations) @@ -786,7 +787,7 @@ def push( # Upload the blob layer response = self.upload_blob( - blob, + blob_to_use_for_layer, container, layer, do_chunked=do_chunked, @@ -795,8 +796,8 @@ def push( self._check_200_response(response) # Do we need to cleanup a temporary targz? - if cleanup_blob and os.path.exists(blob): - os.remove(blob) + if is_dir_layer and os.path.exists(blob_to_use_for_layer): + os.remove(blob_to_use_for_layer) # Add annotations to the manifest, if provided manifest_annots = annotset.get_annotations("$manifest") or {} @@ -851,22 +852,23 @@ def pull( allowed_media_type: Optional[List] = None, overwrite: bool = True, outdir: Optional[str] = None, + skip_unpack: bool = False, ) -> List[str]: """ Pull an artifact from a target + :param target: target location to pull from + :type target: str :param config_path: path to a config file :type config_path: str :param allowed_media_type: list of allowed media types :type allowed_media_type: list or None :param overwrite: if output file exists, overwrite :type overwrite: bool - :param manifest_config_ref: save manifest config to this file - :type manifest_config_ref: str :param outdir: output directory path :type outdir: str - :param target: target location to pull from - :type target: str + :param skip_unpack: skip unpacking layers + :type skip_unpack: bool """ container = self.get_container(target) self.auth.load_configs( @@ -878,9 +880,13 @@ def pull( files = [] for layer in manifest.get("layers", []): - filename = (layer.get("annotations") or {}).get( - oras.defaults.annotation_title - ) + annotations: dict = layer.get("annotations", {}) + filename = annotations.get(oras.defaults.annotation_title) + # A directory will need to be uncompressed and moved + unpack_layer = annotations.get(oras.defaults.annotation_unpack, False) + + if unpack_layer and skip_unpack: + filename += ".tar.gz" # If we don't have a filename, default to digest. Hopefully does not happen if not filename: @@ -895,8 +901,7 @@ def pull( ) continue - # A directory will need to be uncompressed and moved - if layer["mediaType"] == oras.defaults.default_blob_dir_media_type: + if unpack_layer and not skip_unpack: targz = oras.utils.get_tmpfile(suffix=".tar.gz") self.download_blob(container, layer["digest"], targz) @@ -906,7 +911,7 @@ def pull( # Anything else just extracted directly else: self.download_blob(container, layer["digest"], outfile) - logger.info(f"Successfully pulled {outfile}.") + logger.info(f"Successfully pulled {outfile}") files.append(outfile) return files diff --git a/oras/tests/test_oras.py b/oras/tests/test_oras.py index 7ebff96..75a0f2c 100644 --- a/oras/tests/test_oras.py +++ b/oras/tests/test_oras.py @@ -161,6 +161,25 @@ def test_directory_push_pull(tmp_path, registry, credentials, target_dir): assert "artifact.txt" in os.listdir(files[0]) +@pytest.mark.with_auth(False) +def test_directory_push_pull_skip_unpack(tmp_path, registry, credentials, target_dir): + """ + Test push and pull for directory + """ + client = oras.client.OrasClient(hostname=registry, insecure=True) + + # Test upload of a directory + upload_dir = os.path.join(here, "upload_data") + res = client.push(files=[upload_dir], target=target_dir) + assert res.status_code == 201 + files = client.pull(target=target_dir, outdir=tmp_path, skip_unpack=True) + + assert len(files) == 1 + assert os.path.basename(files[0]) == "upload_data.tar.gz" + assert str(tmp_path) in files[0] + assert os.path.exists(files[0]) + + @pytest.mark.with_auth(True) def test_directory_push_pull_selfsigned_auth( tmp_path, registry, credentials, target_dir From 7e161df14155cabb27708455a083c221b097ee12 Mon Sep 17 00:00:00 2001 From: Michael Kopf Date: Tue, 3 Dec 2024 14:06:50 +0100 Subject: [PATCH 2/4] add missing version in changelog Signed-off-by: Michael Kopf --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index aa071c9..c414e90 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -14,7 +14,7 @@ and **Merged pull requests**. Critical items to know are: The versions coincide with releases on pip. Only major versions will be released as tags on Github. ## [0.0.x](https://github.com/oras-project/oras-py/tree/main) (0.0.x) - - use same annotation as oras-go for determining whether to unpack a layer or not + - use same annotation as oras-go for determining whether to unpack a layer or not (0.2.26) - retry on 500 (0.2.25) - align provider config_path type annotations (0.2.24) - add missing prefix property to auth backend (0.2.23) From f5b230c211ed230c8d2ff2605cd35b639076fd6b Mon Sep 17 00:00:00 2001 From: Stefan Lietzau <104021830+stefansli@users.noreply.github.com> Date: Tue, 10 Dec 2024 16:50:24 +0100 Subject: [PATCH 3/4] Fix comments from review Signed-off-by: Stefan Lietzau <104021830+stefansli@users.noreply.github.com> --- CHANGELOG.md | 2 +- oras/provider.py | 7 +------ 2 files changed, 2 insertions(+), 7 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 5897f8f..c7de357 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -14,10 +14,10 @@ and **Merged pull requests**. Critical items to know are: The versions coincide with releases on pip. Only major versions will be released as tags on Github. ## [0.0.x](https://github.com/oras-project/oras-py/tree/main) (0.0.x) - - use same annotation as oras-go for determining whether to unpack a layer or not (0.2.26) - check for blob existence before uploading (0.2.26) - fix get_tags for ECR when limit is None, closes issue [173](https://github.com/oras-project/oras-py/issues/173) - fix empty token for anon tokens to work, closes issue [167](https://github.com/oras-project/oras-py/issues/167) + - use same annotation as oras-go for determining whether to unpack a layer or not [119](https://github.com/oras-project/oras-py/issues/119) - retry on 500 (0.2.25) - align provider config_path type annotations (0.2.24) - add missing prefix property to auth backend (0.2.23) diff --git a/oras/provider.py b/oras/provider.py index 677d9c0..11c13f0 100644 --- a/oras/provider.py +++ b/oras/provider.py @@ -888,8 +888,6 @@ def pull( :type overwrite: bool :param outdir: output directory path :type outdir: str - :param skip_unpack: skip unpacking layers - :type skip_unpack: bool """ container = self.get_container(target) self.auth.load_configs( @@ -906,9 +904,6 @@ def pull( # A directory will need to be uncompressed and moved unpack_layer = annotations.get(oras.defaults.annotation_unpack, False) - if unpack_layer and skip_unpack: - filename += ".tar.gz" - # If we don't have a filename, default to digest. Hopefully does not happen if not filename: filename = layer["digest"] @@ -922,7 +917,7 @@ def pull( ) continue - if unpack_layer and not skip_unpack: + if unpack_layer: targz = oras.utils.get_tmpfile(suffix=".tar.gz") self.download_blob(container, layer["digest"], targz) From 32982ea366165cde25d1002b5e1d3a40a3efaeb6 Mon Sep 17 00:00:00 2001 From: Stefan Lietzau <104021830+stefansli@users.noreply.github.com> Date: Tue, 10 Dec 2024 17:10:48 +0100 Subject: [PATCH 4/4] Fix test_directory_push_pull_skip_unpack Rewrite test to test the functionality to only unpack if the annotation is set. Signed-off-by: Stefan Lietzau <104021830+stefansli@users.noreply.github.com> --- oras/tests/test_oras.py | 14 ++++++++++---- 1 file changed, 10 insertions(+), 4 deletions(-) diff --git a/oras/tests/test_oras.py b/oras/tests/test_oras.py index 75a0f2c..ebb8e6e 100644 --- a/oras/tests/test_oras.py +++ b/oras/tests/test_oras.py @@ -2,12 +2,14 @@ __copyright__ = "Copyright The ORAS Authors." __license__ = "Apache-2.0" +import json import os import shutil import pytest import oras.client +import oras.oci here = os.path.abspath(os.path.dirname(__file__)) @@ -168,14 +170,18 @@ def test_directory_push_pull_skip_unpack(tmp_path, registry, credentials, target """ client = oras.client.OrasClient(hostname=registry, insecure=True) - # Test upload of a directory + # Test upload of a directory with an annotation file setting oras.defaults.annotation_unpack to False upload_dir = os.path.join(here, "upload_data") - res = client.push(files=[upload_dir], target=target_dir) + annotation_file = os.path.join(here, "annotations.json") + with open(annotation_file, "w") as f: + json.dump({str(upload_dir):{"oras.defaults.annotation_unpack": "False"}}, f) + + res = client.push(files=[upload_dir], target=target_dir, annotation_file=annotation_file) assert res.status_code == 201 - files = client.pull(target=target_dir, outdir=tmp_path, skip_unpack=True) + files = client.pull(target=target_dir, outdir=tmp_path) assert len(files) == 1 - assert os.path.basename(files[0]) == "upload_data.tar.gz" + assert os.path.basename(files[0]) == os.path.basename(upload_dir) assert str(tmp_path) in files[0] assert os.path.exists(files[0])