From 444f74f5db10525d091322b38c8620861c997d42 Mon Sep 17 00:00:00 2001
From: "Kacper Kowalik (Xarthisius)" <xarthisius.kk@gmail.com>
Date: Thu, 29 Jan 2026 08:18:03 -0600
Subject: [PATCH 1/6] Add verify-package, rename verify to verify-timestamp

---
 pyproject.toml         |   1 +
 tro_utils/cli.py       | 105 ++++++++++++++++++++++++---
 tro_utils/tro_utils.py | 158 +++++++++++++++++++++++++++++++++++++----
 3 files changed, 240 insertions(+), 24 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index ddbef7a..74efb4a 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -22,6 +22,7 @@ dependencies = [
   "python-magic",
   "rfc3161ng",
   "graphviz",
+  "rich",
 ]
 requires-python = ">= 3.10"
 license = {file = "LICENSE"}
diff --git a/tro_utils/cli.py b/tro_utils/cli.py
index 301c73a..250a3fb 100644
--- a/tro_utils/cli.py
+++ b/tro_utils/cli.py
@@ -3,10 +3,14 @@
 import sys
 
 import click
+from rich.console import Console
+from rich.table import Table
 
 from . import TRPAttribute
 from .tro_utils import TRO
 
+console = Console()
+
 _TEMPLATES = {
     "default": {
         "description": "Default pretty template by Craig Willis",
@@ -101,21 +105,104 @@ def cli(
 
 
 @cli.command(help="Verify that TRO is signed and timestamped correctly")
-@click.pass_context
-def verify(ctx):
-    declaration = ctx.parent.params.get("declaration")
-    gpg_fingerprint = ctx.parent.params.get("gpg_fingerprint")
-    gpg_passphrase = ctx.parent.params.get("gpg_passphrase")
-    profile = ctx.parent.params.get("profile")
+@click.argument("declaration", type=click.Path(exists=True))
+def verify_timestamp(declaration):
     tro = TRO(
         filepath=declaration,
-        gpg_fingerprint=gpg_fingerprint,
-        gpg_passphrase=gpg_passphrase,
-        profile=profile,
     )
     tro.verify_timestamp()
 
 
+@cli.command(help="Verify the integrity of the TRO")
+@click.argument("declaration", type=click.Path(exists=True))
+@click.argument(
+    "package",
+    type=click.Path(exists=True),
+)
+@click.option(
+    "--arrangement-id",
+    "-a",
+    type=click.STRING,
+    required=False,
+    help="ID of the arrangement to verify. If not provided all arrangements will be tried",
+)
+@click.option(
+    "--subpath",
+    "-s",
+    type=click.STRING,
+    required=False,
+    help="Subpath within the package structure, e.g. if arrangement is stored in a subdirectory",
+)
+@click.option(
+    "--verbose",
+    "-v",
+    is_flag=True,
+    help="Show detailed information during verification",
+)
+def verify_package(declaration, package, arrangement_id, subpath, verbose):
+    subpath = subpath if subpath else ""
+    tro = TRO(
+        filepath=declaration,
+    )
+    if not arrangement_id:
+        arrangements = [a["@id"] for a in tro.list_arrangements()]
+    else:
+        arrangements = [arrangement_id]
+
+    for arrangement in arrangements:
+        msg = (
+            f"Verifying that arrangement '{arrangement}' matches package contents "
+            f"of '{package}"
+        )
+        if subpath:
+            msg += f"::{subpath}"
+        msg += "'"
+        click.echo(msg, nl=False)
+        extra, mismatched, missing, success = tro.verify_replication_package(
+            arrangement, package, subpath
+        )
+        if success:
+            click.secho(" ✓", fg="green")
+        else:
+            click.secho(" ✗", fg="red")
+
+        if extra and verbose:
+            table = Table(
+                title="[bold red]Extra Files Found[/bold red]", show_header=False
+            )
+            table.add_column("File", style="yellow")
+            for e in extra:
+                table.add_row(e)
+            console.print(table)
+            console.print()
+
+        if mismatched and verbose:
+            table = Table(title="[bold red]Mismatched Files Found[/bold red]")
+            table.add_column("File", style="cyan")
+            table.add_column("Expected Hash", style="green")
+            table.add_column("Actual Hash", style="red")
+            for filepath, expected_hash, actual_hash in mismatched:
+                expected_display = (
+                    expected_hash[:16] + "..." if expected_hash else "[dim]None[/dim]"
+                )
+                actual_display = (
+                    actual_hash[:16] + "..." if actual_hash else "[dim]None[/dim]"
+                )
+                table.add_row(filepath, expected_display, actual_display)
+            console.print(table)
+            console.print()
+
+        if missing and verbose:
+            table = Table(
+                title="[bold red]Missing Files Found[/bold red]", show_header=False
+            )
+            table.add_column("File", style="magenta")
+            for m in missing:
+                table.add_row(m)
+            console.print(table)
+            console.print()
+
+
 @cli.group(help="Manage arrangements in the TRO")
 def arrangement():
     pass
diff --git a/tro_utils/tro_utils.py b/tro_utils/tro_utils.py
index 55eaba6..5794f6c 100644
--- a/tro_utils/tro_utils.py
+++ b/tro_utils/tro_utils.py
@@ -6,6 +6,7 @@
 import pathlib
 import subprocess
 import tempfile
+import zipfile
 
 import datetime
 import gnupg
@@ -61,13 +62,16 @@ def __init__(
                         "rdf": "http://www.w3.org/1999/02/22-rdf-syntax-ns#",
                         "rdfs": "http://www.w3.org/2000/01/rdf-schema#",
                         "trov": "https://w3id.org/trace/2023/05/trov#",
-                        "schema": "https://schema.org"
+                        "schema": "https://schema.org",
                     }
                 ],
                 "@graph": [
                     {
                         "@id": "tro",
-                        "@type": ["trov:TransparentResearchObject", "schema:CreativeWork"],
+                        "@type": [
+                            "trov:TransparentResearchObject",
+                            "schema:CreativeWork",
+                        ],
                         "schema:creator": tro_creator or "TRO utils",
                         "schema:name": tro_name or "Some TRO",
                         "schema:description": tro_description or "Some description",
@@ -82,7 +86,10 @@ def __init__(
                         "trov:hasPerformance": [],
                         "trov:wasAssembledBy": {
                             "@id": "trs",
-                            "@type": ["trov:TrustedResearchSystem", "schema:Organization"],
+                            "@type": [
+                                "trov:TrustedResearchSystem",
+                                "schema:Organization",
+                            ],
                             **self.profile,
                         },
                     },
@@ -155,6 +162,54 @@ def update_composition(self, composition):
     def list_arrangements(self):
         return self.data["@graph"][0]["trov:hasArrangement"]
 
+    def get_arrangement_path_hash_map(self, arrangement_id):
+        """
+        Get a mapping of paths to hashes for a specific arrangement.
+
+        Args:
+            arrangement_id: The ID of the arrangement (e.g., "arrangement/0")
+
+        Returns:
+            dict: A dictionary mapping file paths to their SHA256 hashes
+
+        Raises:
+            ValueError: If the arrangement ID does not exist
+        """
+        # Find the arrangement
+        arrangement = None
+        for arr in self.data["@graph"][0]["trov:hasArrangement"]:
+            if arr["@id"] == arrangement_id:
+                arrangement = arr
+                break
+
+        if arrangement is None:
+            available = [
+                arr["@id"] for arr in self.data["@graph"][0]["trov:hasArrangement"]
+            ]
+            raise ValueError(
+                f"Arrangement '{arrangement_id}' not found. "
+                f"Available arrangements: {available}"
+            )
+
+        # Build a composition lookup map (artifact id -> hash)
+        composition_map = {
+            artifact["@id"]: artifact["trov:sha256"]
+            for artifact in self.data["@graph"][0]["trov:hasComposition"][
+                "trov:hasArtifact"
+            ]
+        }
+
+        # Build the path -> hash mapping
+        path_hash_map = {}
+        for locus in arrangement.get("trov:hasLocus", []):
+            path = locus["trov:hasLocation"]
+            artifact_id = locus["trov:hasArtifact"]["@id"]
+            hash_value = composition_map.get(artifact_id)
+            if hash_value:
+                path_hash_map[path] = hash_value
+
+        return path_hash_map
+
     def add_arrangement(
         self, directory, ignore_dirs=None, comment=None, resolve_symlinks=True
     ):
@@ -178,10 +233,12 @@ def add_arrangement(
             if os.path.islink(filepath):
                 mime_type = "inode/symlink"
             else:
-                mime_type = magic_wrapper.from_file(filepath) or "application/octet-stream"
+                mime_type = (
+                    magic_wrapper.from_file(filepath) or "application/octet-stream"
+                )
             composition[hash_value] = {
                 "@id": f"composition/1/artifact/{i}",
-                "trov:mimeType": mime_type
+                "trov:mimeType": mime_type,
             }
             i += 1
 
@@ -224,6 +281,18 @@ def sha256_for_file(filepath, resolve_symlinks=True):
                 sha256.update(chunk)
         return sha256.hexdigest()
 
+    @staticmethod
+    def sha256_for_zipfile(zipfilepath):
+        hashes = {}
+        with zipfile.ZipFile(zipfilepath, "r") as zf:
+            for fileinfo in zf.infolist():
+                sha256 = hashlib.sha256()
+                with zf.open(fileinfo.filename) as f:
+                    for chunk in iter(lambda: f.read(4096), b""):
+                        sha256.update(chunk)
+                hashes[fileinfo.filename] = sha256.hexdigest()
+        return hashes
+
     def sha256_for_directory(self, directory, ignore_dirs=None, resolve_symlinks=True):
         if ignore_dirs is None:
             ignore_dirs = [".git"]  # Default ignore list
@@ -232,7 +301,9 @@ def sha256_for_directory(self, directory, ignore_dirs=None, resolve_symlinks=Tru
             dirs[:] = [d for d in dirs if d not in ignore_dirs]
             for filename in files:
                 filepath = os.path.join(root, filename)
-                hash_value = self.sha256_for_file(filepath, resolve_symlinks=resolve_symlinks)
+                hash_value = self.sha256_for_file(
+                    filepath, resolve_symlinks=resolve_symlinks
+                )
                 hashes[filepath] = hash_value
         return hashes
 
@@ -273,12 +344,11 @@ def get_composition_info(self):
     def verify_timestamp(self):
         """Verify that a run is valid and signed."""
 
-        if os.path.exists(self.sig_filename):
+        try:
             with open(self.sig_filename, "rb") as fp:
                 trs_signature = fp.read()
-        else:
-            print("computing")
-            trs_signature = str(self.trs_signature()).encode("utf-8")
+        except FileNotFoundError:
+            raise RuntimeError("Signature file does not exist")
 
         ts_data = {
             "tro_declaration": hashlib.sha512(
@@ -328,6 +398,58 @@ def verify_timestamp(self):
             ]
             subprocess.check_call(args)
 
+    def verify_replication_package(self, arrangement_id, package, subpath=None):
+        files_missing_in_arrangement = []
+        mismatched_hashes = []
+
+        arrangement_map = self.get_arrangement_path_hash_map(arrangement_id)
+
+        # Generator to yield (relative_filename, file_hash) tuples
+        def iterate_package_files():
+            if os.path.isdir(package):
+                for root, dirs, files in os.walk(package):
+                    for filename in files:
+                        filepath = os.path.join(root, filename)
+                        relative_filename = os.path.relpath(filepath, package)
+                        file_hash = self.sha256_for_file(filepath)
+                        yield relative_filename, file_hash
+            else:
+                with zipfile.ZipFile(package, "r") as zf:
+                    for fileinfo in zf.infolist():
+                        sha256 = hashlib.sha256()
+                        with zf.open(fileinfo.filename) as f:
+                            for chunk in iter(lambda: f.read(4096), b""):
+                                sha256.update(chunk)
+                        file_hash = sha256.hexdigest()
+                        yield fileinfo.filename, file_hash
+
+        for original_filename, file_hash in iterate_package_files():
+            relative_filename = original_filename
+
+            # Handle subpath filtering
+            if subpath is not None:
+                if not original_filename.startswith(subpath):
+                    continue
+                relative_filename = original_filename[len(subpath) :].lstrip("/")
+
+            # Check if file exists in arrangement
+            if relative_filename not in arrangement_map:
+                files_missing_in_arrangement.append(relative_filename)
+
+            # Verify hash
+            expected_hash = arrangement_map.pop(relative_filename, None)
+            if file_hash != expected_hash:
+                mismatched_hashes.append((relative_filename, expected_hash, file_hash))
+
+        dirty = (
+            files_missing_in_arrangement
+            or mismatched_hashes
+            or len(arrangement_map) > 0
+        )
+        return files_missing_in_arrangement, mismatched_hashes, list(
+            arrangement_map.keys()
+        ), not dirty
+
     def add_performance(
         self,
         start_time,
@@ -434,7 +556,9 @@ def generate_report(self, template, report):
         for trp in graph["trov:hasPerformance"]:
             description = trp["rdfs:comment"]
             accessed = arrangements[trp["trov:accessedArrangement"]["@id"]]["name"]
-            contributed = arrangements[trp["trov:contributedToArrangement"]["@id"]]["name"]
+            contributed = arrangements[trp["trov:contributedToArrangement"]["@id"]][
+                "name"
+            ]
             dot.node(description)
             dot.edge(accessed, description)
             dot.edge(description, contributed)
@@ -449,14 +573,18 @@ def generate_report(self, template, report):
 
         for n in reversed(range(1, len(keys))):
             for location in arrangements[keys[n]]["artifacts"]:
-                if location in arrangements[keys[n-1]]["artifacts"]:
+                if location in arrangements[keys[n - 1]]["artifacts"]:
                     if (
                         arrangements[keys[n]]["artifacts"][location]["sha256"]
-                        != arrangements[keys[n-1]]["artifacts"][location]["sha256"]
+                        != arrangements[keys[n - 1]]["artifacts"][location]["sha256"]
                     ):
-                        arrangements[keys[n]]["artifacts"][location]["status"] = "Changed"
+                        arrangements[keys[n]]["artifacts"][location][
+                            "status"
+                        ] = "Changed"
                     else:
-                        arrangements[keys[n]]["artifacts"][location]["status"] = "Unchanged"
+                        arrangements[keys[n]]["artifacts"][location][
+                            "status"
+                        ] = "Unchanged"
                 else:
                     arrangements[keys[n]]["artifacts"][location]["status"] = "Created"
 

From 6bae16d138fc600866f2d248d1dcb3dff236f9ef Mon Sep 17 00:00:00 2001
From: "Kacper Kowalik (Xarthisius)" <xarthisius.kk@gmail.com>
Date: Thu, 29 Jan 2026 08:39:28 -0600
Subject: [PATCH 2/6] Add tests

---
 tests/test_tro_utils.py | 401 ++++++++++++++++++++++++++++++++++++++++
 1 file changed, 401 insertions(+)

diff --git a/tests/test_tro_utils.py b/tests/test_tro_utils.py
index 2634c7a..9005862 100644
--- a/tests/test_tro_utils.py
+++ b/tests/test_tro_utils.py
@@ -475,6 +475,9 @@ def test_verify_timestamp(
         # Create a fake TSR file
         with open(tro.tsr_filename, "wb") as f:
             f.write(b"fake tsr data")
+        # Create a fake SIG file
+        with open(tro.sig_filename, "wb") as f:
+            f.write(b"fake sig data")
 
         # Verify timestamp
         tro.verify_timestamp()
@@ -859,3 +862,401 @@ def test_get_composition_info(self, temp_workspace, tmp_path, gpg_setup):
         assert "@type" in composition_info
         assert "trov:hasArtifact" in composition_info
         assert len(composition_info["trov:hasArtifact"]) > 0
+
+
+class TestReplicationPackageVerification:
+    """Test verification of replication packages against arrangements."""
+
+    def test_verify_identical_directory(self, temp_workspace, tmp_path, gpg_setup):
+        """Test verifying a directory that exactly matches the arrangement."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Verify the same directory
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(temp_workspace))
+
+        # Should be identical
+        assert is_valid is True
+        assert len(missing) == 0
+        assert len(mismatched) == 0
+        assert len(extra) == 0
+
+    def test_verify_directory_with_modified_file(
+        self, temp_workspace, tmp_path, gpg_setup
+    ):
+        """Test verifying a directory where a file has been modified."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Modify a file in the workspace
+        (temp_workspace / "notes.txt").write_text("Modified content\n")
+
+        # Verify
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(temp_workspace))
+
+        # Should detect mismatch
+        assert is_valid is False
+        assert len(missing) == 0
+        assert len(mismatched) == 1
+        assert mismatched[0][0] == "notes.txt"  # filename
+        assert len(extra) == 0
+
+    def test_verify_directory_with_extra_file(
+        self, temp_workspace, tmp_path, gpg_setup
+    ):
+        """Test verifying a directory with an extra file not in arrangement."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Add a new file
+        (temp_workspace / "extra_file.txt").write_text("Extra content\n")
+
+        # Verify
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(temp_workspace))
+
+        # Should detect the extra file as missing in arrangement
+        # Also appears in mismatched because expected_hash is None
+        assert is_valid is False
+        assert len(missing) == 1
+        assert "extra_file.txt" in missing
+        assert len(mismatched) == 1
+        assert mismatched[0][0] == "extra_file.txt"
+        assert mismatched[0][1] is None  # No expected hash
+        assert len(extra) == 0
+
+    def test_verify_directory_with_missing_file(
+        self, temp_workspace, tmp_path, gpg_setup
+    ):
+        """Test verifying a directory missing a file from the arrangement."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Remove a file
+        (temp_workspace / "notes.txt").unlink()
+
+        # Verify
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(temp_workspace))
+
+        # Should detect the file as extra in arrangement (not found in package)
+        assert is_valid is False
+        assert len(missing) == 0
+        assert len(mismatched) == 0
+        assert len(extra) == 1
+        assert "notes.txt" in extra
+
+    def test_verify_zipfile_identical(self, temp_workspace, tmp_path, gpg_setup):
+        """Test verifying a zipfile that exactly matches the arrangement."""
+        import zipfile
+
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Create a zipfile with the same content
+        zip_path = tmp_path / "package.zip"
+        with zipfile.ZipFile(zip_path, "w") as zf:
+            for file in temp_workspace.iterdir():
+                if file.is_file():
+                    zf.write(file, file.name)
+
+        # Verify
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(zip_path))
+
+        # Should be identical
+        assert is_valid is True
+        assert len(missing) == 0
+        assert len(mismatched) == 0
+        assert len(extra) == 0
+
+    def test_verify_zipfile_with_modified_file(
+        self, temp_workspace, tmp_path, gpg_setup
+    ):
+        """Test verifying a zipfile where a file has been modified."""
+        import zipfile
+
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Create a zipfile with modified content
+        zip_path = tmp_path / "package.zip"
+        with zipfile.ZipFile(zip_path, "w") as zf:
+            for file in temp_workspace.iterdir():
+                if file.is_file():
+                    if file.name == "notes.txt":
+                        zf.writestr("notes.txt", "Modified content\n")
+                    else:
+                        zf.write(file, file.name)
+
+        # Verify
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(zip_path))
+
+        # Should detect mismatch
+        assert is_valid is False
+        assert len(missing) == 0
+        assert len(mismatched) == 1
+        assert mismatched[0][0] == "notes.txt"
+        assert len(extra) == 0
+
+    def test_verify_with_subpath_directory(self, tmp_path, gpg_setup):
+        """Test verifying a directory with subpath filtering."""
+        # Create a more complex directory structure
+        workspace = tmp_path / "workspace"
+        workspace.mkdir()
+
+        subdir = workspace / "data"
+        subdir.mkdir()
+        (subdir / "file1.txt").write_text("Content 1\n")
+        (subdir / "file2.txt").write_text("Content 2\n")
+
+        other = workspace / "other"
+        other.mkdir()
+        (other / "file3.txt").write_text("Content 3\n")
+
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement for the entire workspace
+        tro.add_arrangement(str(workspace), comment="Full workspace", ignore_dirs=[])
+
+        # Verify only the data subpath
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package(
+            "arrangement/0", str(workspace), subpath="data"
+        )
+
+        # Should verify only files in data/ subdirectory
+        # When checking with subpath, only files starting with subpath are checked
+        # The 'extra' list should contain files NOT checked (not in subpath) that are in arrangement
+        assert is_valid is False
+        assert (
+            len(extra) == 3
+        )  # All files are in extra because subpath filter leaves arrangement_map intact
+        assert "other/file3.txt" in extra
+        assert "data/file1.txt" in extra
+        assert "data/file2.txt" in extra
+
+    def test_verify_with_subpath_zipfile(self, tmp_path, gpg_setup):
+        """Test verifying a zipfile with subpath filtering."""
+        import zipfile
+
+        # Create a more complex directory structure
+        workspace = tmp_path / "workspace"
+        workspace.mkdir()
+
+        subdir = workspace / "data"
+        subdir.mkdir()
+        (subdir / "file1.txt").write_text("Content 1\n")
+        (subdir / "file2.txt").write_text("Content 2\n")
+
+        other = workspace / "other"
+        other.mkdir()
+        (other / "file3.txt").write_text("Content 3\n")
+
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement for the entire workspace
+        tro.add_arrangement(str(workspace), comment="Full workspace", ignore_dirs=[])
+
+        # Create a zipfile
+        zip_path = tmp_path / "package.zip"
+        with zipfile.ZipFile(zip_path, "w") as zf:
+            zf.write(subdir / "file1.txt", "data/file1.txt")
+            zf.write(subdir / "file2.txt", "data/file2.txt")
+            zf.write(other / "file3.txt", "other/file3.txt")
+
+        # Verify only the data subpath
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package(
+            "arrangement/0", str(zip_path), subpath="data"
+        )
+
+        # Should verify only files in data/ subdirectory
+        # When checking with subpath, only files starting with subpath are checked
+        # The 'extra' list should contain files NOT checked that are in arrangement
+        assert is_valid is False
+        assert len(extra) == 3
+        assert "other/file3.txt" in extra
+
+    def test_verify_invalid_arrangement_id(self, temp_workspace, tmp_path, gpg_setup):
+        """Test that verifying with invalid arrangement ID raises error."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Try to verify with non-existent arrangement
+
+    def test_verify_multiple_issues(self, temp_workspace, tmp_path, gpg_setup):
+        """Test verifying a package with multiple types of issues."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Original", ignore_dirs=[])
+
+        # Make multiple changes
+        (temp_workspace / "notes.txt").write_text("Modified\n")  # Modified
+        (temp_workspace / "config.json").unlink()  # Removed (will be in extra)
+        (temp_workspace / "new_file.txt").write_text(
+            "New\n"
+        )  # Added (will be in missing)
+
+        # Verify
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(temp_workspace))
+
+        # Should detect all issues
+        assert is_valid is False
+        assert len(missing) == 1  # new_file.txt
+        assert "new_file.txt" in missing
+        assert (
+            len(mismatched) == 2
+        )  # notes.txt (modified) + new_file.txt (not in arrangement)
+        # Find which is which
+        mismatched_files = {m[0]: m for m in mismatched}
+        assert "notes.txt" in mismatched_files
+        assert "new_file.txt" in mismatched_files
+        assert mismatched_files["new_file.txt"][1] is None  # No expected hash
+        assert len(extra) == 1  # config.json
+        assert "config.json" in extra
+
+    def test_verify_nested_directory_structure(self, tmp_path, gpg_setup):
+        """Test verifying a package with nested directory structure."""
+        # Create nested structure
+        workspace = tmp_path / "workspace"
+        workspace.mkdir()
+
+        (workspace / "root.txt").write_text("Root file\n")
+
+        level1 = workspace / "level1"
+        level1.mkdir()
+        (level1 / "file1.txt").write_text("Level 1\n")
+
+        level2 = level1 / "level2"
+        level2.mkdir()
+        (level2 / "file2.txt").write_text("Level 2\n")
+
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(workspace), comment="Nested structure", ignore_dirs=[])
+
+        # Verify
+        (
+            missing,
+            mismatched,
+            extra,
+            is_valid,
+        ) = tro.verify_replication_package("arrangement/0", str(workspace))
+
+        # Should be valid
+        assert is_valid is True
+        assert len(missing) == 0
+        assert len(mismatched) == 0
+        assert len(extra) == 0
+
+    def test_get_arrangement_path_hash_map(self, temp_workspace, tmp_path, gpg_setup):
+        """Test getting the path-to-hash mapping for an arrangement."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Add arrangement
+        tro.add_arrangement(str(temp_workspace), comment="Test", ignore_dirs=[])
+
+        # Get the mapping
+        path_hash_map = tro.get_arrangement_path_hash_map("arrangement/0")
+
+        # Verify mapping contains all files
+        assert len(path_hash_map) == 3
+        assert "input_data.csv" in path_hash_map
+        assert "notes.txt" in path_hash_map
+        assert "config.json" in path_hash_map
+
+        # Verify all values are valid SHA256 hashes
+        for path, hash_value in path_hash_map.items():
+            assert len(hash_value) == 64
+            assert all(c in "0123456789abcdef" for c in hash_value)
+
+    def test_get_arrangement_path_hash_map_invalid_id(self, tmp_path, gpg_setup):
+        """Test that getting map for invalid arrangement ID raises error."""
+        tro = create_tro_with_gpg(
+            filepath=str(tmp_path / "test_tro.jsonld"), gpg_setup=gpg_setup
+        )
+
+        # Try to get mapping for non-existent arrangement
+        with pytest.raises(ValueError, match="not found"):
+            tro.get_arrangement_path_hash_map("arrangement/99")

From b054f46bc03fb82cd7ef77e0e329b790deb1405d Mon Sep 17 00:00:00 2001
From: "Kacper Kowalik (Xarthisius)" <xarthisius.kk@gmail.com>
Date: Thu, 29 Jan 2026 09:28:04 -0600
Subject: [PATCH 3/6] More tests

---
 tests/test_cli.py | 445 ++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 445 insertions(+)
 create mode 100644 tests/test_cli.py

diff --git a/tests/test_cli.py b/tests/test_cli.py
new file mode 100644
index 0000000..595ce63
--- /dev/null
+++ b/tests/test_cli.py
@@ -0,0 +1,445 @@
+"""Tests for tro_utils CLI module.
+
+Note: These tests focus on CLI command structure and basic functionality.
+GPG-based signing/verification tests are excluded due to GPG key_map complexity.
+"""
+import json
+from unittest.mock import MagicMock
+
+import pytest
+from click.testing import CliRunner
+from click.exceptions import BadParameter
+
+from tro_utils.cli import cli, StringOrPath
+
+
+@pytest.fixture
+def runner():
+    """Create a CLI test runner."""
+    return CliRunner()
+
+
+@pytest.fixture
+def temp_workspace(tmp_path):
+    """Create a temporary workspace with sample files."""
+    workspace = tmp_path / "workspace"
+    workspace.mkdir()
+    (workspace / "data.csv").write_text("id,value\n1,100\n2,200\n")
+    (workspace / "readme.txt").write_text("This is a readme file\n")
+    (workspace / "config.json").write_text('{"key": "value"}')
+    return workspace
+
+
+@pytest.fixture(scope="session")
+def trs_profile(tmp_path_factory):
+    """Create a TRS profile file."""
+    profile_dir = tmp_path_factory.mktemp("profiles")
+    profile_file = profile_dir / "trs.jsonld"
+    profile_data = {
+        "rdfs:comment": "Test TRS for CLI testing",
+        "trov:hasCapability": [
+            {"@id": "trs/capability/1", "@type": "trov:CanRecordInternetAccess"},
+            {"@id": "trs/capability/2", "@type": "trov:CanProvideInternetIsolation"},
+        ],
+    }
+    profile_file.write_text(json.dumps(profile_data, indent=2))
+    return str(profile_file)
+
+
+class TestStringOrPath:
+    """Test the StringOrPath custom parameter type."""
+
+    def test_valid_string(self):
+        """Test that valid string options are accepted."""
+        param_type = StringOrPath(templates={"default": {}, "custom": {}})
+        result = param_type.convert("default", None, None)
+        assert result == "default"
+
+    def test_valid_file_path(self, tmp_path):
+        """Test that valid file paths are accepted."""
+        test_file = tmp_path / "test.txt"
+        test_file.write_text("content")
+        param_type = StringOrPath(templates={"default": {}})
+        result = param_type.convert(str(test_file), None, None)
+        assert result == str(test_file)
+
+    def test_invalid_option(self):
+        """Test that invalid options raise an error."""
+        param_type = StringOrPath(templates={"default": {}})
+        with pytest.raises(BadParameter):
+            param_type.convert("invalid", None, MagicMock())
+
+
+class TestCLIGroup:
+    """Test main CLI group and global options."""
+
+    def test_cli_help(self, runner):
+        """Test that CLI help displays correctly."""
+        result = runner.invoke(cli, ["--help"])
+        assert result.exit_code == 0
+        assert "declaration" in result.output.lower()
+
+    def test_cli_with_no_args(self, runner):
+        """Test CLI with no arguments shows help."""
+        result = runner.invoke(cli)
+        assert "Usage:" in result.output or result.exit_code == 0
+
+
+class TestArrangementCommands:
+    """Test arrangement-related CLI commands."""
+
+    def test_arrangement_add(self, runner, tmp_path, temp_workspace, trs_profile):
+        """Test adding an arrangement via CLI."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        result = runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                "--comment",
+                "Initial",
+                str(temp_workspace),
+            ],
+        )
+        assert result.exit_code == 0
+        assert tro_file.exists()
+        with open(tro_file) as f:
+            data = json.load(f)
+            assert len(data["@graph"][0]["trov:hasArrangement"]) == 1
+
+    def test_arrangement_add_with_ignore_dirs(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test adding an arrangement with ignored directories."""
+        (temp_workspace / ".git").mkdir()
+        (temp_workspace / ".git" / "config").write_text("git config")
+        tro_file = tmp_path / "test_tro.jsonld"
+        result = runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                "--ignore_dir",
+                ".git",
+                str(temp_workspace),
+            ],
+        )
+        assert result.exit_code == 0
+        with open(tro_file) as f:
+            data = json.load(f)
+            locations = [
+                loc["trov:hasLocation"]
+                for loc in data["@graph"][0]["trov:hasArrangement"][0]["trov:hasLocus"]
+            ]
+            assert not any(".git" in loc for loc in locations)
+
+    def test_arrangement_list(self, runner, tmp_path, temp_workspace, trs_profile):
+        """Test listing arrangements via CLI."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                "--comment",
+                "Test",
+                str(temp_workspace),
+            ],
+        )
+        result = runner.invoke(
+            cli, ["--declaration", str(tro_file), "arrangement", "list"]
+        )
+        assert result.exit_code == 0
+        assert "arrangement/0" in result.output
+
+    def test_arrangement_list_verbose(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test listing arrangements with verbose flag."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        result = runner.invoke(
+            cli, ["--declaration", str(tro_file), "arrangement", "list", "-v"]
+        )
+        assert result.exit_code == 0
+        assert "Composition:" in result.output
+
+
+class TestCompositionCommands:
+    """Test composition-related CLI commands."""
+
+    def test_composition_info(self, runner, tmp_path, temp_workspace, trs_profile):
+        """Test getting composition info via CLI."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        result = runner.invoke(
+            cli, ["--declaration", str(tro_file), "composition", "info"]
+        )
+        assert result.exit_code == 0
+        assert "composition/1/artifact/" in result.output
+
+    def test_composition_info_verbose(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test composition info with verbose flag."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        result = runner.invoke(
+            cli, ["--declaration", str(tro_file), "composition", "info", "-v"]
+        )
+        assert result.exit_code == 0
+        assert "Arrangements:" in result.output
+
+
+class TestVerifyCommands:
+    """Test verification-related CLI commands."""
+
+    def test_verify_package_success(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test successful package verification."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        result = runner.invoke(
+            cli, ["verify-package", str(tro_file), str(temp_workspace)]
+        )
+        assert result.exit_code == 0
+        assert "✓" in result.output
+
+    def test_verify_package_with_arrangement_id(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test package verification with specific arrangement ID."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        result = runner.invoke(
+            cli,
+            [
+                "verify-package",
+                str(tro_file),
+                str(temp_workspace),
+                "--arrangement-id",
+                "arrangement/0",
+            ],
+        )
+        assert result.exit_code == 0
+        assert "arrangement/0" in result.output
+
+    def test_verify_package_failure(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test package verification failure."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        (temp_workspace / "data.csv").write_text("modified")
+        result = runner.invoke(
+            cli, ["verify-package", str(tro_file), str(temp_workspace)]
+        )
+        assert result.exit_code == 0
+        assert "✗" in result.output
+
+
+class TestReportCommand:
+    """Test report generation CLI command."""
+
+    def test_generate_report_with_template(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test generating a report with a custom template."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        template_file = tmp_path / "template.jinja2"
+        template_file.write_text("TRO: {{ tro['schema:name'] }}")
+        report_file = tmp_path / "report.html"
+        result = runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "report",
+                "--template",
+                str(template_file),
+                "--output",
+                str(report_file),
+            ],
+        )
+        assert result.exit_code == 0
+        assert report_file.exists()
+
+    def test_generate_report_with_default_template(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test generating a report with the default template."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        report_file = tmp_path / "report.html"
+        result = runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "report",
+                "--template",
+                "default",
+                "--output",
+                str(report_file),
+            ],
+        )
+        assert result.exit_code == 0
+        assert report_file.exists()
+
+
+class TestErrorHandling:
+    """Test error handling in CLI commands."""
+
+    def test_missing_declaration_file(self, runner):
+        """Test error when declaration file doesn't exist."""
+        result = runner.invoke(cli, ["verify-timestamp", "/nonexistent/file.jsonld"])
+        assert result.exit_code == 2
+
+    def test_missing_directory_for_arrangement(self, runner, tmp_path, trs_profile):
+        """Test error when directory doesn't exist."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        result = runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                "/nonexistent/directory",
+            ],
+        )
+        assert result.exit_code != 0
+
+    def test_invalid_template(self, runner, tmp_path, temp_workspace, trs_profile):
+        """Test error with invalid template option."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        report_file = tmp_path / "report.html"
+        result = runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "report",
+                "--template",
+                "nonexistent",
+                "--output",
+                str(report_file),
+            ],
+        )
+        assert result.exit_code != 0

From b6d55a0337ad04ec19765c81cfde1114705ea45a Mon Sep 17 00:00:00 2001
From: "Kacper Kowalik (Xarthisius)" <xarthisius.kk@gmail.com>
Date: Thu, 29 Jan 2026 09:30:18 -0600
Subject: [PATCH 4/6] Bump version

---
 pyproject.toml | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/pyproject.toml b/pyproject.toml
index 74efb4a..85b359d 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -13,7 +13,7 @@ maintainers = [
 ]
 description = "Utilities for creating, editing and interacting with TROs"
 readme = "README.rst"
-version = "0.1.2"
+version = "0.1.3"
 dependencies = [
   "Click>=7.0",
   "jinja2",

From 0fc68e469c1c2efba2b47a3c26064cf50fa7934b Mon Sep 17 00:00:00 2001
From: "Kacper Kowalik (Xarthisius)" <xarthisius.kk@gmail.com>
Date: Thu, 29 Jan 2026 09:49:48 -0600
Subject: [PATCH 5/6] Drop unused method, add test for --verbose

---
 tests/test_cli.py      | 34 ++++++++++++++++++++++++++++++++++
 tro_utils/tro_utils.py | 12 ------------
 2 files changed, 34 insertions(+), 12 deletions(-)

diff --git a/tests/test_cli.py b/tests/test_cli.py
index 595ce63..b3d2821 100644
--- a/tests/test_cli.py
+++ b/tests/test_cli.py
@@ -316,6 +316,40 @@ def test_verify_package_failure(
         assert result.exit_code == 0
         assert "✗" in result.output
 
+    def test_verify_package_verbose(
+        self, runner, tmp_path, temp_workspace, trs_profile
+    ):
+        """Test package verification with verbose output showing details."""
+        tro_file = tmp_path / "test_tro.jsonld"
+        runner.invoke(
+            cli,
+            [
+                "--declaration",
+                str(tro_file),
+                "--profile",
+                trs_profile,
+                "arrangement",
+                "add",
+                str(temp_workspace),
+            ],
+        )
+        # Modify a file and add a new one to trigger verbose output
+        (temp_workspace / "data.csv").write_text("modified content")
+        (temp_workspace / "extra.txt").write_text("extra file")
+        result = runner.invoke(
+            cli,
+            [
+                "verify-package",
+                str(tro_file),
+                str(temp_workspace),
+                "--verbose",
+            ],
+        )
+        assert result.exit_code == 0
+        # Verify verbose output includes file details
+        # The Rich library output includes file names when there are mismatches
+        assert "data.csv" in result.output or "extra.txt" in result.output
+
 
 class TestReportCommand:
     """Test report generation CLI command."""
diff --git a/tro_utils/tro_utils.py b/tro_utils/tro_utils.py
index 5794f6c..a756b43 100644
--- a/tro_utils/tro_utils.py
+++ b/tro_utils/tro_utils.py
@@ -281,18 +281,6 @@ def sha256_for_file(filepath, resolve_symlinks=True):
                 sha256.update(chunk)
         return sha256.hexdigest()
 
-    @staticmethod
-    def sha256_for_zipfile(zipfilepath):
-        hashes = {}
-        with zipfile.ZipFile(zipfilepath, "r") as zf:
-            for fileinfo in zf.infolist():
-                sha256 = hashlib.sha256()
-                with zf.open(fileinfo.filename) as f:
-                    for chunk in iter(lambda: f.read(4096), b""):
-                        sha256.update(chunk)
-                hashes[fileinfo.filename] = sha256.hexdigest()
-        return hashes
-
     def sha256_for_directory(self, directory, ignore_dirs=None, resolve_symlinks=True):
         if ignore_dirs is None:
             ignore_dirs = [".git"]  # Default ignore list

From c427ab63c1ad2d069ba6bd1ac84e0531811f64b7 Mon Sep 17 00:00:00 2001
From: "Kacper Kowalik (Xarthisius)" <xarthisius.kk@gmail.com>
Date: Thu, 29 Jan 2026 09:53:06 -0600
Subject: [PATCH 6/6] Type fixes

---
 tro_utils/cli.py       |  2 ++
 tro_utils/tro_utils.py | 12 +++++++++---
 2 files changed, 11 insertions(+), 3 deletions(-)

diff --git a/tro_utils/cli.py b/tro_utils/cli.py
index 250a3fb..e71d893 100644
--- a/tro_utils/cli.py
+++ b/tro_utils/cli.py
@@ -25,6 +25,8 @@ class StringOrPath(click.ParamType):
     name = "string_or_path"
 
     def __init__(self, templates=None):
+        if templates is None:
+            templates = {}
         self.valid_strings = templates.keys()
 
     def convert(self, value, param, ctx):
diff --git a/tro_utils/tro_utils.py b/tro_utils/tro_utils.py
index a756b43..184d895 100644
--- a/tro_utils/tro_utils.py
+++ b/tro_utils/tro_utils.py
@@ -43,7 +43,7 @@ def __init__(
             self.dirname = "."
         else:
             self.basename = os.path.basename(filepath).rsplit(".")[0]
-            self.dirname = os.path.dirname(filepath)
+            self.dirname = os.path.dirname(filepath) or "."
 
         if profile is not None and os.path.exists(profile):
             print(f"Loading profile from {profile}")
@@ -108,6 +108,8 @@ def __init__(
 
     @property
     def base_filename(self):
+        if not self.basename:
+            raise ValueError("basename is not set")
         return os.path.abspath(os.path.join(self.dirname, self.basename))
 
     @property
@@ -448,6 +450,11 @@ def add_performance(
         caps=None,
         extra_attributes=None,
     ):
+        if caps is None:
+            caps = []
+        if extra_attributes is None:
+            extra_attributes = {}
+
         trp = {
             "@id": f"trp/{len(self.data['@graph'][0]['trov:hasPerformance'])}",
             "@type": "trov:TrustedResearchPerformance",
@@ -457,8 +464,7 @@ def add_performance(
             "trov:startedAtTime": start_time.isoformat(),
             "trov:endedAtTime": end_time.isoformat(),
         }
-        if extra_attributes and isinstance(extra_attributes, dict):
-            trp.update(extra_attributes)
+        trp.update(extra_attributes)
 
         available_arrangements = [
             _["@id"] for _ in self.data["@graph"][0]["trov:hasArrangement"]