From d7298d0e0e50aedc3cb4aea64a56bc985e71935a Mon Sep 17 00:00:00 2001
From: Ryan Harper <rharper@woxford.com>
Date: Sat, 13 Dec 2025 17:52:35 -0600
Subject: [PATCH 1/6] fix: bump build and ci go-version checks for publishing

Drop the go-version check in build and coverage when uploading
binaries.  We're only building with one version of go now.

Signed-off-by: Ryan Harper <rharper@woxford.com>
---
 .github/workflows/build.yaml    | 2 +-
 .github/workflows/coverage.yaml | 2 +-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml
index d8a3af90..e0321e9d 100644
--- a/.github/workflows/build.yaml
+++ b/.github/workflows/build.yaml
@@ -113,7 +113,7 @@ jobs:
           make publish-stacker-bin
       - name: Upload artifacts
         uses: actions/upload-artifact@v4
-        if: ${{ (matrix.privilege-level == 'priv') && (matrix.go-version == '1.23.x') }}
+        if: ${{ (matrix.privilege-level == 'priv')}}
         with:
           # if there is more than 1 go-version, we would need to account for that here.
           name: stacker-${{ matrix.platform }}
diff --git a/.github/workflows/coverage.yaml b/.github/workflows/coverage.yaml
index ac6a6ac7..257ae3c1 100644
--- a/.github/workflows/coverage.yaml
+++ b/.github/workflows/coverage.yaml
@@ -104,7 +104,7 @@ jobs:
           files: coverage-${{ matrix.privilege-level}}.txt
       - name: Upload artifacts
         uses: actions/upload-artifact@v4
-        if: ${{ (matrix.privilege-level == 'priv') && (matrix.go-version == '1.23.x') }}
+        if: ${{ (matrix.privilege-level == 'priv')}}
         with:
           # if there is more than 1 go-version, we would need to account for that here.
           name: binary-cov

From a2f34e2715211af31121b1a0c32e6038c9f88e40 Mon Sep 17 00:00:00 2001
From: Ryan Harper <rharper@woxford.com>
Date: Mon, 15 Dec 2025 09:58:33 -0600
Subject: [PATCH 2/6] test: format python test harness file with black

Apply black python formatting to harness

Signed-off-by: Ryan Harper <rharper@woxford.com>
---
 test/main.py | 17 ++++++++++++++---
 1 file changed, 14 insertions(+), 3 deletions(-)

diff --git a/test/main.py b/test/main.py
index 52c4a7d8..41e7b411 100755
--- a/test/main.py
+++ b/test/main.py
@@ -1,4 +1,7 @@
 #!/usr/bin/python3
+"""
+test harness for stacker
+"""
 
 import argparse
 import glob
@@ -7,7 +10,7 @@
 import subprocess
 import sys
 
-priv_levels=("priv", "unpriv")
+priv_levels = ("priv", "unpriv")
 
 parser = argparse.ArgumentParser()
 parser.add_argument("--privilege-level", choices=priv_levels)
@@ -16,13 +19,21 @@
 
 options = parser.parse_args()
 
-priv_to_test=priv_levels
+priv_to_test = priv_levels
 
 if options.privilege_level is not None:
     priv_to_test = [options.privilege_level]
 
 for priv in priv_to_test:
-    cmd = ["bats", "--setup-suite-file", "./test/setup_suite.bash", "--jobs", str(options.jobs), "--tap", "--timing"]
+    cmd = [
+        "bats",
+        "--setup-suite-file",
+        "./test/setup_suite.bash",
+        "--jobs",
+        str(options.jobs),
+        "--tap",
+        "--timing",
+    ]
     cmd.extend(options.tests)
 
     env = os.environ.copy()

From 26c06f95699d8cc04375e6ee1fccbbdfe7915b03 Mon Sep 17 00:00:00 2001
From: Ryan Harper <rharper@woxford.com>
Date: Mon, 15 Dec 2025 10:08:17 -0600
Subject: [PATCH 3/6] test: add env check to test harness

Verify that we have the required env variables before starting
the harness.  This is primarily for offline testing but still
useful in the github workflows

Signed-off-by: Ryan Harper <rharper@woxford.com>
---
 test/main.py | 22 ++++++++++++++++++++++
 1 file changed, 22 insertions(+)

diff --git a/test/main.py b/test/main.py
index 41e7b411..5f4c9fd5 100755
--- a/test/main.py
+++ b/test/main.py
@@ -10,6 +10,23 @@
 import subprocess
 import sys
 
+
+def check_env(env_to_check):
+    """
+    check for required env variables
+    """
+    required_vars = ["ZOT_HOST", "ZOT_PORT", "REGISTRY_URL"]
+    errors = []
+    for req_var in required_vars:
+        if req_var not in env_to_check:
+            errors.append(f"missing env variable '{req_var}'")
+        if not env_to_check.get(req_var):
+            errors.append(f"env variable '{req_var}' is empyty")
+
+    if len(errors) > 0:
+        raise RuntimeError(f"EnvCheckFailures: {errors}")
+
+
 priv_levels = ("priv", "unpriv")
 
 parser = argparse.ArgumentParser()
@@ -38,6 +55,11 @@
 
     env = os.environ.copy()
     env["PRIVILEGE_LEVEL"] = priv
+    try:
+        check_env
+    except RuntimeError as err:
+        print(f"Failed environment variable check: {err}")
+        sys.exit(1)
 
     print("running tests in modes:", priv)
     try:

From 0b1f1072e8954c8fa445bb137eb95c968a5a625c Mon Sep 17 00:00:00 2001
From: Ryan Harper <rharper@woxford.com>
Date: Mon, 15 Dec 2025 10:14:28 -0600
Subject: [PATCH 4/6] test: increase verbosity on tests until we sort out why
 some tests fail during priv run

Signed-off-by: Ryan Harper <rharper@woxford.com>
---
 test/main.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/test/main.py b/test/main.py
index 5f4c9fd5..cf8e27e1 100755
--- a/test/main.py
+++ b/test/main.py
@@ -50,6 +50,7 @@ def check_env(env_to_check):
         str(options.jobs),
         "--tap",
         "--timing",
+        "--verbose-run",
     ]
     cmd.extend(options.tests)
 

From eb8e975f9e4db9bd48d7cdd331f8a83f2f50adf8 Mon Sep 17 00:00:00 2001
From: Ryan Harper <rharper@woxford.com>
Date: Mon, 15 Dec 2025 16:29:56 -0600
Subject: [PATCH 5/6] test: fixes for local and github building

- Format test/main.py with black python formatter
- Add skip_broken_tests and add this to bom test
  - Currently the bom test isn't working so we'll skip until we
    update the test for the current Centos image.  Once that's
    done we will change the test to fetch the Centos image via
    sha256 and/or mirror it into the ghcr.io/project-stacker OCI
    registry
- Add some debug around zot config starting
- Add checks to ensure exported variables that are required for the
  test harness to run are present in the env before running the tests
- Check and dump env before starting bats suite
- Add zot_teardown calls to ensure that we've properly terminated zot
  before attempting to start another one.  The github runs saw errors
  which looked like something already using port 8080 which is likely
  a race with a zot being killed.  Be more explicit and wait for it
  to go away.  Make use of pid file for simpler stopping
- Update/Add REGISTRY_SERVICE value to specify what registry OCI image
  we're using and export this into the build environment
- Add support for copying and running REGISTRY_SERVICE when running
  outside of github.
- Add start/stop_registry as convert tests uses registry to publish stuff
- Update publish.bats test to check if REGISTRY_SERVICE is running and
  if not startup up the service.  This handles the offline case where
  registry is not provided by the build environment.  For github where
  service is running, it will skip the start/stop

Signed-off-by: Ryan Harper <rharper@woxford.com>
---
 .github/workflows/build.yaml    |  12 ++-
 .github/workflows/coverage.yaml |  11 ++-
 test/bom.bats                   |   1 +
 test/convert.bats               |   8 ++
 test/helpers.bash               | 126 +++++++++++++++++++++++++++++---
 test/main.py                    |   2 +-
 test/publish.bats               |   8 ++
 7 files changed, 153 insertions(+), 15 deletions(-)

diff --git a/.github/workflows/build.yaml b/.github/workflows/build.yaml
index e0321e9d..f859e933 100644
--- a/.github/workflows/build.yaml
+++ b/.github/workflows/build.yaml
@@ -26,6 +26,12 @@ on:
         type: boolean
         description: 'Should slow tests be run?'
         default: true
+      registry-service:
+        required: false
+        type: string
+        description: 'registry service OCI image URI'
+        default: "ghcr.io/project-stacker/registry:2"
+
     secrets:
       codecov_token:
         required: true
@@ -34,7 +40,7 @@ jobs:
   build:
     services:
       registry:
-        image: ghcr.io/project-stacker/registry:2
+        image: ${{ inputs.registry-service }}
         ports:
           - 5000:5000
     strategy:
@@ -88,6 +94,7 @@ jobs:
         run: |
           make stacker VERSION_FULL=${{ inputs.build-id }}
         env:
+          REGISTRY_SERVICE: ${{ inputs.registry-service }}
           REGISTRY_URL: localhost:5000
           ZOT_HOST: localhost
           ZOT_PORT: 8080
@@ -98,6 +105,7 @@ jobs:
         run: |
           make check VERSION_FULL=${{ inputs.build-id }} PRIVILEGE_LEVEL=${{ matrix.privilege-level }}
         env:
+          REGISTRY_SERVICE: ${{ inputs.registry-service }}
           REGISTRY_URL: localhost:5000
           ZOT_HOST: localhost
           ZOT_PORT: 8080
@@ -113,7 +121,7 @@ jobs:
           make publish-stacker-bin
       - name: Upload artifacts
         uses: actions/upload-artifact@v4
-        if: ${{ (matrix.privilege-level == 'priv')}}
+        if: ${{ (matrix.privilege-level == 'priv') }}
         with:
           # if there is more than 1 go-version, we would need to account for that here.
           name: stacker-${{ matrix.platform }}
diff --git a/.github/workflows/coverage.yaml b/.github/workflows/coverage.yaml
index 257ae3c1..48ac5daf 100644
--- a/.github/workflows/coverage.yaml
+++ b/.github/workflows/coverage.yaml
@@ -26,6 +26,12 @@ on:
         type: boolean
         description: 'Should slow tests be run?'
         default: true
+      registry-service:
+        required: false
+        type: string
+        description: 'registry service OCI image URI'
+        default: "ghcr.io/project-stacker/registry:2"
+
     secrets:
       codecov_token:
         required: true
@@ -35,7 +41,7 @@ jobs:
     runs-on: ubuntu-24.04
     services:
       registry:
-        image: ghcr.io/project-stacker/registry:2
+        image: ${{ inputs.registry-service }}
         ports:
           - 5000:5000
     strategy:
@@ -91,6 +97,7 @@ jobs:
           go tool covdata percent -i $GOCOVERDIR
           ls -altR $GOCOVERDIR
         env:
+          REGISTRY_SERVICE: ${{ inputs.registry-service }}
           REGISTRY_URL: localhost:5000
           ZOT_HOST: localhost
           ZOT_PORT: 8080
@@ -104,7 +111,7 @@ jobs:
           files: coverage-${{ matrix.privilege-level}}.txt
       - name: Upload artifacts
         uses: actions/upload-artifact@v4
-        if: ${{ (matrix.privilege-level == 'priv')}}
+        if: ${{ (matrix.privilege-level == 'priv') }}
         with:
           # if there is more than 1 go-version, we would need to account for that here.
           name: binary-cov
diff --git a/test/bom.bats b/test/bom.bats
index ed4d065e..ea60cf93 100644
--- a/test/bom.bats
+++ b/test/bom.bats
@@ -22,6 +22,7 @@ function teardown() {
 
 @test "all container contents must be accounted for" {
   skip_slow_test
+  skip_broken_tests
   cat > stacker.yaml <<"EOF"
 bom-parent:
     from:
diff --git a/test/convert.bats b/test/convert.bats
index 18fbe8d8..f173b8a6 100644
--- a/test/convert.bats
+++ b/test/convert.bats
@@ -1,5 +1,13 @@
 load helpers
 
+function setup_file() {
+    start_registry
+}
+
+function teardown_file() {
+    stop_registry
+}
+
 function setup() {
     stacker_setup
 }
diff --git a/test/helpers.bash b/test/helpers.bash
index d74d53c9..5e08be87 100644
--- a/test/helpers.bash
+++ b/test/helpers.bash
@@ -135,6 +135,16 @@ function skip_slow_test {
     esac
 }
 
+function skip_broken_tests {
+    case "${BROKEN_TESTS:-false}" in
+        true) return;;
+        false) skip "${BATS_TEST_NAME} is broken. Set BROKEN_TESTS=true to run.";;
+        *) stderr "BROKEN_TESTS variable must be 'true' or 'false'" \
+            "found '${BROKEN_TESTS}'"
+           return 1;;
+    esac
+}
+
 function tmpd() {
     mktemp -d "${PWD}/stackertest${1:+-$1}.XXXXXX"
 }
@@ -221,10 +231,15 @@ EOF
 }
 
 function write_auth_zot_config {
+  if ! check_env_zot; then
+    echo "ERROR: invalid zot env values"
+    return 1
+  fi
 
   htpasswd -Bbn iam careful >> $TEST_TMPDIR/htpasswd
 
-  cat > $TEST_TMPDIR/zot-config.json << EOF
+  zotcfg=$TEST_TMPDIR/zot-config.json
+  cat > "$zotcfg" << EOF
 {
   "distSpecVersion": "1.1.0-dev",
   "storage": {
@@ -262,15 +277,18 @@ function write_auth_zot_config {
   }
 }
 EOF
-
+    echo "zot config:"
+    cat "$zotcfg"
 }
 
 function zot_setup {
+    zot_teardown
     write_plain_zot_config
     start_zot
 }
 
 function zot_setup_auth {
+    zot_teardown
     write_auth_zot_config
     start_zot USE_TLS
 }
@@ -279,12 +297,18 @@ function start_zot {
   ZOT_USE_TLS=$1
   echo "# starting zot at $ZOT_HOST:$ZOT_PORT" >&3
   # start as a background task
-  zot verify $TEST_TMPDIR/zot-config.json
-  zot serve $TEST_TMPDIR/zot-config.json &
+  zotcfg="$TEST_TMPDIR/zot-config.json"
+  if ! zot verify "$zotcfg"; then
+      echo "zot failed to verify zot config:"
+      cat "$zotcfg"
+      return 1
+  fi
+  zot serve "$TEST_TMPDIR/zot-config.json" &
   pid=$!
+  echo "$pid" > "${TEST_TMPDIR}/zot.pid"
 
   echo "zot is running at pid $pid"
-  cat $TEST_TMPDIR/zot.log
+  cat "$TEST_TMPDIR/zot.log"
   # wait until service is up
   count=5
   up=0
@@ -295,6 +319,14 @@ function start_zot {
       exit 1
     fi
     up=1
+    # check if correct port is open
+    if ! nc -v -z "${ZOT_HOST}" "${ZOT_PORT}"; then
+        echo "no response from host:${ZOT_HOST} port:${ZOT_PORT}" >&3
+        sleep 1
+        count=$((count - 1))
+        continue
+    fi
+    echo "Got response from host:${ZOT_HOST} on port:${ZOT_PORT}" >&3
     if [[ -n $ZOT_USE_TLS ]]; then
         echo "testing zot at https://$ZOT_HOST:$ZOT_PORT"
         curl -v --cacert $BATS_SUITE_TMPDIR/ca.crt  -u "iam:careful" -f https://$ZOT_HOST:$ZOT_PORT/v2/ || up=0
@@ -323,11 +355,14 @@ function start_zot {
 }
 
 function zot_teardown {
-  echo "# stopping zot" >&3
-  killall zot
-  killall -KILL zot || true
-  rm -f $TEST_TMPDIR/zot-config.json
-  rm -rf $TEST_TMPDIR/zot
+    zotpid="${TEST_TMPDIR}/zot.pid"
+    if [ -s "$zotpid" ]; then
+        echo "# stopping zot" >&3
+        pkill --pidfile "$zotpid"
+        echo "# stopped zot" >&3
+    fi
+    rm -f "$TEST_TMPDIR/zot-config.json"
+    rm -rf "$TEST_TMPDIR/zot"
 }
 
 function _skopeo() {
@@ -348,6 +383,77 @@ function _skopeo() {
     HOME="$home" skopeo "$@"
 }
 
+function start_registry() {
+    if [ -z "${REGISTRY_URL}" ]; then
+        echo "Missing REGISTRY_URL env value"
+        return 1
+    fi
+    if [ -z "${REGISTRY_SERVICE}" ]; then
+        echo "Missing REGISTRY_SERVICE env value"
+        return 1
+    fi
+    rhost=${REGISTRY_URL%:*}   # trim from right until colon, localhost
+    rport=${REGISTRY_URL#*:}   # trim from left until colon , 5000
+    if nc -v -z "${rhost}" "${rport}"; then
+        echo "# skipping start, registry service ${REGISTRY_SERVICE} already active for REGISTRY_URL=${REGISTRY_URL}" >&3
+        return 0
+    fi
+    echo "# no registry service ${REGISTRY_SERVICE} active for REGISTRY_URL=${REGISTRY_URL}" >&3
+    echo "# Starting registry service ${REGISTRY_SERVICE}" >&3
+
+
+    imgname=$(basename "${REGISTRY_SERVICE}")  # registry:tag
+    if ! _skopeo copy "docker://${REGISTRY_SERVICE}" "oci:${TEST_TMPDIR}/ocid:${imgname}"; then
+        echo "# skopeo copy of '${REGISTRY_SERVICE}' to local directory failed" >&3
+        return 1
+    fi
+
+    # unpack the image
+    unpackdir="${TEST_TMPDIR}/unpacked-reg"
+    if [ ! -d "${unpackdir}" ]; then
+        if ! umoci unpack --keep-dirlinks --image "${TEST_TMPDIR}/ocid:${imgname}" "${unpackdir}"; then
+            echo "failed to unpack registry service image ${imgname} to ${unpackdir}"
+            return 1
+        fi
+    else
+        echo "# reusing existing unpacked registry service OCI image" >&3
+    fi
+
+    # start up registry in the background
+    reglog="${TEST_TMPDIR}/registry.log"
+    chroot "${unpackdir}/rootfs" "/entrypoint.sh" "/etc/docker/registry/config.yml" "2>&1" "1>${reglog}" &
+    REGISTRY_PID=$!
+    echo "$REGISTRY_PID" > "${TEST_TMPDIR}/registry.pid"
+
+    regup=0
+    for ((x=1;x<=5;x++)); do
+        sleep "$x"
+        if ! nc -v -z "${rhost}" "${rport}"; then
+            echo "# local registry service not ready" >&3
+            sleep "$x"
+            continue
+        fi
+        regup=1
+        break
+    done
+
+    if [ "$regup" != "1" ]; then
+        echo "failed to bring up local registry service"
+    fi
+
+    echo "local registry service up on ${REGISTRY_URL} PID=$(cat "${TEST_TMPDIR}/registry.pid")"
+    return 0
+}
+
+function stop_registry() {
+    regpid="${TEST_TMPDIR}/registry.pid"
+    if [ -s "$regpid" ]; then
+        echo "# stopping local registry" >&3
+        pkill --pidfile "$regpid"
+        echo "# stopped local registry" >&3
+    fi
+}
+
 function dir_has_only() {
     local d="$1" oifs="$IFS" unexpected="" f=""
     shift
diff --git a/test/main.py b/test/main.py
index cf8e27e1..144f70db 100755
--- a/test/main.py
+++ b/test/main.py
@@ -15,7 +15,7 @@ def check_env(env_to_check):
     """
     check for required env variables
     """
-    required_vars = ["ZOT_HOST", "ZOT_PORT", "REGISTRY_URL"]
+    required_vars = ["ZOT_HOST", "ZOT_PORT", "REGISTRY_SERVICE", "REGISTRY_URL"]
     errors = []
     for req_var in required_vars:
         if req_var not in env_to_check:
diff --git a/test/publish.bats b/test/publish.bats
index b5b00d96..e6869991 100644
--- a/test/publish.bats
+++ b/test/publish.bats
@@ -1,5 +1,13 @@
 load helpers
 
+function setup_file() {
+    start_registry
+}
+
+function teardown_file() {
+    stop_registry
+}
+
 function setup() {
     stacker_setup
     mkdir -p ocibuilds/sub1

From c0d28e8d3292964889ba9ae17fe8e94b0411e08a Mon Sep 17 00:00:00 2001
From: Ryan Harper <rharper@woxford.com>
Date: Tue, 16 Dec 2025 13:18:56 -0600
Subject: [PATCH 6/6] fix: install-build-deps add software-properties-common
 for add-apt-repository

Signed-off-by: Ryan Harper <rharper@woxford.com>
---
 install-build-deps.sh | 4 ++++
 1 file changed, 4 insertions(+)

diff --git a/install-build-deps.sh b/install-build-deps.sh
index 954db821..9df26332 100755
--- a/install-build-deps.sh
+++ b/install-build-deps.sh
@@ -69,6 +69,10 @@ installdeps_ubuntu() {
         lxc-utils
     )
 
+    if ! command -v add-apt-repository; then
+        sudo apt-get -y install software-properties-common
+    fi
+
     case "$VERSION_ID" in
         22.04)
             sudo add-apt-repository -y ppa:project-machine/squashfuse