sigstore · knrc · Aug 2, 2025 · Aug 11, 2025 · Aug 18, 2025 · Aug 27, 2025
diff --git a/.github/workflows/test-e2e.yml b/.github/workflows/test-e2e.yml
@@ -48,4 +48,4 @@ jobs:
       - name: Running Test e2e
         run: |
           go mod tidy
-          make test-e2e
+          make test-e2e-ci
diff --git a/.gitignore b/.gitignore
@@ -15,3 +15,10 @@ cover.out
 manifests/*.yaml
 # Don't include generated bundles (will be built in CI/CD at some point)
 bundle/
+
+# Generated test keys
+testdata/docker/test_*.pub
+testdata/docker/test_*.priv
+
+# Generated model signature
+testdata/tensorflow_saved_model/model.sig
diff --git a/Makefile b/Makefile
@@ -31,6 +31,9 @@ BUNDLE_METADATA_OPTS ?= $(BUNDLE_CHANNELS) $(BUNDLE_DEFAULT_CHANNEL)
 # ghcr.io/sigstore/model-validation-operator-bundle:$VERSION and ghcr.io/sigstore/model-validation-operator-catalog:$VERSION.
 IMAGE_TAG_BASE ?= ghcr.io/sigstore/model-validation-operator
 
+# IMG defines the image:tag used for the operator.
+IMG ?= $(IMAGE_TAG_BASE):v$(VERSION)
+
 # BUNDLE_IMG defines the image:tag used for the bundle.
 # You can use it as an arg. (E.g make bundle-build BUNDLE_IMG=<some-registry>/<project-name-bundle>:<tag>)
 BUNDLE_IMG ?= $(IMAGE_TAG_BASE)-bundle:v$(VERSION)
@@ -52,8 +55,6 @@ endif
 # Set the Operator SDK version to use. By default, what is installed on the system is used.
 # This is useful for CI or a project to utilize a specific version of the operator-sdk toolkit.
 OPERATOR_SDK_VERSION ?= v1.41.1
-# Image URL to use all building/pushing image targets
-IMG ?= controller:latest
 
 # Get the currently used golang install path (in GOPATH/bin, unless GOBIN is set)
 ifeq (,$(shell go env GOBIN))
@@ -118,14 +119,6 @@ vet: ## Run go vet against code.
 test: manifests generate fmt vet setup-envtest ## Run tests.
 	KUBEBUILDER_ASSETS="$(shell $(ENVTEST) use $(ENVTEST_K8S_VERSION) --bin-dir $(LOCALBIN) -p path)" go test $$(go list ./... | grep -v /e2e) -coverprofile cover.out
 
-# TODO(user): To use a different vendor for e2e tests, modify the setup under 'tests/e2e'.
-# The default setup assumes Kind is pre-installed and builds/loads the Manager Docker image locally.
-# CertManager is installed by default; skip with:
-# - CERT_MANAGER_INSTALL_SKIP=true
-.PHONY: test-e2e
-test-e2e: manifests generate fmt vet ## Run the e2e tests. Expected an isolated environment using Kind.
-	go test ./test/e2e/ -v -ginkgo.v
-
 .PHONY: lint
 lint: golangci-lint ## Run golangci-lint linter
 	$(GOLANGCI_LINT) run
@@ -419,3 +412,158 @@ generate-manifests: manifests ## Generate manifests for all environments using g
 		echo "Generating manifests for $$env environment..."; \
 		./scripts/generate-manifests.sh $$env manifests; \
 	done
+
+##@ E2E Test Infrastructure
+
+# E2E Test Variables
+E2E_OPERATOR_NAMESPACE ?= model-validation-operator-system
+E2E_TEST_NAMESPACE ?= e2e-webhook-test-ns
+E2E_TEST_MODEL ?= model-validation-test-model:latest
+MODEL_TRANSPARENCY_IMG ?= ghcr.io/sigstore/model-transparency-cli:v1.0.1
+CERTMANAGER_VERSION ?= v1.18.2
+CERT_MANAGER_YAML ?= https://github.com/cert-manager/cert-manager/releases/download/$(CERTMANAGER_VERSION)/cert-manager.yaml
+KIND_CLUSTER ?= kind
+
+# Build and sign test model
+.PHONY: e2e-generate-test-keys
+e2e-generate-test-keys:
+	@echo "Generating ECDSA P-256 test keys for model signing..."
+	@if [ ! -f testdata/docker/test_private_key.priv ]; then \
+		echo "Generating private key..."; \
+		openssl ecparam -name prime256v1 -genkey -noout -out testdata/docker/test_private_key.priv; \
+	fi
+	@if [ ! -f testdata/docker/test_public_key.pub ]; then \
+		echo "Generating public key..."; \
+		openssl ec -in testdata/docker/test_private_key.priv -pubout -out testdata/docker/test_public_key.pub; \
+	fi
+	@if [ ! -f testdata/docker/test_invalid_private_key.priv ]; then \
+		echo "Generating invalid private key for failure tests..."; \
+		openssl ecparam -name prime256v1 -genkey -noout -out testdata/docker/test_invalid_private_key.priv; \
+	fi
+	@if [ ! -f testdata/docker/test_invalid_public_key.pub ]; then \
+		echo "Generating invalid public key for failure tests..."; \
+		openssl ec -in testdata/docker/test_invalid_private_key.priv -pubout -out testdata/docker/test_invalid_public_key.pub; \
+	fi
+
+.PHONY: e2e-sign-test-model
+e2e-sign-test-model: e2e-generate-test-keys
+	@echo "Signing test model with private key..."
+	@# Remove public key from model directory before signing to avoid including it in signature
+	@rm -f testdata/tensorflow_saved_model/test_public_key.pub
+	$(CONTAINER_TOOL) run --rm \
+		-v $(PWD)/testdata/tensorflow_saved_model:/model \
+		-v $(PWD)/testdata/docker/test_private_key.priv:/test_private_key.priv \
+		--entrypoint="" \
+		ghcr.io/sigstore/model-transparency-cli:v1.0.1 \
+		/usr/local/bin/model_signing sign key /model \
+		--private_key /test_private_key.priv \
+		--signature /model/model.sig
+
+.PHONY: e2e-build-test-model
+e2e-build-test-model: e2e-sign-test-model
+	@echo "Building test model image..."
+	cd testdata && $(CONTAINER_TOOL) build --no-cache -t $(E2E_TEST_MODEL) -f docker/test-model.Dockerfile .
+
+# install and uninstall cert-manager for tests
+
+.PHONY: e2e-install-certmanager
+e2e-install-certmanager:
+	@echo "Installing cert-manager..."
+	$(KUBECTL) apply -f $(CERT_MANAGER_YAML)
+	@echo "Waiting for cert-manager to be ready..."
+	$(KUBECTL) wait --for=condition=Available deployment -n cert-manager --all --timeout=120s
+
+.PHONY: e2e-uninstall-certmanager
+e2e-uninstall-certmanager: ## Uninstall cert-manager
+	@echo "Uninstalling cert-manager..."
+	-$(KUBECTL) delete -f $(CERT_MANAGER_YAML)
+
+# Load test images into the kind cluster
+
+.PHONY: e2e-build-image
+e2e-build-image:
+	$(CONTAINER_TOOL) build -t $(IMG) -f $(CONTAINER_FILE) .
+
+.PHONY: e2e-load-images
+e2e-load-images: e2e-build-image e2e-build-test-model
+	@echo "Pulling model-transparency-cli image..."
+	$(CONTAINER_TOOL) pull $(MODEL_TRANSPARENCY_IMG)
+	@echo "Loading manager image into Kind cluster..."
+	$(KIND) load docker-image -n $(KIND_CLUSTER) $(IMG)
+	@echo "Loading model-transparency-cli image into Kind cluster..."  
+	$(KIND) load docker-image -n $(KIND_CLUSTER) $(MODEL_TRANSPARENCY_IMG)
+	@echo "Loading test model image into Kind cluster..."
+	$(KIND) load docker-image -n $(KIND_CLUSTER) $(E2E_TEST_MODEL)
+
+# Setup test environment (namespaces, local models on kind cluster, operator)
+
+.PHONY: e2e-setup-namespaces
+e2e-setup-namespaces:
+	@echo "Creating operator namespace..."
+	$(KUBECTL) create ns $(E2E_OPERATOR_NAMESPACE) || true
+	@echo "Labeling operator namespace with restricted security policy..."
+	$(KUBECTL) label --overwrite ns $(E2E_OPERATOR_NAMESPACE) pod-security.kubernetes.io/enforce=restricted
+	@echo "Labeling operator namespace to be ignored by webhook..."
+	$(KUBECTL) label --overwrite ns $(E2E_OPERATOR_NAMESPACE) validation.ml.sigstore.dev/ignore=true
+	@echo "Creating test namespace..."
+	$(KUBECTL) create ns $(E2E_TEST_NAMESPACE) || true
+
+.PHONY: e2e-setup-model-data
+e2e-setup-model-data: e2e-load-images e2e-setup-namespaces
+	@echo "Cleaning up any existing model data DaemonSet..."
+	-$(KUBECTL) delete daemonset model-data-setup -n $(E2E_TEST_NAMESPACE) 2>/dev/null || true
+	@echo "Waiting for cleanup to complete..."
+	@sleep 5
+	@echo "Deploying model data setup DaemonSet..."
+	$(KUBECTL) apply -f test/e2e/testdata/model-data-daemonset.yaml
+	@echo "Waiting for model data to be available on all nodes..."
+	$(KUBECTL) rollout status daemonset/model-data-setup -n $(E2E_TEST_NAMESPACE) --timeout=120s
+
+.PHONY: e2e-deploy-operator
+e2e-deploy-operator: e2e-setup-namespaces deploy
+	@echo "E2E operator deployment complete"
+
+.PHONY: e2e-wait-operator
+e2e-wait-operator: ## Wait for operator pod to be ready
+	@echo "Waiting for controller pod to be ready..."
+	$(KUBECTL) wait --for=condition=Ready pod -l control-plane=controller-manager -n $(E2E_OPERATOR_NAMESPACE) --timeout=120s
+
+# test environment setup and teardown - certmanager, operator and test model for testing
+
+.PHONY: e2e-setup
+e2e-setup: e2e-install-certmanager e2e-setup-model-data e2e-deploy-operator e2e-wait-operator ## Complete e2e test setup
+	@echo "E2E test environment setup complete"
+
+.PHONY: e2e-cleanup-resources
+e2e-cleanup-resources: ## Clean up test resources before removing operator
+	@echo "Cleaning up test resources..."
+	-$(KUBECTL) delete pods --all -n $(E2E_TEST_NAMESPACE) --timeout=30s
+	-$(KUBECTL) delete modelvalidations --all -n $(E2E_TEST_NAMESPACE) --timeout=30s
+	-$(KUBECTL) delete daemonset model-data-setup -n $(E2E_TEST_NAMESPACE) --timeout=30s
+
+.PHONY: e2e-teardown
+e2e-teardown: e2e-cleanup-resources undeploy e2e-uninstall-certmanager
+	@echo "Tearing down e2e test environment..."
+	-$(KUBECTL) delete ns $(E2E_OPERATOR_NAMESPACE) --timeout=60s
+	-$(KUBECTL) delete ns $(E2E_TEST_NAMESPACE) --timeout=60s
+
+# run e2e tests
+
+.PHONY: test-e2e
+test-e2e: manifests generate fmt vet ## Run the e2e tests, no setup and teardown.  Expects the operator to be deployed.
+	@echo "Running e2e tests (assumes infrastructure is already set up)..."
+	go test ./test/e2e/ -v -ginkgo.v
+
+.PHONY: test-e2e-full
+test-e2e-full: manifests generate fmt vet e2e-setup ## Run e2e tests with setup and teardown
+	@echo "Running e2e tests with full infrastructure setup..."
+	go test ./test/e2e/ -v -ginkgo.v; \
+	TEST_RESULT=$$?; \
+	$(MAKE) e2e-teardown; \
+	exit $$TEST_RESULT
+
+.PHONY: test-e2e-ci
+test-e2e-ci: manifests generate fmt vet e2e-setup ## Run the e2e tests, with setup.  No teardown as the CI workflow will throw away kind
+	@echo "Running e2e tests with infrastructure setup for CI..."
+	go test ./test/e2e/ -v -ginkgo.v
+
diff --git a/api/v1alpha1/modelvalidation_types.go b/api/v1alpha1/modelvalidation_types.go
@@ -17,6 +17,9 @@ limitations under the License.
 package v1alpha1
 
 import (
+	"crypto/sha256"
+	"fmt"
+
 	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
 )
 
@@ -43,19 +46,32 @@ type PkiConfig struct {
 	CertificateAuthority string `json:"certificateAuthority,omitempty"`
 }
 
-// PrivateKeyConfig defines the private key verification configuration
-// for validating model signatures using a local private key
-type PrivateKeyConfig struct {
-	// Path to the private key.
+// PublicKeyConfig defines the public key verification configuration
+// for validating model signatures using a local public key
+type PublicKeyConfig struct {
+	// Path to the public key.
 	KeyPath string `json:"keyPath,omitempty"`
 }
 
+// ClientTrustConfig defines the configuration for client trust settings,
+// used when working with private rekor/fulcio instances.
+type ClientTrustConfig struct {
+	// TrustConfigPath is the path to the trust configuration file.
+	// This specifies the trust configuration needed for using private rekor/fulcio instances
+	// and should conform to the ClientTrustConfig message.
+	// +kubebuilder:validation:Required
+	TrustConfigPath string `json:"trustConfigPath,omitempty"`
+}
+
 // ValidationConfig defines the various methods available for validating model signatures.
 // At least one validation method must be specified.
 type ValidationConfig struct {
-	SigstoreConfig   *SigstoreConfig   `json:"sigstoreConfig,omitempty"`
-	PkiConfig        *PkiConfig        `json:"pkiConfig,omitempty"`
-	PrivateKeyConfig *PrivateKeyConfig `json:"privateKeyConfig,omitempty"`
+	SigstoreConfig  *SigstoreConfig  `json:"sigstoreConfig,omitempty"`
+	PkiConfig       *PkiConfig       `json:"pkiConfig,omitempty"`
+	PublicKeyConfig *PublicKeyConfig `json:"publicKeyConfig,omitempty"`
+	// +kubebuilder:validation:Optional
+	// ClientTrustConfig is the configuration for client trust settings.
+	ClientTrustConfig *ClientTrustConfig `json:"clientTrustConfig,omitempty"`
 }
 
 // ModelValidationSpec defines the desired state of ModelValidation
@@ -69,15 +85,54 @@ type ModelValidationSpec struct {
 	Config ValidationConfig `json:"config"`
 }
 
+// PodTrackingInfo contains information about a tracked pod
+type PodTrackingInfo struct {
+	// Name is the name of the pod
+	Name string `json:"name"`
+	// UID is the unique identifier of the pod
+	UID string `json:"uid"`
+	// InjectedAt is when the pod was injected
+	InjectedAt metav1.Time `json:"injectedAt"`
+}
+
 // ModelValidationStatus defines the observed state of ModelValidation
 type ModelValidationStatus struct {
 	// INSERT ADDITIONAL STATUS FIELD - define observed state of cluster
 	// Important: Run "make" to regenerate code after modifying this file
 	Conditions []metav1.Condition `json:"conditions,omitempty"`
+
+	// InjectedPodCount is the number of pods that have been injected with validation
+	InjectedPodCount int32 `json:"injectedPodCount"`
+
+	// UninjectedPodCount is the number of pods that have the label but were not injected
+	UninjectedPodCount int32 `json:"uninjectedPodCount"`
+
+	// OrphanedPodCount is the number of injected pods that reference this CR but are inconsistent
+	OrphanedPodCount int32 `json:"orphanedPodCount"`
+
+	// AuthMethod indicates which authentication method is being used
+	AuthMethod string `json:"authMethod,omitempty"`
+
+	// InjectedPods contains detailed information about injected pods
+	InjectedPods []PodTrackingInfo `json:"injectedPods,omitempty"`
+
+	// UninjectedPods contains detailed information about pods that should have been injected but weren't
+	UninjectedPods []PodTrackingInfo `json:"uninjectedPods,omitempty"`
+
+	// OrphanedPods contains detailed information about pods that are injected but inconsistent
+	OrphanedPods []PodTrackingInfo `json:"orphanedPods,omitempty"`
+
+	// LastUpdated is the timestamp of the last status update
+	LastUpdated metav1.Time `json:"lastUpdated,omitempty"`
 }
 
 // +kubebuilder:object:root=true
 // +kubebuilder:subresource:status
+// +kubebuilder:printcolumn:name="Auth Method",type=string,JSONPath=`.status.authMethod`
+// +kubebuilder:printcolumn:name="Injected Pods",type=integer,JSONPath=`.status.injectedPodCount`
+// +kubebuilder:printcolumn:name="Uninjected Pods",type=integer,JSONPath=`.status.uninjectedPodCount`
+// +kubebuilder:printcolumn:name="Orphaned Pods",type=integer,JSONPath=`.status.orphanedPodCount`
+// +kubebuilder:printcolumn:name="Age",type="date",JSONPath=".metadata.creationTimestamp"
 
 // ModelValidation is the Schema for the modelvalidations API
 type ModelValidation struct {
@@ -97,6 +152,47 @@ type ModelValidationList struct {
 	Items           []ModelValidation `json:"items"`
 }
 
+// GetAuthMethod returns the authentication method being used
+func (mv *ModelValidation) GetAuthMethod() string {
+	if mv.Spec.Config.SigstoreConfig != nil {
+		return "sigstore"
+	} else if mv.Spec.Config.PkiConfig != nil {
+		return "pki"
+	} else if mv.Spec.Config.PublicKeyConfig != nil {
+		return "public-key"
+	}
+	return "unknown"
+}
+
+// GetConfigHash returns a hash of the validation configuration for drift detection
+func (mv *ModelValidation) GetConfigHash() string {
+	return mv.Spec.Config.GetConfigHash()
+}
+
+// GetConfigHash returns a hash of the validation configuration for drift detection
+func (vc *ValidationConfig) GetConfigHash() string {
+	hasher := sha256.New()
+
+	if vc.SigstoreConfig != nil {
+		hasher.Write([]byte("sigstore"))
+		hasher.Write([]byte(vc.SigstoreConfig.CertificateIdentity))
+		hasher.Write([]byte(vc.SigstoreConfig.CertificateOidcIssuer))
+	} else if vc.PkiConfig != nil {
+		hasher.Write([]byte("pki"))
+		hasher.Write([]byte(vc.PkiConfig.CertificateAuthority))
+	} else if vc.PublicKeyConfig != nil {
+		hasher.Write([]byte("publickey"))
+		hasher.Write([]byte(vc.PublicKeyConfig.KeyPath))
+	}
+
+	if vc.ClientTrustConfig != nil {
+		hasher.Write([]byte("clienttrust"))
+		hasher.Write([]byte(vc.ClientTrustConfig.TrustConfigPath))
+	}
+
+	return fmt.Sprintf("%x", hasher.Sum(nil))[:16] // Use first 16 chars for brevity
+}
+
 func init() {
 	SchemeBuilder.Register(&ModelValidation{}, &ModelValidationList{})
 }