add tests, dockerfile, deploy manifests

saichandrapandraju · saichandrapandraju · commit 3a4965a3ca45 · 2025-06-11T17:35:27.000-04:00
diff --git a/detectors/Dockerfile.judge b/detectors/Dockerfile.judge
@@ -0,0 +1,31 @@
+FROM registry.access.redhat.com/ubi9/ubi-minimal as base
+RUN microdnf update -y && \
+    microdnf install -y --nodocs \
+        python-pip python-devel && \
+    pip install --upgrade --no-cache-dir pip wheel && \
+    microdnf clean all
+RUN pip install --no-cache-dir torch
+
+# FROM icr.io/fm-stack/ubi9-minimal-py39-torch as builder
+FROM base as builder
+
+COPY ./common/requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+
+COPY ./llm_judge/requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+
+FROM builder
+
+WORKDIR /app
+ARG CACHEBUST=1
+RUN echo "$CACHEBUST"
+COPY ./common /common
+COPY ./llm_judge/app.py /app
+COPY ./llm_judge/detector.py /app
+COPY ./llm_judge/scheme.py /app
+
+EXPOSE 8000
+CMD ["uvicorn", "app:app", "--workers", "4", "--host", "0.0.0.0", "--port", "8000", "--log-config", "/common/log_conf.yaml"]
+
+# Alternative entrypoint (gunicorn managing uvicorn workers): gunicorn app:app --workers 4 --worker-class uvicorn.workers.UvicornWorker --bind 0.0.0.0:8000
diff --git a/detectors/llm_judge/README.md b/detectors/llm_judge/README.md
@@ -0,0 +1,8 @@
+# LLM Judge Detector
+
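+The LLM Judge detector integrates the [vLLM Judge](https://github.com/saichandrapandraju/vllm_judge) into the Guardrails Detector ecosystem. To deploy it on OpenShift, set `VLLM_BASE_URL` in `deploy/servingruntime.yaml` to your vLLM endpoint, then apply the manifests from this directory (`detectors/llm_judge`):
+
+```bash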
+oc apply -f deploy/servingruntime.yaml
+oc apply -f deploy/isvc.yaml
+```
diff --git a/detectors/llm_judge/__init__.py b/detectors/llm_judge/__init__.py
diff --git a/detectors/llm_judge/app.py b/detectors/llm_judge/app.py
@@ -8,8 +8,8 @@
 sys.path.insert(0, os.path.abspath(".."))
 
 from common.app import DetectorBaseAPI as FastAPI
-from detector import LLMJudgeDetector
-from scheme import (
+from .detector import LLMJudgeDetector
+from .scheme import (
     ContentAnalysisHttpRequest,
     ContentsAnalysisResponse,
     MetricsListResponse,
diff --git a/detectors/llm_judge/deploy/isvc.yaml b/detectors/llm_judge/deploy/isvc.yaml
@@ -0,0 +1,23 @@
+apiVersion: serving.kserve.io/v1beta1  # KServe InferenceService that deploys the LLM Judge detector
+kind: InferenceService
+metadata:
+  name: guardrails-detector-llm-judge
+  namespace: model-namespace  # same namespace as the ServingRuntime in deploy/servingruntime.yaml; NOTE(review): looks like a placeholder — confirm before applying
+  labels:
+    opendatahub.io/dashboard: 'true'
+  annotations:
+    openshift.io/display-name: guardrails-detector-llm-judge
+    security.opendatahub.io/enable-auth: 'true'
+    serving.knative.openshift.io/enablePassthrough: 'true'  # NOTE(review): Knative/Istio annotations may have no effect with RawDeployment below — confirm
+    sidecar.istio.io/inject: 'true'
+    sidecar.istio.io/rewriteAppHTTPProbers: 'true'
+    serving.kserve.io/deploymentMode: RawDeployment
+spec:
+  predictor:
+    maxReplicas: 1  # min == max: pinned to a single replica
+    minReplicas: 1
+    model:
+      modelFormat:
+        name: guardrails-detector-llm-judge  # matches supportedModelFormats[].name in deploy/servingruntime.yaml
+      name: ''  # NOTE(review): model name is left empty — confirm this is intentional
+      runtime: guardrails-detector-runtime-judge  # metadata.name of the ServingRuntime in deploy/servingruntime.yaml
diff --git a/detectors/llm_judge/deploy/servingruntime.yaml b/detectors/llm_judge/deploy/servingruntime.yaml
@@ -0,0 +1,45 @@
+apiVersion: serving.kserve.io/v1alpha1  # KServe ServingRuntime that runs the LLM Judge detector image
+kind: ServingRuntime
+metadata:
+  name: guardrails-detector-runtime-judge  # referenced by spec.predictor.model.runtime in deploy/isvc.yaml
+  namespace: model-namespace  # NOTE(review): looks like a placeholder namespace — confirm before applying
+  annotations:
+    openshift.io/display-name: Guardrails LLM Judge Detector ServingRuntime for KServe
+  labels:
+    opendatahub.io/dashboard: 'true'
+spec:
+  annotations:
+    prometheus.io/port: '8080'  # NOTE(review): the container below listens on 8000 — confirm the metrics port
+    prometheus.io/path: '/metrics'
+  multiModel: false
+  supportedModelFormats:
+    - autoSelect: true
+      name: guardrails-detector-llm-judge  # matches modelFormat.name in deploy/isvc.yaml
+  containers:
+    - name: kserve-container
+      image: quay.io/rh-ee-spandraj/guardrails-detector-judge:latest  # NOTE(review): mutable `latest` tag — consider pinning a version or digest
+      command:
+        - uvicorn
+        - app:app  # NOTE(review): app.py in this commit switches to relative imports (`from .detector ...`); confirm it still loads as top-level module `app`
+      args:
+        - "--workers"
+        - "1"  # Dockerfile.judge's CMD uses 4 workers; this command/args pair replaces that CMD
+        - "--host"
+        - "0.0.0.0"
+        - "--port"
+        - "8000"  # same value as containerPort below
+        - "--log-config"
+        - "/common/log_conf.yaml"  # presumably provided by `COPY ./common /common` in Dockerfile.judge — verify the file exists there
+      env:
+        - name: VLLM_BASE_URL
+          value: "http://qwen2-predictor:8080" # <-- Change this to your vLLM URL
+      ports:
+        - containerPort: 8000
+          protocol: TCP
+      resources:
+        requests:
+          memory: "5Gi"
+          cpu: "1"
+        limits:
+          memory: "10Gi"
+          cpu: "2"
diff --git a/detectors/llm_judge/detector.py b/detectors/llm_judge/detector.py
@@ -7,7 +7,7 @@
 from vllm_judge import Judge, EvaluationResult, BUILTIN_METRICS
 from vllm_judge.exceptions import MetricNotFoundError
 from common.app import logger
-from scheme import (
+from .scheme import (
     ContentAnalysisHttpRequest,
     ContentAnalysisResponse,
     ContentsAnalysisResponse,
@@ -41,7 +41,7 @@ def _initialize_judge(self) -> None:
             logger.info(f"Available metrics: {', '.join(sorted(self.available_metrics))}")
             
         except Exception as e:
-            logger.error(f"Failed to initialize LLM Judge: {e}")
+            logger.error(f"Failed to detect model: {e}")
             raise
     
     async def evaluate_single_content(self, content: str, params: Dict[str, Any]) -> ContentAnalysisResponse:
diff --git a/detectors/llm_judge/requirements.txt b/detectors/llm_judge/requirements.txt
@@ -1 +1,2 @@
-vllm-judge>=0.1.5
+vllm-judge>=0.1.5
+pyyaml>=6.0.2
diff --git a/tests/conftest.py b/tests/conftest.py
@@ -9,10 +9,12 @@ def setup_imports():
     project_root = os.path.dirname(os.path.dirname(__file__))
     detectors_path = os.path.join(project_root, "detectors")
     huggingface_path = os.path.join(detectors_path, "huggingface")
+    llm_judge_path = os.path.join(detectors_path, "llm_judge")
     paths = [
         huggingface_path,
         detectors_path,
         project_root,
+        llm_judge_path,
     ]
 
     for path in paths:
diff --git a/tests/detectors/llm_judge/test_llm_judge_detector.py b/tests/detectors/llm_judge/test_llm_judge_detector.py
diff --git a/tests/detectors/llm_judge/test_performance.py b/tests/detectors/llm_judge/test_performance.py
diff --git a/tox.ini b/tox.ini

Original file line number	Diff line number	Diff line change
`@@ -1 +1,2 @@`
`1`		`-vllm-judge>=0.1.5`
	`1`	`+vllm-judge>=0.1.5`
	`2`	`+pyyaml>=6.0.2`