Merge branch 'main' into run-evaluations-from-ui

alvaroloes · web-flow · commit 1f40d7a56f04 · 2025-03-05T11:32:08.000Z
diff --git a/.github/workflows/app-build.yml b/.github/workflows/app-build.yml
@@ -21,9 +21,11 @@ env:
   GIT_REF: ${{ github.ref }} # GitHub Context
   FRONTEND_BUILD_CONTEXT: ./apps/opik-frontend # Repository VAR
   BACKEND_BUILD_CONTEXT: ./apps/opik-backend # Repository VAR
+  EVALUATOR_BUILD_CONTEXT: ./apps/aifindr-evaluations-runner # Repository VAR
   ECR_REGISTRY: ${{ vars.ECR_REGISTRY }} # Repository VAR
   ECR_BACKEND_REPOSITORY: ${{ vars.ECR_BACKEND_REPOSITORY }} # Repository VAR
   ECR_FRONTEND_REPOSITORY: ${{ vars.ECR_FRONTEND_REPOSITORY }} # Repository VAR
+  ECR_EVALUATOR_REPOSITORY: ${{ vars.ECR_EVALUATOR_REPOSITORY }} # Repository VAR
 
 jobs:
   # Check if latest tag is a release candidate and stop flow if it is
@@ -154,6 +156,18 @@ jobs:
           docker push $ECR_REGISTRY/$ECR_BACKEND_REPOSITORY:$APP_VERSION
           docker push $ECR_REGISTRY/$ECR_BACKEND_REPOSITORY:$IMAGE_TAG
 
+          if [ $DEBUG == "true" ]; then
+            echo "building evaluator image into: $ECR_REGISTRY/$ECR_EVALUATOR_REPOSITORY:$APP_VERSION"
+          fi
+
+          docker build -t $ECR_REGISTRY/$ECR_EVALUATOR_REPOSITORY:$APP_VERSION \
+            -f $EVALUATOR_BUILD_CONTEXT/Dockerfile \
+            $EVALUATOR_BUILD_CONTEXT
+
+          docker tag $ECR_REGISTRY/$ECR_EVALUATOR_REPOSITORY:$APP_VERSION $ECR_REGISTRY/$ECR_EVALUATOR_REPOSITORY:$IMAGE_TAG
+          docker push $ECR_REGISTRY/$ECR_EVALUATOR_REPOSITORY:$APP_VERSION
+          docker push $ECR_REGISTRY/$ECR_EVALUATOR_REPOSITORY:$IMAGE_TAG
+
   ecs-deploy:
     environment: "${{ inputs.environment || 'production' }}"
     env:
diff --git a/apps/aifindr-evaluations-runner/.env.example b/apps/aifindr-evaluations-runner/.env.example
@@ -1,2 +1,4 @@
-OPIK_URL=http://host.docker.internal:5173/api
-OPENAI_API_KEY=your-api-key-here
+OPIK_URL_OVERRIDE=http://host.docker.internal:5173/api
+OPENAI_API_KEY=your-api-key-here
+ELLMENTAL_API_URL=
+ELLMENTAL_API_KEY=
diff --git a/apps/aifindr-evaluations-runner/Dockerfile b/apps/aifindr-evaluations-runner/Dockerfile
@@ -1,4 +1,4 @@
-FROM python:3.11-slim
+FROM python:3.12-slim
 
 WORKDIR /app
 
diff --git a/apps/aifindr-evaluations-runner/main.py b/apps/aifindr-evaluations-runner/main.py
@@ -3,6 +3,12 @@
 import logging
 import asyncio
 import uuid
+from requests import request, Response
+
+from urllib.parse import urljoin, urlparse
+from typing import Dict
+
+from settings import settings
 from evaluator import EvaluationParams, ExperimentStatus, execute_evaluation
 
 # Configure logging
@@ -11,9 +17,12 @@
 
 app = FastAPI()
 
-TASK_QUEUE: asyncio.Queue[EvaluationParams] = asyncio.Queue(maxsize=10)  # Maximum number of evaluations in queue
+TASK_QUEUE: asyncio.Queue[EvaluationParams] = asyncio.Queue(
+    maxsize=10
+)  # Maximum number of evaluations in queue
 MAX_CONCURRENT_TASKS = 5  # Number of concurrent evaluations
 
+
 class RunEvaluationsRequest(BaseModel):
     workspace_name: str
     dataset_name: str
@@ -22,10 +31,21 @@ class RunEvaluationsRequest(BaseModel):
     base_prompt_name: str
     workflow: str
 
+
 class RunEvaluationsResponse(BaseModel):
     status: str
     task_id: str
 
+
+class HealthResponse(BaseModel):
+    ellmental: Dict[str, str]
+    opik: Dict[str, str]
+
+
+def get_domain(url: str) -> str:
+    return urlparse(url).netloc.split(":")[0]
+
+
 async def process_queue():
     """Background task to process queued evaluations"""
     while True:
@@ -40,12 +60,58 @@ async def process_queue():
         finally:
             TASK_QUEUE.task_done()
 
+
 @app.on_event("startup")
 async def startup_event():
     # Start background workers to process the queue
     for _ in range(MAX_CONCURRENT_TASKS):
         asyncio.create_task(process_queue())
 
+
+@app.get("/health", response_model=HealthResponse)
+async def health(timeout: int = 5):
+    ellmental_health_url: str = urljoin(settings.ELLMENTAL_API_URL, "/health")
+    opik_health_url: str = urljoin(settings.OPIK_URL_OVERRIDE, "/is-alive/ping")
+
+    ellm_health = {"status": "healthy", "message": "eLLMental is healthy"}
+    opik_health = {"status": "healthy", "message": "OPIK is healthy"}
+    try:
+        ellm_response: Response = request(
+            method="GET", url=ellmental_health_url, timeout=timeout
+        )
+        if ellm_response.status_code != 200:
+            ellm_health["status"] = "unhealthy"
+            ellm_health["message"] = str(ellm_response.text).replace(
+                get_domain(settings.ELLMENTAL_API_URL), "***"
+            )
+    except Exception as e:
+        ellm_health["status"] = "unhealthy"
+        ellm_health["message"] = str(e).replace(
+            get_domain(settings.ELLMENTAL_API_URL), "***"
+        )
+    try:
+        opik_response: Response = request(
+            method="GET", url=opik_health_url, timeout=timeout
+        )
+        if opik_response.status_code != 200:
+            opik_health["status"] = "unhealthy"
+            opik_health["message"] = str(opik_response.text).replace(
+                get_domain(settings.OPIK_URL_OVERRIDE), "***"
+            )
+    except Exception as e:
+        opik_health["status"] = "unhealthy"
+        opik_health["message"] = str(e).replace(
+            get_domain(settings.OPIK_URL_OVERRIDE), "***"
+        )
+
+    response = {"ellmental": ellm_health, "opik": opik_health}
+
+    if all(health["status"] == "healthy" for health in [ellm_health, opik_health]):
+        return HealthResponse(**response)
+    else:
+        raise HTTPException(status_code=503, detail=response)
+
+
 @app.post("/evaluations/run", response_model=RunEvaluationsResponse)
 async def run_evaluation(input: RunEvaluationsRequest, req: Request):
     try:
@@ -67,11 +133,17 @@ async def run_evaluation(input: RunEvaluationsRequest, req: Request):
             TASK_QUEUE.put_nowait(evaluation_params)
             logger.info("Evaluation task added to queue")
         except asyncio.QueueFull:
-            logger.error(f"Queue is full. Evaluation task not added to the queue: {evaluation_params}")
-            raise HTTPException(status_code=503, detail="Server is currently at maximum capacity. Please try again later.")
-        
-        return RunEvaluationsResponse(status=ExperimentStatus.RUNNING.value, task_id=task_id)
+            logger.error(
+                f"Queue is full. Evaluation task not added to the queue: {evaluation_params}"
+            )
+            raise HTTPException(
+                status_code=503,
+                detail="Server is currently at maximum capacity. Please try again later.",
+            )
+
+        return RunEvaluationsResponse(
+            status=ExperimentStatus.RUNNING.value, task_id=task_id
+        )
     except Exception as e:
         logger.error(f"Error processing request: {str(e)}")
-        raise HTTPException(status_code=500, detail=str(e)) 
-    
+        raise HTTPException(status_code=500, detail=str(e))
diff --git a/apps/aifindr-evaluations-runner/settings.py b/apps/aifindr-evaluations-runner/settings.py
@@ -1,20 +1,33 @@
-from pydantic_settings import BaseSettings
+import os
+from functools import lru_cache
+
+from pydantic_settings import BaseSettings, SettingsConfigDict
 from pydantic import field_validator
 
+
 class Settings(BaseSettings):
+    model_config = SettingsConfigDict(env_file=".env", extra="allow")
     OPIK_URL_OVERRIDE: str = "http://host.docker.internal:5173/api"
     OPENAI_API_KEY: str = ""
     ELLMENTAL_API_URL: str = ""
     ELLMENTAL_API_KEY: str = ""
-    
+
     @field_validator("*")
     def no_empty_strings(cls, v):
         if isinstance(v, str) and not v:
             raise ValueError("Field cannot be empty")
         return v
-    
-    class Config:
-        env_file = ".env"
-        extra = "ignore"  # Permite ignorar variables extra
 
-settings = Settings()
+
+class EnvSettings(BaseSettings):
+    settings: Settings = Settings()
+
+
+@lru_cache()  # Cache settings to avoid re-reading the .env file on each call
+def get_settings() -> Settings:
+    if not os.getenv("SETTINGS"):
+        return Settings()
+    return EnvSettings().settings
+
+
+settings = get_settings()
diff --git a/deployment/docker-compose/docker-compose.yaml b/deployment/docker-compose/docker-compose.yaml
@@ -121,6 +121,8 @@ services:
     build:
       context: ../../apps/aifindr-evaluations-runner
       dockerfile: Dockerfile
+    env_file:
+      - ../../apps/aifindr-evaluations-runner/.env
     ports:
       - "8001:8001"
 

| Original file line number | Diff line number | Diff line change |
| --- | --- | --- |
| | | `@@ -1,4 +1,4 @@` |
| `1` | | `-FROM python:3.11-slim` |
| | `1` | `+FROM python:3.12-slim` |
| `2` | `2` | |
| `3` | `3` | `WORKDIR /app` |
| `4` | `4` | |