Merge pull request #11 from lucasalvaa/fast-API

SimoCimmi · web-flow · commit 9c087880372f · 2026-01-29T16:31:31.000+01:00
Fast API and Dockerfile
diff --git a/Dockerfile b/Dockerfile
@@ -0,0 +1,35 @@
+# Base image: slim variant of the official Python 3.12 image
+FROM python:3.12-slim
+
+# Do not write .pyc files and do not buffer stdout/stderr
+ENV PYTHONDONTWRITEBYTECODE=1
+ENV PYTHONUNBUFFERED=1
+
+WORKDIR /app
+
+# Upgrade system packages and install libopenjp2-7, then remove the apt
+# package lists so they do not end up in the image layer
+RUN apt-get update && apt-get upgrade -y && apt-get install -y --no-install-recommends \
+    libopenjp2-7 \
+    && rm -rf /var/lib/apt/lists/*
+
+# Bring the packaging tools up to date before installing dependencies
+RUN pip install --no-cache-dir --upgrade pip setuptools wheel
+
+# Python dependencies of the API
+RUN pip install --no-cache-dir \
+    fastapi \
+    uvicorn \
+    python-multipart \
+    "pillow>=11.0.0"
+
+# PyTorch and torchvision, installed from the CPU wheel index
+RUN pip install --no-cache-dir \
+    torch torchvision \
+    --index-url https://download.pytorch.org/whl/cpu
+
+# Create an unprivileged user and switch to it for the container process
+RUN useradd -m appuser
+USER appuser
+
+# Copy the API script and the fine-tuned model weights into the work directory
+COPY src/api.py .
+COPY --chown=appuser:appuser pipeline3/effnet_s/finetuned/model.pth ./weights/model.pth
+
+# Port 8080 is the one api.py passes to uvicorn.run
+EXPOSE 8080
+CMD ["python", "api.py"]
diff --git a/ruff.toml b/ruff.toml
@@ -20,6 +20,8 @@ ignore = [
     "D100", # Spesso i docstring nei file __init__.py sono ridondanti
     "ANN101", # Non serve annotare 'self'
     "ANN102", # Non serve annotare 'cls'
+    "N812",
+    "B008"
 ]
 
 [lint.mccabe]
diff --git a/src/api.py b/src/api.py
@@ -0,0 +1,123 @@
+import io
+import time
+from typing import Dict, Tuple
+
+import torch
+import torch.nn as nn
+import torch.nn.functional as F
+import uvicorn
+from fastapi import FastAPI, File, HTTPException, UploadFile
+from PIL import Image
+from pydantic import BaseModel
+from torchvision import models, transforms
+
+# Relative path of the fine-tuned weights file
+MODEL_PATH = "weights/model.pth"  # Container path
+# Name of the torchvision model constructor; also returned in API responses
+MODEL_VERSION = "efficientnet_v2_s"
+
+# Output labels: a predicted index is mapped to its name by position in this list.
+# NOTE(review): the order presumably mirrors the label encoding used during
+# training -- confirm before reordering or adding entries.
+CLASSES = [
+    "demodicosis",
+    "dermatitis",
+    "fungal_infections",
+    "healthy",
+    "hypersensitivity",
+    "ringworm",
+]
+
+# FastAPI application instance on which the /predict endpoint is registered
+app = FastAPI(title="Dog Skin Disease Classifier")
+
+
+def load_model() -> Tuple[nn.Module, torch.device]:
+    """Load the EfficientNetV2_S model and its fine-tuned weights.
+
+    The architecture is modified by replacing the final classifier
+    to adapt it to the problem-specific number of classes.
+
+    Returns:
+        Tuple[nn.Module, torch.device]: The loaded model and the device (CPU).
+
+    """
+    # Initialize the model
+    model = getattr(models, MODEL_VERSION)(weights=None)
+
+    # In EfficientNetV2, classifier is accessible through model.classifier[1]
+    # Structure: [0] Dropout, [1] Linear
+    n_inputs = model.classifier[1].in_features
+    model.classifier[1] = nn.Linear(n_inputs, len(CLASSES))
+
+    # state_dict loading
+    device = torch.device("cpu")
+    state_dict = torch.load(MODEL_PATH, map_location=device, weights_only=True)
+
+    model.load_state_dict(state_dict)
+    model.eval()
+    return model, device
+
+
+# Model is loaded once, when the module is imported, and reused by every request
+model, device = load_model()
+
+# Preprocessing applied to each uploaded image: resize to 224x224, convert to a
+# tensor, then normalize each channel with the mean/std below.
+# NOTE(review): these look like the usual ImageNet statistics -- confirm they
+# match the preprocessing used during training.
+preprocess = transforms.Compose(
+    [
+        transforms.Resize((224, 224)),
+        transforms.ToTensor(),
+        transforms.Normalize(mean=[0.485, 0.456, 0.406], std=[0.229, 0.224, 0.225]),
+    ]
+)
+
+
+class PredictionResponse(BaseModel):
+    """Response schema of the ``/predict`` endpoint.
+
+    Attributes:
+        label_name (str): Name of the predicted class.
+        confidence_score (float): Probability associated with the predicted class.
+        inference_time_ms (float): Elapsed time measured by the endpoint, in
+            milliseconds (covers reading the upload, preprocessing and inference).
+        model_version_id (str): Model version identifier.
+
+    """
+
+    label_name: str
+    confidence_score: float
+    inference_time_ms: float
+    model_version_id: str
+
+
+@app.post("/predict", response_model=PredictionResponse)
+async def predict(file: UploadFile = File(...)) -> Dict:
+    """Upon receiving an image, it performs preprocessing and returns the prediction.
+
+    Args:
+        file (UploadFile): Image file uploaded via POST request.
+
+    Returns:
+        Dict: Classification result with score and execution time.
+
+    """
+    start_time = time.perf_counter()
+
+    # Read the uploaded image
+    content = await file.read()
+    image = Image.open(io.BytesIO(content)).convert("RGB")
+
+    # Prepare the image to be fed as input to the model
+    input_tensor = preprocess(image).unsqueeze(0).to(device)
+
+    # Inference without gradient calculation
+    with torch.no_grad():
+        outputs = model(input_tensor)
+        probabilities = F.softmax(outputs[0], dim=0)
+
+    # Class and confidence score extraction
+    conf, idx = torch.max(probabilities, 0)
+    label = CLASSES[idx.item()]
+
+    return {
+        "label_name": label,
+        "confidence_score": round(float(conf), 4),
+        "inference_time_ms": round((time.perf_counter() - start_time) * 1000, 2),
+        "model_version_id": MODEL_VERSION,
+    }
+
+
+if __name__ == "__main__":
+    # Bind to all interfaces so the server is reachable from outside the container
+    uvicorn.run(app, host="0.0.0.0", port=8080)

Original file line number	Diff line number	Diff line change
`@@ -20,6 +20,8 @@ ignore = [`
`20`	`20`	`"D100", # Spesso i docstring nei file __init__.py sono ridondanti`
`21`	`21`	`"ANN101", # Non serve annotare 'self'`
`22`	`22`	`"ANN102", # Non serve annotare 'cls'`
	`23`	`+ "N812",`
	`24`	`+ "B008"`
`23`	`25`	`]`
`24`	`26`
`25`	`27`	`[lint.mccabe]`