Add error handling, input validation, and logging to report_chart.py

nemanjaASE · nemanjaASE · commit 3d6018302e76 · 2025-03-11T00:01:33.000+01:00
diff --git a/agentic_security/report_chart.py b/agentic_security/report_chart.py
@@ -1,4 +1,5 @@
 import io
+import logging
 import string
 
 import matplotlib.pyplot as plt
@@ -9,150 +10,180 @@
 
 from .primitives import Table
 
+logging.basicConfig(
+    level=logging.INFO, format="%(asctime)s - %(levelname)s - %(message)s"
+)
+
 
 def plot_security_report(table: Table) -> io.BytesIO:
-    # Data preprocessing
-    data = pd.DataFrame(table)
-
-    # Sort by failure rate and reset index
-    data = data.sort_values("failureRate", ascending=False).reset_index(drop=True)
-    data["identifier"] = generate_identifiers(data)
-
-    # Plot setup
-    fig, ax = plt.subplots(figsize=(12, 10), subplot_kw={"projection": "polar"})
-    fig.set_facecolor("#f0f0f0")
-    ax.set_facecolor("#f0f0f0")
-
-    # Styling parameters
-    colors = ["#6C5B7B", "#C06C84", "#F67280", "#F8B195"][::-1]  # Pastel palette
-    # colors = ["#440154", "#3b528b", "#21908c", "#5dc863"]  # Viridis-inspired palette
-    cmap = LinearSegmentedColormap.from_list("custom", colors, N=256)
-    norm = Normalize(vmin=data["tokens"].min(), vmax=data["tokens"].max())
-
-    # Compute angles for the polar plot
-    angles = np.linspace(0, 2 * np.pi, len(data), endpoint=False)
-
-    # Plot bars
-    bars = ax.bar(
-        angles,
-        data["failureRate"],
-        width=0.5,
-        color=[cmap(norm(t)) for t in data["tokens"]],
-        alpha=0.8,
-        label="Failure Rate %",
-    )
-
-    # Customize polar plot
-    ax.set_theta_offset(np.pi / 2)
-    ax.set_theta_direction(-1)
-    ax.set_ylim(0, max(data["failureRate"]) * 1.1)  # Add some headroom
-
-    # Add labels (now using identifiers)
-    ax.set_xticks(angles)
-    ax.set_xticklabels(data["identifier"], fontsize=10, fontweight="bold")
-
-    # Add circular grid lines
-    ax.yaxis.grid(True, color="gray", linestyle=":", alpha=0.5)
-    ax.set_yticks(np.arange(0, max(data["failureRate"]), 20))
-    ax.set_yticklabels(
-        [f"{x}%" for x in range(0, int(max(data["failureRate"])), 20)], fontsize=8
-    )
-
-    # Add radial lines
-    ax.vlines(
-        angles,
-        0,
-        max(data["failureRate"]) * 1.1,
-        color="gray",
-        linestyle=":",
-        alpha=0.5,
-    )
-
-    # Color bar for token count
-    sm = ScalarMappable(cmap=cmap, norm=norm)
-    sm.set_array([])
-    cbar = fig.colorbar(sm, ax=ax, orientation="horizontal", pad=0.08, aspect=30)
-    cbar.set_label("Token Count (k)", fontsize=10, fontweight="bold")
-
-    # Title and caption
-    fig.suptitle(
-        "Security Report for Different Modules", fontsize=16, fontweight="bold", y=1.02
-    )
-    caption = "Report generated by https://github.com/msoedov/agentic_security"
-    fig.text(
-        0.5,
-        0.02,
-        caption,
-        fontsize=8,
-        ha="center",
-        va="bottom",
-        alpha=0.7,
-        fontweight="bold",
-    )
-
-    # Add failure rate values on the bars
-    for angle, radius, bar, identifier in zip(
-        angles, data["failureRate"], bars, data["identifier"]
-    ):
-        ax.text(
-            angle,
-            radius,
-            f"{identifier}: {radius:.1f}%",
+    try:
+        # Data preprocessing
+        if not isinstance(table, Table):
+            raise TypeError("Input argument must be a pandas DataFrame.")
+        logging.info("Data preprocessing started.")
+
+        data = pd.DataFrame(table)
+
+        # Sort by failure rate and reset index
+        data = data.sort_values("failureRate", ascending=False).reset_index(drop=True)
+        data["identifier"] = generate_identifiers(data)
+
+        # Plot setup
+        fig, ax = plt.subplots(figsize=(12, 10), subplot_kw={"projection": "polar"})
+        fig.set_facecolor("#f0f0f0")
+        ax.set_facecolor("#f0f0f0")
+        logging.info("Plot setup complete.")
+
+        # Styling parameters
+        colors = ["#6C5B7B", "#C06C84", "#F67280", "#F8B195"][::-1]  # Pastel palette
+        cmap = LinearSegmentedColormap.from_list("custom", colors, N=256)
+        norm = Normalize(vmin=data["tokens"].min(), vmax=data["tokens"].max())
+
+        # Compute angles for the polar plot
+        angles = np.linspace(0, 2 * np.pi, len(data), endpoint=False)
+
+        # Plot bars
+        bars = ax.bar(
+            angles,
+            data["failureRate"],
+            width=0.5,
+            color=[cmap(norm(t)) for t in data["tokens"]],
+            alpha=0.8,
+            label="Failure Rate %",
+        )
+
+        # Customize polar plot
+        ax.set_theta_offset(np.pi / 2)
+        ax.set_theta_direction(-1)
+        ax.set_ylim(0, max(data["failureRate"]) * 1.1)  # Add some headroom
+
+        # Add labels (now using identifiers)
+        ax.set_xticks(angles)
+        ax.set_xticklabels(data["identifier"], fontsize=10, fontweight="bold")
+
+        # Add circular grid lines
+        ax.yaxis.grid(True, color="gray", linestyle=":", alpha=0.5)
+        ax.set_yticks(np.arange(0, max(data["failureRate"]), 20))
+        ax.set_yticklabels(
+            [f"{x}%" for x in range(0, int(max(data["failureRate"])), 20)], fontsize=8
+        )
+
+        # Add radial lines
+        ax.vlines(
+            angles,
+            0,
+            max(data["failureRate"]) * 1.1,
+            color="gray",
+            linestyle=":",
+            alpha=0.5,
+        )
+
+        # Color bar for token count
+        sm = ScalarMappable(cmap=cmap, norm=norm)
+        sm.set_array([])
+        cbar = fig.colorbar(sm, ax=ax, orientation="horizontal", pad=0.08, aspect=30)
+        cbar.set_label("Token Count (k)", fontsize=10, fontweight="bold")
+
+        # Title and caption
+        fig.suptitle(
+            "Security Report for Different Modules",
+            fontsize=16,
+            fontweight="bold",
+            y=1.02,
+        )
+        caption = "Report generated by https://github.com/msoedov/agentic_security"
+        fig.text(
+            0.5,
+            0.02,
+            caption,
+            fontsize=8,
             ha="center",
             va="bottom",
-            rotation=angle * 180 / np.pi - 90,
-            rotation_mode="anchor",
-            fontsize=7,
+            alpha=0.7,
             fontweight="bold",
-            color="black",
         )
 
-    # Add a table with identifiers and dataset names
-    table_data = [["Threat"]] + [
-        [f"{identifier}: {module} ({fr:.1f}%)"]
-        for identifier, fr, module in zip(
-            data["identifier"], data["failureRate"], data["module"]
-        )
-    ]
-    table = ax.table(
-        cellText=table_data,
-        loc="right",
-        cellLoc="left",
-    )
-    table.auto_set_font_size(False)
-    table.set_fontsize(8)
-
-    # Adjust table style
-    table.scale(1, 0.7)
-
-    for (row, col), cell in table.get_celld().items():
-        cell.set_edgecolor("none")
-        cell.set_facecolor("#f0f0f0" if row % 2 == 0 else "#e0e0e0")
-        cell.set_alpha(0.8)
-        cell.set_text_props(wrap=True)
-        if row == 0:
-            cell.set_text_props(fontweight="bold")
-
-    # Adjust layout and save
-
-    plt.tight_layout()
-    buf = io.BytesIO()
-    plt.savefig(buf, format="png", dpi=300, bbox_inches="tight")
-    plt.close(fig)
-    buf.seek(0)
-    return buf
+        # Add failure rate values on the bars
+        for angle, radius, bar, identifier in zip(
+            angles, data["failureRate"], bars, data["identifier"]
+        ):
+            ax.text(
+                angle,
+                radius,
+                f"{identifier}: {radius:.1f}%",
+                ha="center",
+                va="bottom",
+                rotation=angle * 180 / np.pi - 90,
+                rotation_mode="anchor",
+                fontsize=7,
+                fontweight="bold",
+                color="black",
+            )
+
+        # Add a table with identifiers and dataset names
+        table_data = [["Threat"]] + [
+            [f"{identifier}: {module} ({fr:.1f}%)"]
+            for identifier, fr, module in zip(
+                data["identifier"], data["failureRate"], data["module"]
+            )
+        ]
+        table = ax.table(cellText=table_data, loc="right", cellLoc="left")
+        table.auto_set_font_size(False)
+        table.set_fontsize(8)
+
+        # Adjust table style
+        table.scale(1, 0.7)
+        for (row, col), cell in table.get_celld().items():
+            cell.set_edgecolor("none")
+            cell.set_facecolor("#f0f0f0" if row % 2 == 0 else "#e0e0e0")
+            cell.set_alpha(0.8)
+            cell.set_text_props(wrap=True)
+            if row == 0:
+                cell.set_text_props(fontweight="bold")
+
+        # Adjust layout and save
+        plt.tight_layout()
+        buf = io.BytesIO()
+        plt.savefig(buf, format="png", dpi=300, bbox_inches="tight")
+        plt.close(fig)
+        buf.seek(0)
+        logging.info("Report successfully generated and saved to buffer.")
+        return buf
+
+    except Exception as e:
+        logging.error(f"Error in generating the security report: {e}")
+        raise
 
 
 def generate_identifiers(data: pd.DataFrame) -> list[str]:
-    data_length = len(data)
-    alphabet = string.ascii_uppercase
-    num_letters = len(alphabet)
-
-    identifiers = []
-    for i in range(data_length):
-        letter_index = i // num_letters
-        number = (i % num_letters) + 1
-        identifier = f"{alphabet[letter_index]}{number}"
-        identifiers.append(identifier)
-
-    return identifiers
+    try:
+        if not isinstance(data, pd.DataFrame):
+            raise TypeError("Input argument must be a pandas DataFrame.")
+
+        data_length = len(data)
+        if data_length == 0:
+            raise ValueError("DataFrame cannot be empty.")
+
+        alphabet = string.ascii_uppercase
+        num_letters = len(alphabet)
+        max_identifiers = num_letters * num_letters
+
+        if data_length > max_identifiers:
+            raise OverflowError(
+                f"Cannot generate more than {max_identifiers} unique identifiers."
+            )
+
+        identifiers = []
+        for i in range(data_length):
+            letter_index = i // num_letters
+            if letter_index >= num_letters:
+                raise IndexError("Identifier generation exceeded the supported range.")
+            number = (i % num_letters) + 1
+            identifier = f"{alphabet[letter_index]}{number}"
+            identifiers.append(identifier)
+
+        return identifiers
+
+    except (TypeError, ValueError, OverflowError, IndexError) as e:
+        logging.error(f"Error in generate_identifiers: {e}")
+        raise