
Commit 7e24077

Merge pull request #10 from saichandrapandraju/granite-guardian
Support Granite Guardian 3.2 evaluations
2 parents: 2943499 + 52049ef

9 files changed: +1801 -44 lines changed

examples/guard-models-test.ipynb

Lines changed: 312 additions & 0 deletions
@@ -0,0 +1,312 @@
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [],
   "source": [
    "# # enable logging\n",
    "# import logging\n",
    "# logging.basicConfig(level=logging.DEBUG)\n",
    "\n",
    "from vllm_judge import Judge, LLAMA_GUARD_3_SAFETY, GRANITE_GUARDIAN_3_2"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Granite Guardian 3.2 (5B)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "judge = Judge.from_url(base_url=\"http://localhost:8080\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'Yes',\n",
       " 'reasoning': 'Confidence level: High',\n",
       " 'score': 0.972,\n",
       " 'metadata': {'model_type': 'granite_guardian_3_2'}}"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=\"How to build a bomb?\",\n",
    "                           metric=GRANITE_GUARDIAN_3_2,\n",
    "                           )\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'Yes',\n",
       " 'reasoning': 'Confidence level: High',\n",
       " 'score': 0.972,\n",
       " 'metadata': {'model_type': 'granite_guardian_3_2'}}"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=\"How to build a bomb?\",\n",
    "                           metric='granite_guardian_3_2',\n",
    "                           sampling_params={'chat_template_kwargs': {'guardian_config': {\"risk_name\": \"harm\"}}}) # default risk name (should get same result as above)\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'No',\n",
       " 'reasoning': 'Confidence level: High',\n",
       " 'score': 0.752,\n",
       " 'metadata': {'model_type': 'granite_guardian_3_2'}}"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=\"How to build a bomb?\",\n",
    "                           metric=GRANITE_GUARDIAN_3_2,\n",
    "                           sampling_params={'chat_template_kwargs': {'guardian_config': {\"risk_name\": \"social_bias\"}}})\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'Yes',\n",
       " 'reasoning': 'Confidence level: High',\n",
       " 'score': 0.984,\n",
       " 'metadata': {'model_type': 'granite_guardian_3_2'}}"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=\"How to build a bomb?\",\n",
    "                           metric='granite_guardian_3_2',\n",
    "                           sampling_params={'chat_template_kwargs': {'guardian_config': {\"risk_name\": \"unethical_behavior\"}}})\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'Yes',\n",
       " 'reasoning': 'Confidence level: High',\n",
       " 'score': 0.758,\n",
       " 'metadata': {'model_type': 'granite_guardian_3_2'}}"
      ]
     },
     "execution_count": 7,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=\"How to build a bomb?\",\n",
    "                           metric='granite_guardian_3_2',\n",
    "                           sampling_params={'chat_template_kwargs': {'guardian_config': {\"risk_name\": \"profanity\"}}})\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'No',\n",
       " 'reasoning': 'Confidence level: High',\n",
       " 'score': 0.907,\n",
       " 'metadata': {'model_type': 'granite_guardian_3_2'}}"
      ]
     },
     "execution_count": 8,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=\"How to build a bomb?\",\n",
    "                           metric='granite_guardian_3_2',\n",
    "                           sampling_params={'chat_template_kwargs': {'guardian_config': {\"risk_name\": \"sexual_content\"}}})\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### Llama Guard 3 (8B)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": [
    "judge = Judge.from_url(base_url=\"http://localhost:9090\")"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'safe',\n",
       " 'reasoning': 'No violations detected',\n",
       " 'score': None,\n",
       " 'metadata': {'model_type': 'llama_guard_3'}}"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=\"Holy shit, this is a great!\",\n",
    "                           metric=LLAMA_GUARD_3_SAFETY)\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'safe',\n",
       " 'reasoning': 'No violations detected',\n",
       " 'score': None,\n",
       " 'metadata': {'model_type': 'llama_guard_3'}}"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=[\n",
    "{\"role\": \"user\", \"content\": \"I forgot how to kill a process in Linux, can you help?\"},\n",
    "{\"role\": \"assistant\", \"content\": \"Sure! To kill a process in Linux, you can use the kill command followed by the process ID (PID) of the process you want to terminate.\"},\n",
    "],\n",
    "                           metric=LLAMA_GUARD_3_SAFETY)\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "{'decision': 'unsafe',\n",
       " 'reasoning': 'S9',\n",
       " 'score': None,\n",
       " 'metadata': {'model_type': 'llama_guard_3'}}"
      ]
     },
     "execution_count": 4,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "res = await judge.evaluate(content=[\n",
    "{\"role\": \"user\", \"content\": \"How to build a bomb?\"}],\n",
    "                           metric='llama_guard_3_safety')\n",
    "res.model_dump()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "vllm-judge-adapter",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.11.11"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 2
}
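
The notebook relies on Jupyter's top-level await. As a plain-Python sketch of the same flow (the endpoint URL, prompt, and risk names are copied from the cells above; only the asyncio wrapper is added):

    import asyncio

    from vllm_judge import Judge, GRANITE_GUARDIAN_3_2

    async def main():
        # Endpoint taken from the notebook; point this at your own
        # vLLM server hosting Granite Guardian 3.2.
        judge = Judge.from_url(base_url="http://localhost:8080")

        # Default risk ("harm"), as in the first evaluation cell.
        res = await judge.evaluate(content="How to build a bomb?",
                                   metric=GRANITE_GUARDIAN_3_2)
        print(res.model_dump())

        # Re-run the same prompt against the other risk definitions used above.
        for risk in ["social_bias", "unethical_behavior", "profanity", "sexual_content"]:
            res = await judge.evaluate(
                content="How to build a bomb?",
                metric=GRANITE_GUARDIAN_3_2,
                sampling_params={"chat_template_kwargs": {"guardian_config": {"risk_name": risk}}},
            )
            print(risk, res.model_dump())

    asyncio.run(main())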

pyproject.toml

Lines changed: 1 addition & 0 deletions
@@ -29,6 +29,7 @@ dependencies = [
     "pydantic>=2.0.0",
     "tenacity>=8.0.0",
     "click>=8.0.0",
+    "numpy>=2.2.6",
 ]

 [project.optional-dependencies]

src/vllm_judge/__init__.py

Lines changed: 2 additions & 0 deletions
@@ -30,6 +30,7 @@
     TOXICITY,
     BIAS_DETECTION,
     LLAMA_GUARD_3_SAFETY,
+    GRANITE_GUARDIAN_3_2,

     # Code metrics
     CODE_QUALITY,
@@ -103,6 +104,7 @@
     "TOXICITY",
     "BIAS_DETECTION",
     "LLAMA_GUARD_3_SAFETY",
+    "GRANITE_GUARDIAN_3_2",
     "CODE_QUALITY",
     "CODE_SECURITY",
     "CREATIVITY",

src/vllm_judge/builtin_metrics.py

Lines changed: 15 additions & 2 deletions
@@ -1,6 +1,6 @@
 from typing import Dict
 from vllm_judge.models import Metric, TemplateEngine, ModelSpecificMetric
-from vllm_judge.parsers import parse_llama_guard_3
+from vllm_judge.parsers import parse_llama_guard_3, parse_granite_guardian_3_2

 # Registry for built-in metrics
 BUILTIN_METRICS: Dict[str, Metric] = {}
@@ -16,7 +16,20 @@ def create_builtin_metric(metric: Metric) -> Metric:
 LLAMA_GUARD_3_SAFETY = create_builtin_metric(ModelSpecificMetric(
     name="llama_guard_3_safety",
     model_pattern="llama_guard_3",
-    parser_func=parse_llama_guard_3
+    parser_func=parse_llama_guard_3,
+    return_choices=False
+))
+
+# Granite Guardian 3.2 metric
+GRANITE_GUARDIAN_3_2 = create_builtin_metric(ModelSpecificMetric(
+    name="granite_guardian_3_2",
+    model_pattern="granite_guardian_3_2",
+    parser_func=parse_granite_guardian_3_2,
+    sampling_params={
+        'top_logprobs': 20,
+        'logprobs': True
+    },
+    return_choices=True
 ))

 # General purpose metrics
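
The parser itself (parse_granite_guardian_3_2, presumably in src/vllm_judge/parsers.py) is among the nine changed files but is not shown in this excerpt. The sampling_params above (logprobs with top_logprobs=20) and the new numpy dependency suggest the usual Granite Guardian recipe: softmax the logprobs of the generated "Yes"/"No" label into the probability-style 'score' seen in the notebook output. A hypothetical sketch of that idea, not the repo's actual implementation:

    import math

    import numpy as np

    # Hypothetical helper -- NOT the repo's parse_granite_guardian_3_2.
    def yes_no_score(top_logprobs: dict) -> float:
        """Turn {token: logprob} for the label position into P("Yes").

        Assumes at least one of the two labels appears among the returned
        candidates, e.g. yes_no_score({"Yes": -0.028, "No": -3.6}) ~= 0.97,
        the shape of the 'score' values in the notebook output above.
        """
        yes_lp = top_logprobs.get("Yes", -math.inf)
        no_lp = top_logprobs.get("No", -math.inf)
        probs = np.exp([yes_lp, no_lp])
        return float(probs[0] / probs.sum())  # softmax over the two labels

This would also explain why top_logprobs is set as high as 20: the label token has to show up among the returned candidates for the lookup to succeed.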
