Add APVD text

ruivieira · ruivieira · commit 5eabe2a9dfef · 2022-12-09T15:47:27.000Z
diff --git a/examples/Group fairness metrics.ipynb b/examples/Group fairness metrics.ipynb
@@ -5,7 +5,15 @@
    "id": "62e70a2a",
    "metadata": {},
    "source": [
-    "# Data"
+    "# Data\n",
+    "\n",
+    "For the illustration of the group fairness metrics in TrustyAI, two synthetic datasets were created with the same input features and outcome types. \n",
+    "The outcome is whether a certain individual reaches a 50k income threshold, using age, race and gender as categorical inputs. Both datasets consist of $N=10000$ data points.\n",
+    "The gender values are allocated with a proportion of 20% to `gender=0` and 80% to `gender=1`.\n",
+    "\n",
+    "In both datasets, the likelihood of a positive outcome increases with age (with uniform probability), regardless of race or gender.\n",
+    "The first dataset, deemed _unbiased_, simply allocates the income value with a uniform random value, regardless of race or gender.\n",
+    "The second dataset, deemed _biased_, allocates a positive outcome to `gender=0` with a lower probability than `gender=1`."
    ]
   },
   {
@@ -202,7 +210,7 @@
     "where $\\hat{y}=1$ is the favorable outcome and $\\mathcal{D}_u$, $\\mathcal{D}_p$ are respectively the unprivileged and privileged group data.\n",
     "\n",
     "\n",
-    "### Not so biased dataset"
+    "### Unbiased dataset"
    ]
   },
   {
@@ -265,7 +273,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 24,
    "id": "2b2c678a",
    "metadata": {},
    "outputs": [],
@@ -283,7 +291,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 7,
    "id": "9e548018",
    "metadata": {},
    "outputs": [
@@ -317,7 +325,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 8,
    "id": "63b953c9",
    "metadata": {},
    "outputs": [
@@ -332,7 +340,7 @@
        "Name: income, dtype: int64"
       ]
      },
-     "execution_count": 9,
+     "execution_count": 8,
      "metadata": {},
      "output_type": "execute_result"
     }
@@ -344,7 +352,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 10,
+   "execution_count": 9,
    "id": "aed61b77",
    "metadata": {},
    "outputs": [
@@ -354,7 +362,7 @@
        "<AxesSubplot:xlabel='gender'>"
       ]
      },
-     "execution_count": 10,
+     "execution_count": 9,
      "metadata": {},
      "output_type": "execute_result"
     },
@@ -375,7 +383,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 11,
+   "execution_count": 10,
    "id": "901e5720",
    "metadata": {},
    "outputs": [],
@@ -390,7 +398,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 12,
+   "execution_count": 11,
    "id": "7be544a7",
    "metadata": {},
    "outputs": [
@@ -438,7 +446,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 13,
+   "execution_count": 12,
    "id": "949fae2f",
    "metadata": {},
    "outputs": [],
@@ -452,7 +460,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
+   "execution_count": 13,
    "id": "2e601762",
    "metadata": {},
    "outputs": [
@@ -478,7 +486,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
+   "execution_count": 14,
    "id": "3231326d",
    "metadata": {},
    "outputs": [],
@@ -490,7 +498,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 16,
+   "execution_count": 15,
    "id": "4b88eec8",
    "metadata": {},
    "outputs": [
@@ -536,7 +544,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 22,
+   "execution_count": 16,
    "id": "50814c63",
    "metadata": {},
    "outputs": [],
@@ -552,7 +560,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 23,
+   "execution_count": 17,
    "id": "cedbd492",
    "metadata": {},
    "outputs": [
@@ -581,12 +589,14 @@
    "id": "74cf44c7",
    "metadata": {},
    "source": [
-    "# Average Predictive Value Difference"
+    "## Average Predictive Value Difference\n",
+    "\n",
+    "The _Average Predictive Value Difference (APVD)_ measures the difference in the average accuracy of predicted values between the privileged and unprivileged groups in a dataset. \n"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 21,
+   "execution_count": 18,
    "id": "ca591646",
    "metadata": {},
    "outputs": [
@@ -603,35 +613,12 @@
     "\n",
     "score = average_predictive_value_difference(test=bias,\n",
     "                                truth=nobias,\n",
-    "                                privilege_columns=[2],\n",
+    "                                privilege_columns=[\"gender\"],\n",
     "                                privilege_values=[1],\n",
     "                                positive_class=[1])\n",
     "print(score)"
    ]
   },
-  {
-   "cell_type": "code",
-   "execution_count": 22,
-   "id": "611a0a6f",
-   "metadata": {},
-   "outputs": [
-    {
-     "name": "stdout",
-     "output_type": "stream",
-     "text": [
-      "-0.052866818520044656\n"
-     ]
-    }
-   ],
-   "source": [
-    "score = average_predictive_value_difference(test=bias,\n",
-    "                                truth=nobias,\n",
-    "                                privilege_columns=[2],\n",
-    "                                privilege_values=[0],\n",
-    "                                positive_class=[1])\n",
-    "print(score)"
-   ]
-  },
   {
    "cell_type": "markdown",
    "id": "b85694b4",
@@ -650,7 +637,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 23,
+   "execution_count": 19,
    "id": "e1a03db7",
    "metadata": {},
    "outputs": [],
@@ -660,7 +647,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 24,
+   "execution_count": 20,
    "id": "da1c2775",
    "metadata": {},
    "outputs": [],
@@ -692,7 +679,7 @@
     "model = Model(xgb.predict, dataframe_input=True, output_names=[\"approved\"])\n",
     "score = statistical_parity_difference_model(samples=X,\n",
     "                                            model=model,\n",
-    "                                            privilege_columns=[2],\n",
+    "                                            privilege_columns=[\"gender\"],\n",
     "                                            privilege_values=[1],\n",
     "                                            favorable=[favorable])\n",
     "print(score)"
@@ -725,7 +712,7 @@
     "\n",
     "score = disparate_impact_ratio_model(samples=X,\n",
     "                                            model=model,\n",
-    "                                            privilege_columns=[2],\n",
+    "                                            privilege_columns=[\"gender\"],\n",
     "                                            privilege_values=[1],\n",
     "                                            favorable=[favorable])\n",
     "print(score)"
@@ -758,7 +745,7 @@
     "\n",
     "score = average_odds_difference_model(samples=X,\n",
     "                                      model=model,\n",
-    "                                      privilege_columns=[2],\n",
+    "                                      privilege_columns=[\"gender\"],\n",
     "                                      privilege_values=[1],\n",
     "                                      positive_class=[1])\n",
     "print(score)"