Merge pull request #105 from NGO-Algorithm-Audit/JFP_edits

jfparie · web-flow · commit a3be459b03c0 · 2025-06-11T11:32:22.000+02:00
Jfp edits
diff --git a/notebooks/synthetic data generation tool/GC_drop_LawSchoolAdmissionBar.ipynb b/notebooks/synthetic data generation tool/GC_drop_LawSchoolAdmissionBar.ipynb
@@ -553,9 +553,24 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 11,
+   "execution_count": 14,
    "metadata": {},
-   "outputs": [],
+   "outputs": [
+    {
+     "ename": "ValueError",
+     "evalue": "All objects passed were None",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mValueError\u001b[0m                                Traceback (most recent call last)",
+      "Cell \u001b[0;32mIn[14], line 22\u001b[0m\n\u001b[1;32m     20\u001b[0m     encoders[col] \u001b[38;5;241m=\u001b[39m encoder\n\u001b[1;32m     21\u001b[0m     data\u001b[38;5;241m.\u001b[39mdrop(columns\u001b[38;5;241m=\u001b[39m[col], inplace\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m)\n\u001b[0;32m---> 22\u001b[0m     data \u001b[38;5;241m=\u001b[39m \u001b[43mpd\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mconcat\u001b[49m\u001b[43m(\u001b[49m\u001b[43m[\u001b[49m\u001b[43mdata\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mreset_index\u001b[49m\u001b[43m(\u001b[49m\u001b[43mdrop\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43minplace\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\u001b[43m)\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mtransformed_data\u001b[49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43mreset_index\u001b[49m\u001b[43m(\u001b[49m\u001b[43mdrop\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43minplace\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;28;43;01mTrue\u001b[39;49;00m\u001b[43m)\u001b[49m\u001b[43m]\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43maxis\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[38;5;241;43m1\u001b[39;49m\u001b[43m)\u001b[49m\n\u001b[1;32m     24\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m dtype \u001b[38;5;241m==\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mnumerical\u001b[39m\u001b[38;5;124m\"\u001b[39m:\n\u001b[1;32m     25\u001b[0m     scaler \u001b[38;5;241m=\u001b[39m StandardScaler(with_mean\u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m, with_std\u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m)\n",
+      "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/pandas/core/reshape/concat.py:382\u001b[0m, in \u001b[0;36mconcat\u001b[0;34m(objs, axis, join, ignore_index, keys, levels, names, verify_integrity, sort, copy)\u001b[0m\n\u001b[1;32m    379\u001b[0m \u001b[38;5;28;01melif\u001b[39;00m copy \u001b[38;5;129;01mand\u001b[39;00m using_copy_on_write():\n\u001b[1;32m    380\u001b[0m     copy \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;01mFalse\u001b[39;00m\n\u001b[0;32m--> 382\u001b[0m op \u001b[38;5;241m=\u001b[39m \u001b[43m_Concatenator\u001b[49m\u001b[43m(\u001b[49m\n\u001b[1;32m    383\u001b[0m \u001b[43m    \u001b[49m\u001b[43mobjs\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    384\u001b[0m \u001b[43m    \u001b[49m\u001b[43maxis\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43maxis\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    385\u001b[0m \u001b[43m    \u001b[49m\u001b[43mignore_index\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mignore_index\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    386\u001b[0m \u001b[43m    \u001b[49m\u001b[43mjoin\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mjoin\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    387\u001b[0m \u001b[43m    \u001b[49m\u001b[43mkeys\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mkeys\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    388\u001b[0m \u001b[43m    \u001b[49m\u001b[43mlevels\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mlevels\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    389\u001b[0m \u001b[43m    \u001b[49m\u001b[43mnames\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mnames\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    390\u001b[0m \u001b[43m    \u001b[49m\u001b[43mverify_integrity\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mverify_integrity\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    391\u001b[0m \u001b[43m    
\u001b[49m\u001b[43mcopy\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43mcopy\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    392\u001b[0m \u001b[43m    \u001b[49m\u001b[43msort\u001b[49m\u001b[38;5;241;43m=\u001b[39;49m\u001b[43msort\u001b[49m\u001b[43m,\u001b[49m\n\u001b[1;32m    393\u001b[0m \u001b[43m\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    395\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m op\u001b[38;5;241m.\u001b[39mget_result()\n",
+      "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/pandas/core/reshape/concat.py:445\u001b[0m, in \u001b[0;36m_Concatenator.__init__\u001b[0;34m(self, objs, axis, join, keys, levels, names, ignore_index, verify_integrity, copy, sort)\u001b[0m\n\u001b[1;32m    442\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mverify_integrity \u001b[38;5;241m=\u001b[39m verify_integrity\n\u001b[1;32m    443\u001b[0m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39mcopy \u001b[38;5;241m=\u001b[39m copy\n\u001b[0;32m--> 445\u001b[0m objs, keys \u001b[38;5;241m=\u001b[39m \u001b[38;5;28;43mself\u001b[39;49m\u001b[38;5;241;43m.\u001b[39;49m\u001b[43m_clean_keys_and_objs\u001b[49m\u001b[43m(\u001b[49m\u001b[43mobjs\u001b[49m\u001b[43m,\u001b[49m\u001b[43m \u001b[49m\u001b[43mkeys\u001b[49m\u001b[43m)\u001b[49m\n\u001b[1;32m    447\u001b[0m \u001b[38;5;66;03m# figure out what our result ndim is going to be\u001b[39;00m\n\u001b[1;32m    448\u001b[0m ndims \u001b[38;5;241m=\u001b[39m \u001b[38;5;28mself\u001b[39m\u001b[38;5;241m.\u001b[39m_get_ndims(objs)\n",
+      "File \u001b[0;32m/opt/homebrew/lib/python3.11/site-packages/pandas/core/reshape/concat.py:541\u001b[0m, in \u001b[0;36m_Concatenator._clean_keys_and_objs\u001b[0;34m(self, objs, keys)\u001b[0m\n\u001b[1;32m    538\u001b[0m         keys \u001b[38;5;241m=\u001b[39m Index(clean_keys, name\u001b[38;5;241m=\u001b[39mname, dtype\u001b[38;5;241m=\u001b[39m\u001b[38;5;28mgetattr\u001b[39m(keys, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mdtype\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;28;01mNone\u001b[39;00m))\n\u001b[1;32m    540\u001b[0m \u001b[38;5;28;01mif\u001b[39;00m \u001b[38;5;28mlen\u001b[39m(objs_list) \u001b[38;5;241m==\u001b[39m \u001b[38;5;241m0\u001b[39m:\n\u001b[0;32m--> 541\u001b[0m     \u001b[38;5;28;01mraise\u001b[39;00m \u001b[38;5;167;01mValueError\u001b[39;00m(\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mAll objects passed were None\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m    543\u001b[0m \u001b[38;5;28;01mreturn\u001b[39;00m objs_list, keys\n",
+      "\u001b[0;31mValueError\u001b[0m: All objects passed were None"
+     ]
+    }
+   ],
    "source": [
     "from sklearn.preprocessing import LabelEncoder, OneHotEncoder, StandardScaler, MinMaxScaler\n",
     "\n",
@@ -578,7 +593,7 @@
     "                transformed_data = _encode_categorical(data[col], encoder)\n",
     "                encoders[col] = encoder\n",
     "                data.drop(columns=[col], inplace=True)\n",
-    "                data = pd.concat([data, transformed_data], axis=1)\n",
+    "                data = pd.concat([data.reset_index(drop=True), transformed_data.reset_index(drop=True)], axis=1)\n",
     "\n",
     "            elif dtype == \"numerical\":\n",
     "                scaler = StandardScaler(with_mean= False, with_std= False)\n",
@@ -588,7 +603,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 12,
+   "execution_count": 13,
    "metadata": {},
    "outputs": [
     {
@@ -616,7 +631,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 13,
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
@@ -637,7 +652,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 14,
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
@@ -663,7 +678,7 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 15,
+   "execution_count": null,
    "metadata": {},
    "outputs": [
     {
diff --git a/src/assets/bias-detection-python-code.tsx b/src/assets/bias-detection-python-code.tsx
@@ -332,7 +332,8 @@ def run():
             'iterations': localIterations,
             'minClusterSize': localClusterSize,
             'performanceMetric': bias_score,
-            'dataType': dataTypeText
+            'dataType': dataTypeText,
+            'higherIsBetter': 'biasAnalysis.higherIsBetter' if higherIsBetter else 'biasAnalysis.lowerIsBetter'
         }
     }))
     setResult(json.dumps({
@@ -375,7 +376,12 @@ def run():
         'defaultIndex': 0,
         'labelKey': 'biasAnalysis.clusterinResults.label',
         'valueKey' : 'biasAnalysis.clusterinResults.valueText',
-        'values': biasInClusters
+        'values': biasInClusters,
+        'params': {
+            'numZeroes': int(numZeros),
+            'totalRecords': int(totalRecords),
+            'clusterCount': clusterCount
+        }
     }))
     setResult(json.dumps({
         'type': 'text',
@@ -402,8 +408,6 @@ def run():
     
     
     decoded_X_test["cluster_label"] = y_test
-
-    # ----
     
     if localDataType == 'numeric':
         test_df["cluster_label"] = y_test
@@ -443,10 +447,6 @@ def run():
         print("The most biased cluster has a significantly higher average bias metric than the rest of the dataset.")
     else:
         print("No significant difference in average bias metric between the most biased cluster and the rest of the dataset.")
-        # setResult(json.dumps({
-        #        'type': 'heading',
-        #        'headingKey': 'biasAnalysis.nodifference.heading',                            
-        #    }))    
 
     setResult(json.dumps({
         'type': 'heading',
@@ -482,12 +482,7 @@ def run():
         charts = []
 
         for i, var in enumerate(variables):
-            
-            #setResult(json.dumps({
-            #    'type': 'heading',
-            #    'headingKey': 'biasAnalysis.distribution.heading',            
-            #    'params': {'variable': var}
-            #}))
+                        
             print(f"means: {var}")
             print(overall_means[var])
             print(means[var])
diff --git a/src/components/BiasSettings.tsx b/src/components/BiasSettings.tsx
@@ -76,7 +76,7 @@ export default function BiasSettings({
         resolver: zodResolver(FormSchema),
         defaultValues: {
             dataType: 'numeric',
-            whichPerformanceMetricValueIsBetter: 'higher',
+            whichPerformanceMetricValueIsBetter: 'lower',
         },
     });
     const [iter, setIter] = useState([10]);
diff --git a/src/components/componentMapper.tsx b/src/components/componentMapper.tsx
@@ -267,6 +267,7 @@ export default function ComponentMapper({
                                         defaultIndex: resultItem.defaultIndex,
                                         labelKey: resultItem.labelKey,
                                         valueKey: resultItem.valueKey,
+                                        params: resultItem.params || {},
                                     }}
                                 />
                             </ErrorBoundary>
diff --git a/src/components/composed-components/ClusterCategoriesDistributionAccordeonContent.tsx b/src/components/composed-components/ClusterCategoriesDistributionAccordeonContent.tsx
@@ -80,7 +80,7 @@ const ClusterCategoriesDistributionAccordeonContent = ({
                                     chart.selectFilterGroup ===
                                         defaultCategory) ||
                                 !chart.selectFilterGroup ? (
-                                    <div className="hideonprint">
+                                    <div className="hideonprint w-full">
                                         <h5
                                             key={index}
                                             className="text-gray-800 font-semibold"
@@ -107,7 +107,7 @@ const ClusterCategoriesDistributionAccordeonContent = ({
                                         />
                                     </div>
                                 ) : null}
-                                <div className="hidden showonprint">
+                                <div className="hidden showonprint overflow-x-hidden">
                                     <h5
                                         key={index}
                                         className="text-gray-800 font-semibold"
diff --git a/src/components/composed-components/ClusterNumericalVariableDistributionAccordeonContent.tsx b/src/components/composed-components/ClusterNumericalVariableDistributionAccordeonContent.tsx
@@ -71,7 +71,7 @@ const ClusterNumericalVariableDistributionAccordeonContent = ({
                                     chart.selectFilterGroup ===
                                         defaultCategory) ||
                                 !chart.selectFilterGroup ? (
-                                    <div className="hideonprint">
+                                    <div className="hideonprint w-full">
                                         <h5
                                             key={chartIndex}
                                             className="text-gray-800 font-semibold"
@@ -91,7 +91,7 @@ const ClusterNumericalVariableDistributionAccordeonContent = ({
                                         />
                                     </div>
                                 ) : null}
-                                <div className="hidden showonprint">
+                                <div className="hidden showonprint overflow-x-hidden">
                                     <h5
                                         key={`SingleBarChart-print-${chartIndex}`}
                                         className="text-gray-800 font-semibold"
diff --git a/src/components/composed-components/TextValueSelect.tsx b/src/components/composed-components/TextValueSelect.tsx
@@ -11,6 +11,7 @@ const TextValueSelect = ({
         defaultIndex: number;
         labelKey: string;
         valueKey: string;
+        params: Record<string, string>;
     };
 }) => {
     const [selectedIndex, setSelectedIndex] = useState<number | null>();
@@ -39,6 +40,7 @@ const TextValueSelect = ({
                     <div>
                         <label className="text-sm font-semibold">
                             {t(data.valueKey, {
+                                ...data.params,
                                 index: selectedIndex ?? data.defaultIndex,
                                 value,
                             })}
diff --git a/src/locales/en.ts b/src/locales/en.ts
@@ -181,7 +181,8 @@ export const en = {
         gaussianCopulaModelTitle: '3. Method: Gaussian Copula model',
         cartModelDescription:
             'The CART (Classification and Regression Trees) method generates synthetic data by learning patterns from real data through a decision tree that splits data into homogeneous groups based on feature values. It predicts averages for numerical data and assigns the most common category for categorical data, using these predictions to create new synthetic points.\n \n {{samples}} synthetic data points are generated.',
-        evaluationOfGeneratedDataTitle: '4. Evaluation of generated synthetic data',
+        evaluationOfGeneratedDataTitle:
+            '4. Evaluation of generated synthetic data',
         distributionsTitle: '4.1 Distributions',
         diagnosticsReportTitle: '4.2. Diagnostic report',
         diagnosticsTitle: 'Diagnostic Results',
@@ -274,11 +275,11 @@ missing data are imputed. For {tooltip:syntheticData.missingDataMCARTooltip}Miss
 - <i class="font-serif">H</i><sub>0</sub>: no difference in bias variable between the most deviating cluster and the rest of the dataset
 - <i class="font-serif">H</i><sub>1</sub>: difference in bias variable between the most deviating cluster and the rest of the dataset
 
-A two-sided t-test is performed to accept or reject <i class="font-serif">H</i><sub>0</sub>:.
+A two-sided t-test is performed to accept or reject <i class="font-serif">H</i><sub>0</sub>:
 
 {tooltip:biasAnalysis.p_valueTooltip}p_value{/tooltip} : {{p_val}} 
         `,
-        p_valueTooltip: `p_value tooltip`,
+        p_valueTooltip: `The p-value is the probability of observing a difference at least as extreme as the one measured, assuming the null hypothesis (H<sub>0</sub>) is true. A commonly used threshold is p≤0.05: a p-value at or below this threshold is deemed sufficiently low to reject H<sub>0</sub> in favor of the alternative hypothesis (H<sub>1</sub>).`,
         dataSetPreview: {
             heading: '1. Preview of data',
         },
@@ -303,6 +304,8 @@ A two-sided t-test is performed to accept or reject <i class="font-serif">H</i><
 In this example, we analyze which group is most adversely affected by the risk prediction algorithm. We do this by applying the clustering algorithm on the dataset previewed below. The column "is_recid" indicates whether a defendant reoffended or not (1: yes, 0: no). The "score_text" column indicates whether a defendant was predicted to reoffend (1: yes, 0: no). The column "false_positive" (FP) represents cases where a defendant was predicted to reoffended by the algorithm, but didn't do so (1: FP, 0: no FP). A preview of the data can be found below. The column "false_positive" is used as the bias variable.
 `,
         },
+        higherIsBetter: 'Higher value of bias variable is better',
+        lowerIsBetter: 'Lower value of bias variable is better',
         parameters: {
             heading: '2. Hyperparameters selected for clustering',
             iterations: 'Number of iterations: {{value}}',
@@ -313,6 +316,7 @@ In this example, we analyze which group is most adversely affected by the risk p
 - Minimal cluster size: {{minClusterSize}}
 - Bias variable: {{performanceMetric}}
 - Data type: {{dataType}}
+- Bias variable interpretation: $t({{higherIsBetter}})
 `,
         },
         distributionOfFeaturesAcrossClustersAccordeonTitle:
@@ -366,7 +370,8 @@ In this example, we analyze which group is most adversely affected by the risk p
 - Number of clusters detected: {{clusterCount}}
             `,
             label: 'Choose cluster to show number of datapoints for',
-            valueText: 'Number of datapoints in cluster {{index}}: {{value}}',
+            valueText:
+                'Number of datapoints in cluster {{index}}: {{value}} / {{totalRecords}}',
         },
         higherAverage: `The most deviating cluster has statistically significant different bias variable than the rest of the dataset.`,
         noSignificance: `No statistically significant difference in bias variable between the most biased cluster and the rest of the dataset.`,
diff --git a/src/locales/nl.ts b/src/locales/nl.ts
@@ -303,7 +303,9 @@ Er wordt een tweezijdige t-toets uitgevoerd om <i class="font-serif">H</i><sub>0
 
 {tooltip:biasAnalysis.p_valueTooltip}p-waarde{/tooltip} : {{p_val}}
         `,
-        p_valueTooltip: `p-waarde tooltip`,
+        p_valueTooltip: `De p-waarde is de kans om een verschil waar te nemen dat minstens zo extreem is als het gemeten verschil, aangenomen dat de nulhypothese (H<sub>0</sub>) waar is. Een veelgebruikte drempelwaarde is p≤0,05: een p-waarde op of onder deze drempel wordt beschouwd als voldoende laag om H<sub>0</sub> te verwerpen en de alternatieve hypothese (H<sub>1</sub>) te accepteren.`,
+        higherIsBetter: 'Hogere waarde van bias variabele is beter',
+        lowerIsBetter: 'Lagere waarde van bias variabele is beter',
         parameters: {
             heading: '2. Geselecteerde hyperparameters',
             iterations: 'Aantal iteraties: {{value}}',
@@ -316,6 +318,7 @@ Er wordt een tweezijdige t-toets uitgevoerd om <i class="font-serif">H</i><sub>0
 - Minimale clustergrootte: {{minClusterSize}}
 - Bias variabele: {{performanceMetric}}
 - Gegevenstype: {{dataType}}
+- Interpretatie van bias variabele: $t({{higherIsBetter}})
 `,
         },
         distribution: {
@@ -365,7 +368,8 @@ Er wordt een tweezijdige t-toets uitgevoerd om <i class="font-serif">H</i><sub>0
 - Aantal gevonden clusters: {{clusterCount}}
             `,
             label: 'Kies cluster om het aantal datapunten voor weer te geven',
-            valueText: 'Aantal datapunten in cluster {{index}}: {{value}}',
+            valueText:
+                'Aantal datapunten in cluster {{index}}: {{value}} / {{totalRecords}}',
         },
         higherAverage: `Het meest afwijkende cluster heeft statistisch significant andere bias variabele dan de rest van de dataset.`,
         noSignificance: `Het meest afwijkende cluster heeft statistisch significant geen andere bias variabele dan de rest van de dataset.`,