Skip to content

Commit 8920c3c

Browse files
authored
Merge pull request #84 from NGO-Algorithm-Audit/JFP_edits
Added original COMPAS dataset again and changed categorical encoder t…
2 parents be105a4 + 6a87c84 commit 8920c3c

File tree

2 files changed: +7289 additions, -74 deletions (lines changed)

2 files changed: +7289 additions, -74 deletions (lines changed)

notebooks/unsupervised bias detection tool/COMPAS_FP.ipynb

Lines changed: 74 additions & 74 deletions
Original file line number | Diff line number | Diff line change
@@ -597,7 +597,7 @@
597597
},
598598
{
599599
"cell_type": "code",
600-
"execution_count": 6,
600+
"execution_count": 5,
601601
"metadata": {},
602602
"outputs": [
603603
{
@@ -633,100 +633,100 @@
633633
" <tbody>\n",
634634
" <tr>\n",
635635
" <th>0</th>\n",
636-
" <td>1.0</td>\n",
637-
" <td>1.0</td>\n",
638-
" <td>5.0</td>\n",
639-
" <td>0.0</td>\n",
640-
" <td>0.0</td>\n",
641-
" <td>0.0</td>\n",
642-
" <td>0.0</td>\n",
636+
" <td>1</td>\n",
637+
" <td>1</td>\n",
638+
" <td>5</td>\n",
639+
" <td>0</td>\n",
640+
" <td>0</td>\n",
641+
" <td>0</td>\n",
642+
" <td>0</td>\n",
643643
" </tr>\n",
644644
" <tr>\n",
645645
" <th>1</th>\n",
646-
" <td>0.0</td>\n",
647-
" <td>1.0</td>\n",
648-
" <td>0.0</td>\n",
649-
" <td>0.0</td>\n",
650-
" <td>1.0</td>\n",
651-
" <td>0.0</td>\n",
652-
" <td>0.0</td>\n",
646+
" <td>0</td>\n",
647+
" <td>1</td>\n",
648+
" <td>0</td>\n",
649+
" <td>0</td>\n",
650+
" <td>1</td>\n",
651+
" <td>0</td>\n",
652+
" <td>0</td>\n",
653653
" </tr>\n",
654654
" <tr>\n",
655655
" <th>2</th>\n",
656-
" <td>2.0</td>\n",
657-
" <td>1.0</td>\n",
658-
" <td>0.0</td>\n",
659-
" <td>0.0</td>\n",
660-
" <td>1.0</td>\n",
661-
" <td>0.0</td>\n",
662-
" <td>0.0</td>\n",
656+
" <td>2</td>\n",
657+
" <td>1</td>\n",
658+
" <td>0</td>\n",
659+
" <td>0</td>\n",
660+
" <td>1</td>\n",
661+
" <td>0</td>\n",
662+
" <td>0</td>\n",
663663
" </tr>\n",
664664
" <tr>\n",
665665
" <th>3</th>\n",
666-
" <td>2.0</td>\n",
667-
" <td>1.0</td>\n",
668-
" <td>0.0</td>\n",
669-
" <td>0.0</td>\n",
670-
" <td>0.0</td>\n",
671-
" <td>1.0</td>\n",
672-
" <td>1.0</td>\n",
666+
" <td>2</td>\n",
667+
" <td>1</td>\n",
668+
" <td>0</td>\n",
669+
" <td>0</td>\n",
670+
" <td>0</td>\n",
671+
" <td>1</td>\n",
672+
" <td>1</td>\n",
673673
" </tr>\n",
674674
" <tr>\n",
675675
" <th>4</th>\n",
676-
" <td>0.0</td>\n",
677-
" <td>1.0</td>\n",
678-
" <td>5.0</td>\n",
679-
" <td>0.0</td>\n",
680-
" <td>0.0</td>\n",
681-
" <td>0.0</td>\n",
682-
" <td>0.0</td>\n",
676+
" <td>0</td>\n",
677+
" <td>1</td>\n",
678+
" <td>5</td>\n",
679+
" <td>0</td>\n",
680+
" <td>0</td>\n",
681+
" <td>0</td>\n",
682+
" <td>0</td>\n",
683683
" </tr>\n",
684684
" </tbody>\n",
685685
"</table>\n",
686686
"</div>"
687687
],
688688
"text/plain": [
689689
" age_cat sex race c_charge_degree is_recid score_text false_positive\n",
690-
"0 1.0 1.0 5.0 0.0 0.0 0.0 0.0\n",
691-
"1 0.0 1.0 0.0 0.0 1.0 0.0 0.0\n",
692-
"2 2.0 1.0 0.0 0.0 1.0 0.0 0.0\n",
693-
"3 2.0 1.0 0.0 0.0 0.0 1.0 1.0\n",
694-
"4 0.0 1.0 5.0 0.0 0.0 0.0 0.0"
690+
"0 1 1 5 0 0 0 0\n",
691+
"1 0 1 0 0 1 0 0\n",
692+
"2 2 1 0 0 1 0 0\n",
693+
"3 2 1 0 0 0 1 1\n",
694+
"4 0 1 5 0 0 0 0"
695695
]
696696
},
697-
"execution_count": 6,
697+
"execution_count": 5,
698698
"metadata": {},
699699
"output_type": "execute_result"
700700
}
701701
],
702702
"source": [
703703
"# Apply OrdinalEncoder to the categorical columns\n",
704704
"encoder = OrdinalEncoder()\n",
705-
"filtered_df[filtered_df.columns] = encoder.fit_transform(filtered_df)\n",
705+
"filtered_df[filtered_df.columns] = encoder.fit_transform(filtered_df).astype(\"uint32\")\n",
706706
"\n",
707707
"# Display the transformed DataFrame\n",
708708
"filtered_df.head()"
709709
]
710710
},
711711
{
712712
"cell_type": "code",
713-
"execution_count": 7,
713+
"execution_count": 6,
714714
"metadata": {},
715715
"outputs": [
716716
{
717717
"data": {
718718
"text/plain": [
719-
"age_cat float64\n",
720-
"sex float64\n",
721-
"race float64\n",
722-
"c_charge_degree float64\n",
723-
"is_recid float64\n",
724-
"score_text float64\n",
725-
"false_positive float64\n",
719+
"age_cat uint32\n",
720+
"sex uint32\n",
721+
"race uint32\n",
722+
"c_charge_degree uint32\n",
723+
"is_recid uint32\n",
724+
"score_text uint32\n",
725+
"false_positive uint32\n",
726726
"dtype: object"
727727
]
728728
},
729-
"execution_count": 7,
729+
"execution_count": 6,
730730
"metadata": {},
731731
"output_type": "execute_result"
732732
}
@@ -737,7 +737,7 @@
737737
},
738738
{
739739
"cell_type": "code",
740-
"execution_count": null,
740+
"execution_count": 7,
741741
"metadata": {},
742742
"outputs": [
743743
{
@@ -767,7 +767,7 @@
767767
},
768768
{
769769
"cell_type": "code",
770-
"execution_count": 9,
770+
"execution_count": 8,
771771
"metadata": {},
772772
"outputs": [
773773
{
@@ -787,7 +787,7 @@
787787
},
788788
{
789789
"cell_type": "code",
790-
"execution_count": 10,
790+
"execution_count": 9,
791791
"metadata": {},
792792
"outputs": [
793793
{
@@ -845,7 +845,7 @@
845845
},
846846
{
847847
"cell_type": "code",
848-
"execution_count": null,
848+
"execution_count": 10,
849849
"metadata": {},
850850
"outputs": [
851851
{
@@ -896,7 +896,7 @@
896896
},
897897
{
898898
"cell_type": "code",
899-
"execution_count": 12,
899+
"execution_count": 11,
900900
"metadata": {},
901901
"outputs": [
902902
{
@@ -1331,7 +1331,7 @@
13311331
"BiasAwareHierarchicalKModes(bahc_max_iter=20, bahc_min_cluster_size=57.71)"
13321332
]
13331333
},
1334-
"execution_count": 12,
1334+
"execution_count": 11,
13351335
"metadata": {},
13361336
"output_type": "execute_result"
13371337
}
@@ -1344,7 +1344,7 @@
13441344
},
13451345
{
13461346
"cell_type": "code",
1347-
"execution_count": 13,
1347+
"execution_count": 12,
13481348
"metadata": {},
13491349
"outputs": [
13501350
{
@@ -1353,7 +1353,7 @@
13531353
"5"
13541354
]
13551355
},
1356-
"execution_count": 13,
1356+
"execution_count": 12,
13571357
"metadata": {},
13581358
"output_type": "execute_result"
13591359
}
@@ -1365,7 +1365,7 @@
13651365
},
13661366
{
13671367
"cell_type": "code",
1368-
"execution_count": 14,
1368+
"execution_count": 13,
13691369
"metadata": {},
13701370
"outputs": [
13711371
{
@@ -1374,7 +1374,7 @@
13741374
"array([ 0.05290941, -0.02457072, -0.04827102, -0.04888889, -0.05093596])"
13751375
]
13761376
},
1377-
"execution_count": 14,
1377+
"execution_count": 13,
13781378
"metadata": {},
13791379
"output_type": "execute_result"
13801380
}
@@ -1386,7 +1386,7 @@
13861386
},
13871387
{
13881388
"cell_type": "code",
1389-
"execution_count": 15,
1389+
"execution_count": 14,
13901390
"metadata": {},
13911391
"outputs": [
13921392
{
@@ -1417,7 +1417,7 @@
14171417
},
14181418
{
14191419
"cell_type": "code",
1420-
"execution_count": 16,
1420+
"execution_count": 15,
14211421
"metadata": {},
14221422
"outputs": [
14231423
{
@@ -1426,7 +1426,7 @@
14261426
"array([0, 0, 4, ..., 0, 0, 1], dtype=uint32)"
14271427
]
14281428
},
1429-
"execution_count": 16,
1429+
"execution_count": 15,
14301430
"metadata": {},
14311431
"output_type": "execute_result"
14321432
}
@@ -1439,7 +1439,7 @@
14391439
},
14401440
{
14411441
"cell_type": "code",
1442-
"execution_count": 17,
1442+
"execution_count": 16,
14431443
"metadata": {},
14441444
"outputs": [
14451445
{
@@ -1618,7 +1618,7 @@
16181618
"[1443 rows x 7 columns]"
16191619
]
16201620
},
1621-
"execution_count": 17,
1621+
"execution_count": 16,
16221622
"metadata": {},
16231623
"output_type": "execute_result"
16241624
}
@@ -1642,7 +1642,7 @@
16421642
},
16431643
{
16441644
"cell_type": "code",
1645-
"execution_count": 18,
1645+
"execution_count": 17,
16461646
"metadata": {},
16471647
"outputs": [
16481648
{
@@ -1752,7 +1752,7 @@
17521752
"4 0 0 0 "
17531753
]
17541754
},
1755-
"execution_count": 18,
1755+
"execution_count": 17,
17561756
"metadata": {},
17571757
"output_type": "execute_result"
17581758
}
@@ -1776,7 +1776,7 @@
17761776
},
17771777
{
17781778
"cell_type": "code",
1779-
"execution_count": 19,
1779+
"execution_count": 18,
17801780
"metadata": {},
17811781
"outputs": [],
17821782
"source": [
@@ -1787,7 +1787,7 @@
17871787
},
17881788
{
17891789
"cell_type": "code",
1790-
"execution_count": 20,
1790+
"execution_count": 19,
17911791
"metadata": {},
17921792
"outputs": [
17931793
{
@@ -1842,7 +1842,7 @@
18421842
},
18431843
{
18441844
"cell_type": "code",
1845-
"execution_count": 21,
1845+
"execution_count": 20,
18461846
"metadata": {},
18471847
"outputs": [
18481848
{
@@ -1906,7 +1906,7 @@
19061906
},
19071907
{
19081908
"cell_type": "code",
1909-
"execution_count": 22,
1909+
"execution_count": 21,
19101910
"metadata": {
19111911
"vscode": {
19121912
"languageId": "ruby"
@@ -1970,7 +1970,7 @@
19701970
},
19711971
{
19721972
"cell_type": "code",
1973-
"execution_count": 23,
1973+
"execution_count": 22,
19741974
"metadata": {
19751975
"vscode": {
19761976
"languageId": "ruby"

0 commit comments

Comments
 (0)