Updated stats #218

dpuenteramirez · dpuenteramirez · commit 6d541fee86aa · 2022-05-11T23:14:32.000+02:00
diff --git a/experimentation/rank_statistics.ipynb b/experimentation/rank_statistics.ipynb
@@ -15,54 +15,74 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 209,
+   "execution_count": 9,
+   "metadata": {
+    "collapsed": false,
+    "pycharm": {
+     "name": "#%%\n"
+    }
+   },
    "outputs": [],
    "source": [
     "import os.path\n",
     "import scipy.stats\n",
     "from itertools import product\n",
     "import pandas as pd\n",
     "import numpy as np"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 42,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "np.set_printoptions(formatter={'float_kind': \"{:6.3f}\".format})\n",
+    "#np.set_printoptions(precision=4)\n",
+    "RED='\\033[0;31m'\n",
+    "GRN='\\033[0;32m'\n",
+    "NC='\\033[0m'\n",
+    "BLD='\\033[1m'"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 210,
+   },
    "outputs": [],
    "source": [
     "metric = 'f1-score'\n",
     "results = os.path.join('ranks', 'results.csv')"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 211,
+   },
    "outputs": [],
    "source": [
     "results_df = pd.read_csv(results)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 12,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 212,
+   },
    "outputs": [
     {
      "name": "stdout",
@@ -86,17 +106,17 @@
     "print(f\"Filters used: {filters}\")\n",
     "print(f\"Percents labeled used: {percents_labeled}\")\n",
     "print(f\"# Datasets used: {len(datasets)}\")\n"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 13,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 213,
+   },
    "outputs": [
     {
      "name": "stdout",
@@ -127,17 +147,17 @@
     "\n",
     "bases_filters = np.array(list(product(base_estimators, filters)))\n",
     "print(\"Pairs of base estimator with filters:\\n\", bases_filters)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 14,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 214,
+   },
    "outputs": [
     {
      "name": "stdout",
@@ -175,17 +195,17 @@
    ],
    "source": [
     "print(grouped_df)"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 15,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 215,
+   },
    "outputs": [],
    "source": [
     "def base_filter_values():\n",
@@ -208,17 +228,26 @@
     "def split_onto_base_estimators():\n",
     "    for base_ in base_estimators:\n",
     "        base_dfs.append(curr_vals.filter(regex=base_))"
-   ],
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 24,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "data = []"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 40,
    "metadata": {
     "collapsed": false,
     "pycharm": {
      "name": "#%%\n"
     }
-   }
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 216,
+   },
    "outputs": [
     {
      "name": "stdout",
@@ -368,6 +397,7 @@
     }
    ],
    "source": [
+    "data = []\n",
     "for percent in percents_labeled:\n",
     "    curr_vals = base_filter_values()\n",
     "\n",
@@ -392,36 +422,139 @@
     "                                              value in zip(df.columns,\n",
     "                                                           average_ranks)}\n",
     "        print()\n",
-    "        for k, v in average_rank_for.items():\n",
-    "            print(k, f'{v:.2f}')\n"
-   ],
-   "metadata": {
-    "collapsed": false,
-    "pycharm": {
-     "name": "#%%\n"
+    "        for key, value in average_rank_for.items():\n",
+    "            print(key, f'{value:.2f}')\n",
+    "            \n",
+    "            \n",
+    "        part0 = (12*N)/(k*(k+1))\n",
+    "        part1 = sum([Rj**2 for Rj in average_ranks])\n",
+    "        part2 = (k*(k+1)**2)/4     \n",
+    "        𝛘2_F = part0*(part1-part2)\n",
+    "        F_F = (N-1)*𝛘2_F/(N*(k-1)-𝛘2_F)\n",
+    "        \n",
+    "        data.append([percent, F_F, average_rank_for, N, k])  "
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Iman and Davenport\n",
+    "$F_F = \\frac{(N-1)\\,\\chi^2_F}{N(k-1)-\\chi^2_F}$"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "https://www.statology.org/f-distribution-calculator/\n",
+    "\n",
+    "With 3 classifiers, 3 filters and the base one, and 18 data sets, $F_F$ is distributed according to the $F$ distribution with\n",
+    "$7-1=6$ and $(7-1)\\times(18-1)=102$ degrees of freedom. The critical value of $F(6,102)$ for $\\alpha=0.05$\n",
+    "is approximately $2.19$, so we reject the null hypothesis whenever the computed $F_F$ exceeds this value."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": []
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 43,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.359) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (1.84) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;32mWe reject the null-hypothesis, as the F_F value (3.15) is greater than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (1.12) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.277) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;32mWe reject the null-hypothesis, as the F_F value (3.4) is greater than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.452) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.475) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.106) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.814) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (2.56) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.277) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.321) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (1.19) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.906) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.452) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (1.19) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (1.71) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.25) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (0.364) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n",
+      "\u001b[0;31mWe CAN NOT reject the null-hypothesis, as the F_F value (2.21) is less than the critical value (2.79)\n",
+      "\u001b[1mThat means that there are not statistically differences between classifiers\u001b[0m\n"
+     ]
     }
-   }
+   ],
+   "source": [
+    "# Using critical values\n",
+    "# FROM: https://stackoverflow.com/questions/39813470/f-test-with-python-finding-the-critical-value\n",
+    "# SEE ALSO: https://www.statology.org/f-critical-value-python/\n",
+    "alpha = 0.05\n",
+    "for percent, F_F, average_rank_for, N, k in data:\n",
+    "    critical_value = scipy.stats.f.ppf(q=1-alpha, dfn=(k-1), dfd=(k-1)*(N-1))\n",
+    "\n",
+    "    if F_F > critical_value:\n",
+    "        print(f\"{GRN}We reject the null-hypothesis, as the F_F value ({F_F:.3}) is greater than the critical value ({critical_value:.3})\")\n",
+    "        print(f\"{BLD}That means that there are statistically differences between classifiers{NC}\")\n",
+    "    else:\n",
+    "        print(f\"{RED}We CAN NOT reject the null-hypothesis, as the F_F value ({F_F:.3}) is less than the critical value ({critical_value:.3})\")\n",
+    "        print(f\"{BLD}That means that there are not statistically differences between classifiers{NC}\")\n",
+    "        #print(f\"Or that the test is not powerfull enough to detect the differences\")\n"
+   ]
   }
  ],
  "metadata": {
+  "interpreter": {
+   "hash": "ddbf58beb0ceb3f28487c8a8d7192b043471fe4d33849d20361912ddb46861bb"
+  },
   "kernelspec": {
-   "display_name": "Python 3",
+   "display_name": "Python 3.9.12 ('IS-SSL')",
    "language": "python",
    "name": "python3"
   },
   "language_info": {
    "codemirror_mode": {
     "name": "ipython",
-    "version": 2
+    "version": 3
    },
    "file_extension": ".py",
    "mimetype": "text/x-python",
    "name": "python",
    "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython2",
-   "version": "2.7.6"
+   "pygments_lexer": "ipython3",
+   "version": "3.9.12"
   }
  },
  "nbformat": 4,
  "nbformat_minor": 0
-}
+}