New notebooks

boireauromain-collab · boireauromain-collab · commit fa38e8f45438 · 2025-11-15T14:43:05.000-05:00
diff --git a/.gitignore b/.gitignore
@@ -9,4 +9,5 @@ lab*.ipynb
 # virtual environments
 .venv/
 myenv/
-2017.csv
+2017.csv
+airlines.csv
diff --git a/Project_1.ipynb b/Project_1.ipynb
@@ -0,0 +1,190 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "id": "b4a01b39",
+   "metadata": {},
+   "source": [
+    "# Project 1"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "1cc24e93",
+   "metadata": {},
+   "source": [
+    "For this project, we will be looking at F1 data. More specifically, team data. \n",
+    "\n",
+    "We will be looking at the mode, median and average number of laps completed during the qualifying sessions. \n",
+    "\n",
+    "We will be looking at a consolidated dataset including qualifying sessions from 2022 to 2025."
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "ed9d198c",
+   "metadata": {},
+   "source": [
+    "# Let me merge the 4 years of data to have a big enough dataset"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "id": "2f86d349",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Step 1: stack the per-season qualifying files into one table.\n",
+    "\n",
+    "import pandas as pd\n",
+    "\n",
+    "years = [2022, 2023, 2024, 2025]\n",
+    "\n",
+    "# Tag each season's rows with a `season` column so the source year survives the merge.\n",
+    "season_frames = [\n",
+    "    pd.read_csv(f\"{season}.csv\").assign(season=season)\n",
+    "    for season in years\n",
+    "]\n",
+    "\n",
+    "# ignore_index=True renumbers the rows 0..n-1 across all seasons.\n",
+    "qual = pd.concat(season_frames, ignore_index=True)\n",
+    "qual.to_csv(\"f1_qualifying_2022_2025.csv\", index=False)\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "d858a645",
+   "metadata": {},
+   "source": [
+    "# Average of laps done in qualifying across all seasons"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "id": "c8485d2d",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "15.943181818181818\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Step 2: mean of the Laps column over the merged 2022-2025 file.\n",
+    "import pandas as pd\n",
+    "\n",
+    "df = pd.read_csv(\"f1_qualifying_2022_2025.csv\")\n",
+    "\n",
+    "# Pull the column out first, then average it.\n",
+    "laps_column = df[\"Laps\"]\n",
+    "avg_laps = laps_column.mean()\n",
+    "print(avg_laps)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "4ac17b31",
+   "metadata": {},
+   "source": [
+    "# The median now"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "61d744bd",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Step 3: median of the Laps column over the merged 2022-2025 file.\n",
+    "import pandas as pd\n",
+    "\n",
+    "df = pd.read_csv(\"f1_qualifying_2022_2025.csv\")\n",
+    "\n",
+    "# Series.median() returns the middle value and skips missing entries by default.\n",
+    "median_laps = df[\"Laps\"].median()\n",
+    "print(median_laps)\n",
+    "\n",
+    "# Note: this assumes every entry in Laps is numeric. If the column ever contains\n",
+    "# text, coerce it first:\n",
+    "#   pd.to_numeric(df[\"Laps\"], errors=\"coerce\").median()"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "15a68fe0",
+   "metadata": {},
+   "source": [
+    "# Mode"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "id": "51205acc",
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "0    15.0\n",
+      "Name: Laps, dtype: float64\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Step 4: most frequent value(s) in the Laps column.\n",
+    "import pandas as pd\n",
+    "\n",
+    "df = pd.read_csv(\"f1_qualifying_2022_2025.csv\")\n",
+    "\n",
+    "# Series.mode() returns a Series because several values can tie for most frequent.\n",
+    "laps_column = df[\"Laps\"]\n",
+    "mode_laps = laps_column.mode()\n",
+    "print(mode_laps)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "id": "87e45682",
+   "metadata": {},
+   "source": [
+    "# Now the hard way: average, median, mode"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "id": "08ee701f",
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import csv\n",
+    "\n",
+    "# Read the Laps column by hand and keep only cells that hold a value.\n",
+    "# Blank cells are skipped so they do not count towards any statistic.\n",
+    "laps = []\n",
+    "with open(\"f1_qualifying_2022_2025.csv\", \"r\", newline=\"\") as f1:\n",
+    "    for row in csv.DictReader(f1):\n",
+    "        cell = (row.get(\"Laps\") or \"\").strip()\n",
+    "        if cell:\n",
+    "            laps.append(float(cell))\n",
+    "\n",
+    "if not laps:\n",
+    "    raise ValueError(\"No lap counts found in the Laps column\")\n",
+    "\n",
+    "# Average: sum of all values divided by how many there are.\n",
+    "hard_mean = sum(laps) / len(laps)\n",
+    "\n",
+    "# Median: middle value of the sorted list (mean of the two middle values when the count is even).\n",
+    "ordered = sorted(laps)\n",
+    "middle = len(ordered) // 2\n",
+    "if len(ordered) % 2:\n",
+    "    hard_median = ordered[middle]\n",
+    "else:\n",
+    "    hard_median = (ordered[middle - 1] + ordered[middle]) / 2\n",
+    "\n",
+    "# Mode: count each value, then keep every value that reaches the highest count.\n",
+    "counts = {}\n",
+    "for value in laps:\n",
+    "    counts[value] = counts.get(value, 0) + 1\n",
+    "top_count = max(counts.values())\n",
+    "hard_modes = sorted(value for value, count in counts.items() if count == top_count)\n",
+    "\n",
+    "print(f\"Average: {hard_mean}\")\n",
+    "print(f\"Median: {hard_median}\")\n",
+    "print(f\"Mode: {hard_modes}\")"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": ".venv",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.13.7"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 5
+}
diff --git a/Project_2.ipynb b/Project_2.ipynb
diff --git a/_toc.yml b/_toc.yml
@@ -1,4 +1,6 @@
 format: jb-book
 root: index
 chapters:
-  - file: lecture_16_example
+  - file: lecture_16_example
+  - file: Project_1
+  - file: Project_2