fix: tutorial file restored

bayo-ibm · bayo-ibm · commit caa5b2f920ae · 2025-07-17T15:49:00.000Z
Signed-off-by: omobayode.fagbohungbe <omobayode.fagbohungbe@ibm.com>
diff --git a/tutorials/quantization_tutorial.ipynb b/tutorials/quantization_tutorial.ipynb
@@ -162,7 +162,7 @@
     "\n",
     "# Plotting the histogram.\n",
     "plt.figure(figsize=(16, 10))\n",
-    "plt.hist(raw_data, density=True, bins=128, alpha=0.8, label=\"y\")\n",
+    "plt.hist(raw_data, density=True, bins=128, alpha=0.8, label='y')\n",
     "#plt.legend(loc='upper right')\n",
     "plt.xlabel(\"Data\")\n",
     "plt.ylabel(\"density\")\n",
@@ -220,9 +220,9 @@
     "isClipped=np.logical_or(raw_data>clip_max, raw_data<clip_min)\n",
     "idx_clipped_elements=np.where( isClipped )[0]\n",
     "pd.DataFrame( \n",
-    "                {\"idx\":idx_clipped_elements[:5], \n",
-    "                \"raw\": raw_data[ idx_clipped_elements[:5] ],\n",
-    "                \"clipped\": clipped_data[idx_clipped_elements[:5]] }\n",
+    "                {'idx':idx_clipped_elements[:5], \n",
+    "                'raw': raw_data[ idx_clipped_elements[:5] ],\n",
+    "                'clipped': clipped_data[idx_clipped_elements[:5]] }\n",
     "            )"
    ]
   },
@@ -236,8 +236,8 @@
     "# Plot the distribution and the clipped data to visualize\n",
     "\n",
     "plt.figure(figsize=(16, 10))\n",
-    "plt.hist(raw_data,     density=True, bins=64, label=\"y (raw values)\", histtype=\"step\", linewidth=3.5),\n",
-    "plt.hist(clipped_data, density=True, bins=64, color=[\"#33b1ff\"], alpha=0.8,label=\"y_clamp (clipped edges)\"), \n",
+    "plt.hist(raw_data,     density=True, bins=64, label=\"y (raw values)\", histtype='step', linewidth=3.5),\n",
+    "plt.hist(clipped_data, density=True, bins=64, color=['#33b1ff'], alpha=0.8,label=\"y_clamp (clipped edges)\"), \n",
     "plt.legend(fancybox=True, ncol=2)\n",
     "plt.xlabel(\"Data\")\n",
     "plt.ylabel(\"density\")\n",
@@ -294,10 +294,10 @@
    "outputs": [],
    "source": [
     "plt.figure(figsize=(16, 10))\n",
-    "plt.hist(raw_data, density=True, bins=64, alpha=0.8,label=\"y (raw values)\", histtype=\"step\", linewidth=3.5)\n",
-    "plt.hist(y_scaled, density=True,  bins=64, color=[\"#33b1ff\"], alpha=0.6,label=\"scale+shift\")\n",
-    "plt.hist(y_int,    density=True,  bins=64, color=[\"#007d79\"],alpha=0.8,label=\"quantize\")\n",
-    "plt.legend(loc=\"upper left\", fancybox=True, ncol=3)\n",
+    "plt.hist(raw_data, density=True, bins=64, alpha=0.8,label=\"y (raw values)\", histtype='step', linewidth=3.5)\n",
+    "plt.hist(y_scaled, density=True,  bins=64, color=['#33b1ff'], alpha=0.6,label=\"scale+shift\")\n",
+    "plt.hist(y_int,    density=True,  bins=64, color=['#007d79'],alpha=0.8,label=\"quantize\")\n",
+    "plt.legend(loc='upper left', fancybox=True, ncol=3)\n",
     "plt.xlabel(\"Data\")\n",
     "plt.ylabel(\"density\")\n",
     "#plt.yscale('log')\n",
@@ -340,8 +340,8 @@
     "yq = y_int * stepsize + zp\n",
     "\n",
     "plt.figure(figsize=(16, 10))\n",
-    "plt.hist(raw_data, density=True, bins=64, label=\"original y\", histtype=\"step\", linewidth=2.5)#alpha=0.8,\n",
-    "plt.hist(yq,       density=True, color=[\"#33b1ff\"], bins=64, label=\"quantized y\")#alpha=0.7,\n",
+    "plt.hist(raw_data, density=True, bins=64, label=\"original y\", histtype='step', linewidth=2.5)#alpha=0.8,\n",
+    "plt.hist(yq,       density=True, color=['#33b1ff'], bins=64, label=\"quantized y\")#alpha=0.7,\n",
     "plt.legend(fancybox=True, ncol=2)\n",
     "plt.xlabel(\"Data\")\n",
     "plt.ylabel(\"density\")\n",
@@ -367,15 +367,15 @@
    "source": [
     "plt.subplots(3,1, figsize=(16, 12), sharex=True)\n",
     "\n",
-    "arstyle=dict(facecolor=\"C1\",alpha=0.5, shrink=0.05)\n",
+    "arstyle=dict(facecolor='C1',alpha=0.5, shrink=0.05)\n",
     "\n",
     "n_bit = 4\n",
     "clip_min, clip_max = -2.5, 2.5\n",
     "asym_raw_data = np.abs(raw_data)\n",
-    "for i, (raw_i, lbl_i) in enumerate([(raw_data, \"Case 1: sym data, sym Q\"), \n",
-    "                                    (asym_raw_data, \"Case 2: asym data, asym Q\"),\n",
-    "                                    (asym_raw_data, \"Case 3: asym data sym Q\") ]):\n",
-    "    if \"asym Q\" in lbl_i:\n",
+    "for i, (raw_i, lbl_i) in enumerate([(raw_data, 'Case 1: sym data, sym Q'), \n",
+    "                                    (asym_raw_data, 'Case 2: asym data, asym Q'),\n",
+    "                                    (asym_raw_data, 'Case 3: asym data sym Q') ]):\n",
+    "    if 'asym Q' in lbl_i:\n",
     "        # asym quantization for range [0, clip_max]\n",
     "        clip_min_i = np.min(raw_i)\n",
     "        nbins = 2**n_bit -1\n",
@@ -396,13 +396,13 @@
     "    max_bin_i = np.round( (clip_max-zp)/scale)*scale + zp\n",
     "\n",
     "    plt.subplot(311+i)\n",
-    "    plt.hist(raw_i, density=False, bins=64, label=\"original y\", histtype=\"step\", linewidth=2.5)\n",
-    "    plt.hist(yq_i,  density=False, color=[\"#33b1ff\"], bins=64, label=\"y_q\")\n",
+    "    plt.hist(raw_i, density=False, bins=64, label=\"original y\", histtype='step', linewidth=2.5)\n",
+    "    plt.hist(yq_i,  density=False, color=['#33b1ff'], bins=64, label='y_q')\n",
     "    plt.legend(fancybox=True, ncol=2, fontsize=14)\n",
     "\n",
     "    plt.ylabel(\"Count\")\n",
-    "    plt.annotate(\"upper clip bound\", xy=(max_bin_i, 0), xytext=(max_bin_i, 1e5), arrowprops=arstyle)    \n",
-    "    plt.annotate(\"lower clip bound\", xy=(clip_min_i, 0), xytext=(clip_min_i, 1e5), arrowprops=arstyle)    \n",
+    "    plt.annotate('upper clip bound', xy=(max_bin_i, 0), xytext=(max_bin_i, 1e5), arrowprops=arstyle)    \n",
+    "    plt.annotate('lower clip bound', xy=(clip_min_i, 0), xytext=(clip_min_i, 1e5), arrowprops=arstyle)    \n",
     "    plt.title(lbl_i)\n",
     "\n",
     "plt.tight_layout()\n",
@@ -478,9 +478,9 @@
     "# Generate 1 sample\n",
     "input = torch.randn(N,C,H,W)\n",
     "\n",
-    "print(\"Input Shape: \", input.shape)\n",
-    "print(\"Number of unique input values: \", input.detach().unique().size()[0])\n",
-    "print(f\"Expected: {N * C * H * W} (Based on randomly generated values for shape {N} x {C} x {H} x {W})\")"
+    "print('Input Shape: ', input.shape)\n",
+    "print('Number of unique input values: ', input.detach().unique().size()[0])\n",
+    "print(f'Expected: {N * C * H * W} (Based on randomly generated values for shape {N} x {C} x {H} x {W})')"
    ]
   },
   {
@@ -508,9 +508,9 @@
     "# Quantize the input data\n",
     "input_quant = simpleQuantizer(input, n_bit, clip_min, clip_max)\n",
     "\n",
-    "print(\"Quantized input Shape: \", input_quant.shape)\n",
-    "print(\"Number of unique quantized input values: \", input_quant.detach().unique().size()[0])\n",
-    "print(f\"Expected: {2 ** n_bit} (Based on 2 ^ {n_bit})\")"
+    "print('Quantized input Shape: ', input_quant.shape)\n",
+    "print('Number of unique quantized input values: ', input_quant.detach().unique().size()[0])\n",
+    "print(f'Expected: {2 ** n_bit} (Based on 2 ^ {n_bit})')"
    ]
   },
   {
@@ -577,9 +577,9 @@
     "# ignore bias for now \n",
     "net.conv.bias = torch.nn.Parameter(bias)\n",
     "\n",
-    "print(\"Weight Shape: \", weight.shape)\n",
-    "print(\"Number of unique weight values: \", weight.detach().unique().size()[0])\n",
-    "print(f\"Expected: {weight.numel()} (Based on randomly generated values for shape {weight.shape[0]} x {weight.shape[1]} x {weight.shape[2]} x {weight.shape[3]})\")"
+    "print('Weight Shape: ', weight.shape)\n",
+    "print('Number of unique weight values: ', weight.detach().unique().size()[0])\n",
+    "print(f'Expected: {weight.numel()} (Based on randomly generated values for shape {weight.shape[0]} x {weight.shape[1]} x {weight.shape[2]} x {weight.shape[3]})')"
    ]
   },
   {
@@ -605,10 +605,10 @@
     "# Quantize the weights (similar to input)\n",
     "weight_quant = simpleQuantizer(weight, n_bit, clip_min, clip_max)\n",
     "\n",
-    "print(\"Quantized weight Shape: \", weight_quant.shape)\n",
-    "print(\"Number of unique quantized weight values: \", weight_quant.detach().unique().size()[0])\n",
-    "print(f\"Expected: {2 ** n_bit} (Based on 2 ^ {n_bit})\")\n",
-    "print(\"First Channel of Quantized Weight\", weight_quant[0])\n"
+    "print('Quantized weight Shape: ', weight_quant.shape)\n",
+    "print('Number of unique quantized weight values: ', weight_quant.detach().unique().size()[0])\n",
+    "print(f'Expected: {2 ** n_bit} (Based on 2 ^ {n_bit})')\n",
+    "print('First Channel of Quantized Weight', weight_quant[0])\n"
    ]
   },
   {
@@ -635,9 +635,9 @@
     "# Generate quantized output y, NOTE, this net is currently using non-quantized weight \n",
     "y_quant = net(input_quant)\n",
     "\n",
-    "print(\"Number of unique output values: \", y.detach().unique().size()[0])\n",
-    "print(\"Expected maximum unique output values: \", y.flatten().size()[0])\n",
-    "print(\"Number of unique quantized output values: \", y_quant.detach().unique().size()[0])\n"
+    "print('Number of unique output values: ', y.detach().unique().size()[0])\n",
+    "print('Expected maximum unique output values: ', y.flatten().size()[0])\n",
+    "print('Number of unique quantized output values: ', y_quant.detach().unique().size()[0])\n"
    ]
   },
   {
@@ -662,26 +662,26 @@
    "outputs": [],
    "source": [
     "def PlotAndCompare(d1, d2, labels, title):\n",
-    "    mse = nn.functional.mse_loss(d1, d2, reduction=\"mean\" )\n",
+    "    mse = nn.functional.mse_loss(d1, d2, reduction='mean' )\n",
     "    plt.hist( d1.flatten().detach().numpy(), bins=64, alpha = 0.7, density=True, label=labels[0])\n",
-    "    plt.hist( d2.flatten().detach().numpy(), bins=64, color=[\"#33b1ff\"], alpha = 0.8, density=True, label=labels[1], histtype=\"step\", linewidth=3.5)\n",
-    "    plt.yscale(\"log\")\n",
-    "    plt.legend(loc=\"upper center\", bbox_to_anchor=(0.5, -0.1), fancybox=True, ncol=2)\n",
+    "    plt.hist( d2.flatten().detach().numpy(), bins=64, color=['#33b1ff'], alpha = 0.8, density=True, label=labels[1], histtype='step', linewidth=3.5)\n",
+    "    plt.yscale('log')\n",
+    "    plt.legend(loc='upper center', bbox_to_anchor=(0.5, -0.1), fancybox=True, ncol=2)\n",
     "    plt.title(f\"{title}, MSE={mse:.3f}\")\n",
     "\n",
     "\n",
     "\n",
-    "titles=[\"inputs\", \"weights\", \"outputs\"]\n",
-    "isQ = [\"not quantized\", \"quantized\"]\n",
+    "titles=['inputs', 'weights', 'outputs']\n",
+    "isQ = ['not quantized', 'quantized']\n",
     "for i, inp in enumerate([input, input_quant]):\n",
     "    for j, W in enumerate([weight, weight_quant]):\n",
     "        plt.subplots(1,3,figsize=(18,5))\n",
-    "        plt.suptitle(f\"Case {i*2+j+1}: Input {isQ[i]}, Weight {isQ[j]}\", fontsize=20, ha=\"center\", va=\"bottom\")\n",
-    "        plt.subplot(131); PlotAndCompare(input,     inp,        [\"raw\", isQ[i]],  f\"input, {isQ[i]}\")\n",
-    "        plt.subplot(132); PlotAndCompare(weight,    W,          [\"raw\", isQ[j]],  f\"weight, {isQ[j]}\")\n",
+    "        plt.suptitle(f'Case {i*2+j+1}: Input {isQ[i]}, Weight {isQ[j]}', fontsize=20, ha='center', va='bottom')\n",
+    "        plt.subplot(131); PlotAndCompare(input,     inp,        ['raw', isQ[i]],  f\"input, {isQ[i]}\")\n",
+    "        plt.subplot(132); PlotAndCompare(weight,    W,          ['raw', isQ[j]],  f\"weight, {isQ[j]}\")\n",
     "        net.conv.weight = torch.nn.Parameter(W)\n",
     "        y_quant = net(inp)\n",
-    "        plt.subplot(133); PlotAndCompare(y,         y_quant,   [\"raw\", f\"A={isQ[j]}, W={isQ[i]}\"], \"conv output\")\n",
+    "        plt.subplot(133); PlotAndCompare(y,         y_quant,   ['raw', f'A={isQ[i]}, W={isQ[j]}'], \"conv output\")  # A follows the input index i, W follows the weight index j\n",
     "        plt.show()\n",
     "\n",
     "\n"
@@ -737,34 +737,34 @@
     "qcfg = qconfig_init()\n",
     "\n",
     "# set bits for quantization (nbits_a needs to be set to quantize input regardless of bias)\n",
-    "qcfg[\"nbits_w\"] = 4\n",
-    "qcfg[\"nbits_a\"] = 4\n",
+    "qcfg['nbits_w'] = 4\n",
+    "qcfg['nbits_a'] = 4\n",
     "\n",
     "# just to be consistent with our \"simple Quantizer\" (normally align_zero is True)\n",
-    "qcfg[\"align_zero\"] = False\n",
+    "qcfg['align_zero'] = False\n",
     "\n",
     "# Quantization Mode here means which quantizers we would like to use,\n",
     "# There are many quantizers available in fms_mo, such as PArameterized Clipping acTivation (PACT),\n",
     "# Statstics-Aware Weight Binning (SAWB).\n",
-    "qcfg[\"qw_mode\"] = \"pact\"\n",
-    "qcfg[\"qa_mode\"] = \"pact\"\n",
+    "qcfg['qw_mode'] = 'pact'\n",
+    "qcfg['qa_mode'] = 'pact'\n",
     "\n",
     "# Set weight and input (activation) clip vals\n",
-    "qcfg[\"w_clip_init_valn\"], qcfg[\"w_clip_init_val\"] = -2.5, 2.5\n",
-    "qcfg[\"act_clip_init_valn\"], qcfg[\"act_clip_init_val\"] = -2.5, 2.5\n",
+    "qcfg['w_clip_init_valn'], qcfg['w_clip_init_val'] = -2.5, 2.5\n",
+    "qcfg['act_clip_init_valn'], qcfg['act_clip_init_val'] = -2.5, 2.5\n",
     "\n",
     "\n",
     "# This parameter is usually False, but for Demo purposes we quantize the first/only layer\n",
-    "qcfg[\"q1stlastconv\"] = True\n",
+    "qcfg['q1stlastconv'] = True\n",
     "\n",
     "\n",
     "if path.exists(\"results\"):\n",
     "    print(\"results folder exists!\")\n",
     "else:\n",
-    "    os.makedirs(\"results\")\n",
+    "    os.makedirs('results')\n",
     "    \n",
     "# Step 2: Prepare the model to convert layer to add Quantizers\n",
-    "qmodel_prep(net_fms_mo, input, qcfg, save_fname=\"./results/temp.pt\")\n",
+    "qmodel_prep(net_fms_mo, input, qcfg, save_fname='./results/temp.pt')\n",
     "\n"
    ]
   },
@@ -780,7 +780,7 @@
     "y_quant      = net(input_quant) \n",
     "\n",
     "plt.figure(figsize=(16, 10))\n",
-    "PlotAndCompare(y_quant_fms_mo, y_quant, [\"fms_mo\",\"manual\"],\"quantized Conv output by different methods\")\n",
+    "PlotAndCompare(y_quant_fms_mo, y_quant, ['fms_mo','manual'],'quantized Conv output by different methods')\n",
     "plt.show()\n"
    ]
   },
@@ -804,10 +804,9 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "import os\n",
-    "import wget\n",
-    "IMG_FILE_NAME = \"lion.png\"\n",
-    "url = \"https://raw.githubusercontent.com/foundation-model-stack/fms-model-optimizer/main/tutorials/images/\" + IMG_FILE_NAME\n",
+    "import os, wget\n",
+    "IMG_FILE_NAME = 'lion.png'\n",
+    "url = 'https://raw.githubusercontent.com/foundation-model-stack/fms-model-optimizer/main/tutorials/images/' + IMG_FILE_NAME\n",
     "\n",
     "if not os.path.isfile(IMG_FILE_NAME):\n",
     "  wget.download(url, out=IMG_FILE_NAME)\n",
@@ -864,19 +863,19 @@
     "\n",
     "plt.subplots(3,1,figsize=(16,25))\n",
     "plt.subplot(311)\n",
-    "plt.title(\"Output from non-quantized model\", fontsize=20)\n",
-    "plt.imshow(feature_map, cmap=\"RdBu\")\n",
+    "plt.title('Output from non-quantized model', fontsize=20)\n",
+    "plt.imshow(feature_map, cmap='RdBu')\n",
     "plt.clim(0,255)\n",
     "plt.colorbar()\n",
     "\n",
     "plt.subplot(312)\n",
-    "plt.title(\"Output from quantized model\", fontsize=20)\n",
-    "plt.imshow(feature_map_quant, cmap=\"RdBu\")\n",
+    "plt.title('Output from quantized model', fontsize=20)\n",
+    "plt.imshow(feature_map_quant, cmap='RdBu')\n",
     "plt.clim(0,255)\n",
     "plt.colorbar()\n",
     "\n",
     "plt.subplot(313)\n",
-    "PlotAndCompare(y_img_tensor, y_img_quant, [\"raw\",\"quantized\"],\"Conv output\")\n",
+    "PlotAndCompare(y_img_tensor, y_img_quant, ['raw','quantized'],'Conv output')\n",
     "\n",
     "plt.tight_layout()\n",
     "plt.show()\n"