sassoftware
diff --git a/examples/ARCHIVE/v1_8/pzmmModelImportExampleRegression.ipynb b/examples/ARCHIVE/v1_8/pzmmModelImportExampleRegression.ipynb
Lines changed: 274 additions & 30 deletions
diff --git a/examples/data/hmeqModels/DecisionTreeClassifier/DecisionTreeClassifier.zip b/examples/data/hmeqModels/DecisionTreeClassifier/DecisionTreeClassifier.zip
0 Bytes
diff --git a/examples/data/hmeqModels/GradientBoosting/GradientBoosting.zip b/examples/data/hmeqModels/GradientBoosting/GradientBoosting.zip
0 Bytes
diff --git a/examples/data/hmeqModels/RandomForest/RandomForest.zip b/examples/data/hmeqModels/RandomForest/RandomForest.zip
0 Bytes
@@ -21,9 +21,13 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 1,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:28:44.170919Z",
+     "start_time": "2023-04-03T14:28:41.650760Z"
+    }
    },
    "outputs": [],
    "source": [
@@ -60,36 +64,172 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 5,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:29:22.362807Z",
+     "start_time": "2023-04-03T14:29:22.227471Z"
+    }
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "(5000, 7)"
+      ]
+     },
+     "execution_count": 5,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
-    "housingData = pd.read_csv('data/USA_Housing.csv',sep= ',')\n",
+    "housingData = pd.read_csv('../../data/USA_Housing.csv',sep= ',')\n",
     "housingData.shape"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 6,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:29:24.284223Z",
+     "start_time": "2023-04-03T14:29:24.269273Z"
+    }
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "data": {
+      "text/html": [
+       "<div>\n",
+       "<style scoped>\n",
+       "    .dataframe tbody tr th:only-of-type {\n",
+       "        vertical-align: middle;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe tbody tr th {\n",
+       "        vertical-align: top;\n",
+       "    }\n",
+       "\n",
+       "    .dataframe thead th {\n",
+       "        text-align: right;\n",
+       "    }\n",
+       "</style>\n",
+       "<table border=\"1\" class=\"dataframe\">\n",
+       "  <thead>\n",
+       "    <tr style=\"text-align: right;\">\n",
+       "      <th></th>\n",
+       "      <th>Avg_Area_Income</th>\n",
+       "      <th>Avg_Area_House_Age</th>\n",
+       "      <th>Avg_Area_Number_of_Rooms</th>\n",
+       "      <th>Avg_Area_Number_of_Bedrooms</th>\n",
+       "      <th>Area_Population</th>\n",
+       "      <th>Price</th>\n",
+       "    </tr>\n",
+       "  </thead>\n",
+       "  <tbody>\n",
+       "    <tr>\n",
+       "      <th>0</th>\n",
+       "      <td>79545.45857</td>\n",
+       "      <td>5.682861</td>\n",
+       "      <td>7.009188</td>\n",
+       "      <td>4.09</td>\n",
+       "      <td>23086.80050</td>\n",
+       "      <td>1.059034e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>1</th>\n",
+       "      <td>79248.64245</td>\n",
+       "      <td>6.002900</td>\n",
+       "      <td>6.730821</td>\n",
+       "      <td>3.09</td>\n",
+       "      <td>40173.07217</td>\n",
+       "      <td>1.505891e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>2</th>\n",
+       "      <td>61287.06718</td>\n",
+       "      <td>5.865890</td>\n",
+       "      <td>8.512727</td>\n",
+       "      <td>5.13</td>\n",
+       "      <td>36882.15940</td>\n",
+       "      <td>1.058988e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>3</th>\n",
+       "      <td>63345.24005</td>\n",
+       "      <td>7.188236</td>\n",
+       "      <td>5.586729</td>\n",
+       "      <td>3.26</td>\n",
+       "      <td>34310.24283</td>\n",
+       "      <td>1.260617e+06</td>\n",
+       "    </tr>\n",
+       "    <tr>\n",
+       "      <th>4</th>\n",
+       "      <td>59982.19723</td>\n",
+       "      <td>5.040555</td>\n",
+       "      <td>7.839388</td>\n",
+       "      <td>4.23</td>\n",
+       "      <td>26354.10947</td>\n",
+       "      <td>6.309435e+05</td>\n",
+       "    </tr>\n",
+       "  </tbody>\n",
+       "</table>\n",
+       "</div>"
+      ],
+      "text/plain": [
+       "   Avg_Area_Income  Avg_Area_House_Age  Avg_Area_Number_of_Rooms  \\\n",
+       "0      79545.45857            5.682861                  7.009188   \n",
+       "1      79248.64245            6.002900                  6.730821   \n",
+       "2      61287.06718            5.865890                  8.512727   \n",
+       "3      63345.24005            7.188236                  5.586729   \n",
+       "4      59982.19723            5.040555                  7.839388   \n",
+       "\n",
+       "   Avg_Area_Number_of_Bedrooms  Area_Population         Price  \n",
+       "0                         4.09      23086.80050  1.059034e+06  \n",
+       "1                         3.09      40173.07217  1.505891e+06  \n",
+       "2                         5.13      36882.15940  1.058988e+06  \n",
+       "3                         3.26      34310.24283  1.260617e+06  \n",
+       "4                         4.23      26354.10947  6.309435e+05  "
+      ]
+     },
+     "execution_count": 6,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
     "housingData = housingData.drop(['Address'], axis=1)\n",
     "housingData.head()"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 7,
    "metadata": {
     "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:29:25.456875Z",
+     "start_time": "2023-04-03T14:29:25.450876Z"
+    },
     "scrolled": true
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "data": {
+      "text/plain": [
+       "Index(['Avg_Area_Income', 'Avg_Area_House_Age', 'Avg_Area_Number_of_Rooms',\n",
+       "       'Avg_Area_Number_of_Bedrooms', 'Area_Population', 'Price'],\n",
+       "      dtype='object')"
+      ]
+     },
+     "execution_count": 7,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
     "housingData.columns"
    ]
@@ -105,11 +245,24 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 8,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:29:38.649081Z",
+     "start_time": "2023-04-03T14:29:38.634078Z"
+    }
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "(1500, 5)\n",
+      "(3500, 5)\n"
+     ]
+    }
+   ],
    "source": [
     "# Input \n",
     "predictorColumns = ['Avg_Area_Income', 'Avg_Area_House_Age', 'Avg_Area_Number_of_Rooms', \n",
@@ -140,11 +293,46 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 9,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:29:40.804108Z",
+     "start_time": "2023-04-03T14:29:40.673110Z"
+    }
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "C:\\ProgramData\\Anaconda3\\lib\\site-packages\\sklearn\\linear_model\\_base.py:141: FutureWarning: 'normalize' was deprecated in version 1.0 and will be removed in 1.2.\n",
+      "If you wish to scale the data, use Pipeline with a StandardScaler in a preprocessing stage. To reproduce the previous behavior:\n",
+      "\n",
+      "from sklearn.pipeline import make_pipeline\n",
+      "\n",
+      "model = make_pipeline(StandardScaler(with_mean=False), LinearRegression())\n",
+      "\n",
+      "If you wish to pass a sample_weight parameter, you need to pass it as a fit parameter to each step of the pipeline as follows:\n",
+      "\n",
+      "kwargs = {s[0] + '__sample_weight': sample_weight for s in model.steps}\n",
+      "model.fit(X, y, **kwargs)\n",
+      "\n",
+      "\n",
+      "  warnings.warn(\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "LinearRegression(normalize=True)"
+      ]
+     },
+     "execution_count": 9,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
    "source": [
     "# Linear Regression Training\n",
     "from sklearn.linear_model import LinearRegression\n",
@@ -154,11 +342,23 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 10,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:29:42.800193Z",
+     "start_time": "2023-04-03T14:29:42.787165Z"
+    }
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "0.9146818498916266\n"
+     ]
+    }
+   ],
    "source": [
     "# Test Predictions\n",
     "from sklearn import metrics\n",
@@ -177,25 +377,70 @@
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 11,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:34:10.912291Z",
+     "start_time": "2023-04-03T14:34:10.906281Z"
+    }
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Model LinearRegression was successfully pickled and saved to C:\\Users\\sclind\\Documents\\Python Scripts\\GitHub\\sassoftware\\python-sasctl\\examples\\ARCHIVE\\v1_8\\RegressionModel\\LinearRegression.pickle.\n"
+     ]
+    }
+   ],
    "source": [
     "modelPrefix = 'LinearRegression'\n",
-    "zipFolder = Path.cwd() / 'data/USAHousingModels/LinearRegression'\n",
+    "zipFolder = Path.cwd() / 'RegressionModel/'\n",
     "\n",
     "pzmm.PickleModel.pickle_trained_model(linReg, modelPrefix, zipFolder)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": null,
+   "execution_count": 13,
    "metadata": {
-    "Collapsed": "false"
+    "Collapsed": "false",
+    "ExecuteTime": {
+     "end_time": "2023-04-03T14:35:59.447060Z",
+     "start_time": "2023-04-03T14:35:59.327305Z"
+    }
    },
-   "outputs": [],
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "inputVar.json was successfully written and saved to C:\\Users\\sclind\\Documents\\Python Scripts\\GitHub\\sassoftware\\python-sasctl\\examples\\ARCHIVE\\v1_8\\RegressionModel\\inputVar.json\n",
+      "outputVar.json was successfully written and saved to C:\\Users\\sclind\\Documents\\Python Scripts\\GitHub\\sassoftware\\python-sasctl\\examples\\ARCHIVE\\v1_8\\RegressionModel\\outputVar.json\n",
+      "ModelProperties.json was successfully written and saved to C:\\Users\\sclind\\Documents\\Python Scripts\\GitHub\\sassoftware\\python-sasctl\\examples\\ARCHIVE\\v1_8\\RegressionModel\\ModelProperties.json\n",
+      "fileMetaData.json was successfully written and saved to C:\\Users\\sclind\\Documents\\Python Scripts\\GitHub\\sassoftware\\python-sasctl\\examples\\ARCHIVE\\v1_8\\RegressionModel\\fileMetaData.json\n"
+     ]
+    },
+    {
+     "name": "stderr",
+     "output_type": "stream",
+     "text": [
+      "C:\\Users\\sclind\\AppData\\Roaming\\Python\\Python39\\site-packages\\sasctl\\pzmm\\write_json_files.py:133: FutureWarning: The frame.append method is deprecated and will be removed from pandas in a future version. Use pandas.concat instead.\n",
+      "  outputJSON = outputJSON.append([outputRow], ignore_index=True)\n",
+      "C:\\Users\\sclind\\AppData\\Roaming\\Python\\Python39\\site-packages\\sasctl\\pzmm\\write_json_files.py:133: FutureWarning: The frame.append method is deprecated and will be removed from pandas in a future version. Use pandas.concat instead.\n",
+      "  outputJSON = outputJSON.append([outputRow], ignore_index=True)\n",
+      "C:\\Users\\sclind\\AppData\\Roaming\\Python\\Python39\\site-packages\\sasctl\\pzmm\\write_json_files.py:133: FutureWarning: The frame.append method is deprecated and will be removed from pandas in a future version. Use pandas.concat instead.\n",
+      "  outputJSON = outputJSON.append([outputRow], ignore_index=True)\n",
+      "C:\\Users\\sclind\\AppData\\Roaming\\Python\\Python39\\site-packages\\sasctl\\pzmm\\write_json_files.py:133: FutureWarning: The frame.append method is deprecated and will be removed from pandas in a future version. Use pandas.concat instead.\n",
+      "  outputJSON = outputJSON.append([outputRow], ignore_index=True)\n",
+      "C:\\Users\\sclind\\AppData\\Roaming\\Python\\Python39\\site-packages\\sasctl\\pzmm\\write_json_files.py:133: FutureWarning: The frame.append method is deprecated and will be removed from pandas in a future version. Use pandas.concat instead.\n",
+      "  outputJSON = outputJSON.append([outputRow], ignore_index=True)\n",
+      "C:\\Users\\sclind\\AppData\\Roaming\\Python\\Python39\\site-packages\\sasctl\\pzmm\\write_json_files.py:133: FutureWarning: The frame.append method is deprecated and will be removed from pandas in a future version. Use pandas.concat instead.\n",
+      "  outputJSON = outputJSON.append([outputRow], ignore_index=True)\n"
+     ]
+    }
+   ],
    "source": [
     "def writeJSONFiles(data, predict, target, zipFolder, modelPrefix):\n",
     "    J = pzmm.JSONFiles()\n",
@@ -204,8 +449,7 @@
     "    J.writeVarJSON(data[predict], isInput=True, jPath=zipFolder)\n",
     "    \n",
     "    # Set output variables and assign an event threshold, then write output variable mapping\n",
-    "    outputVar = pd.DataFrame(columns=['EM_PREDICTION'])\n",
-    "    outputVar['EM_PREDICTION'].loc[1] = 0.5\n",
+    "    outputVar = pd.DataFrame(data=[[0.5]], columns=['EM_PREDICTION'])\n",
     "    J.writeVarJSON(outputVar, isInput=False, jPath=zipFolder)\n",
     "    \n",
     "    # Write model properties to a json file\n",
@@ -276,7 +520,7 @@
    "name": "python",
    "nbconvert_exporter": "python",
    "pygments_lexer": "ipython3",
-   "version": "3.8.16"
+   "version": "3.9.12"
   },
   "latex_envs": {
    "LaTeX_envs_menu_present": true,