diff --git a/Automated Essay Grading/Model/Automated_Essay_Grading (2).ipynb b/Automated Essay Grading/Model/Automated_Essay_Grading (2).ipynb
new file mode 100644
index 0000000000..20b01d626f
--- /dev/null
+++ b/Automated Essay Grading/Model/Automated_Essay_Grading (2).ipynb	
@@ -0,0 +1,1466 @@
+{
+  "nbformat": 4,
+  "nbformat_minor": 0,
+  "metadata": {
+    "colab": {
+      "name": "Automated_Essay_Grading.ipynb",
+      "provenance": [],
+      "collapsed_sections": []
+    },
+    "kernelspec": {
+      "display_name": "Python 3",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.3"
+    }
+  },
+  "cells": [
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "pGeJ9Tlf5gRq",
+        "outputId": "366bd917-cfda-4464-eebb-5407a3eb10ec"
+      },
+      "source": [
+        "import numpy as np \n",
+        "import pandas as pd \n",
+        "\n",
+        "#for pre-processing\n",
+        "import nltk\n",
+        "import re\n",
+        "from nltk.corpus import stopwords\n",
+        "from gensim.models import Word2Vec\n",
+        "\n",
+        "nltk.download('stopwords')\n",
+        "nltk.download('punkt')\n",
+        "\n",
+        "#for model training\n",
+        "\n",
+        "from keras.layers import Embedding, LSTM, Dense, Dropout, Lambda, Flatten\n",
+        "from keras.models import Sequential, load_model, model_from_config\n",
+        "import keras.backend as K\n",
+        "from sklearn.model_selection import KFold\n",
+        "from sklearn.model_selection import train_test_split\n",
+        "from sklearn.svm import SVR\n",
+        "from sklearn.linear_model import LogisticRegression\n",
+        "from sklearn.neighbors import KNeighborsClassifier\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "from sklearn.tree import DecisionTreeClassifier\n",
+        "from sklearn.metrics import mean_squared_error\n",
+        "from sklearn.metrics import explained_variance_score\n",
+        "from sklearn import ensemble\n",
+        "from sklearn.linear_model import LinearRegression\n",
+        "from sklearn.metrics import cohen_kappa_score"
+      ],
+      "execution_count": 1,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "[nltk_data] Downloading package stopwords to /root/nltk_data...\n",
+            "[nltk_data]   Unzipping corpora/stopwords.zip.\n",
+            "[nltk_data] Downloading package punkt to /root/nltk_data...\n",
+            "[nltk_data]   Unzipping tokenizers/punkt.zip.\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "xpYqK4V55taJ"
+      },
+      "source": [
+        "test_data = pd.read_csv(\"test_set.tsv\",sep='\\t', encoding='ISO-8859-1')"
+      ],
+      "execution_count": 9,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "EkUUzJU1GZgk"
+      },
+      "source": [
+        "training_data = pd.read_csv(\"training_set_rel3.tsv\",sep='\\t', encoding='ISO-8859-1',\n",
+        "                            usecols = ['essay_id', 'essay_set', 'essay','domain1_score']).dropna(axis=1)"
+      ],
+      "execution_count": 16,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "Zuqui4TA-msu"
+      },
+      "source": [
+        "scores = training_data['domain1_score']"
+      ],
+      "execution_count": 17,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 204
+        },
+        "id": "UNYVwze36yUS",
+        "outputId": "cff2ed4f-a510-4159-b200-46af5ce91112"
+      },
+      "source": [
+        "test_data.head()"
+      ],
+      "execution_count": 18,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/html": [
+              "<div>\n",
+              "<style scoped>\n",
+              "    .dataframe tbody tr th:only-of-type {\n",
+              "        vertical-align: middle;\n",
+              "    }\n",
+              "\n",
+              "    .dataframe tbody tr th {\n",
+              "        vertical-align: top;\n",
+              "    }\n",
+              "\n",
+              "    .dataframe thead th {\n",
+              "        text-align: right;\n",
+              "    }\n",
+              "</style>\n",
+              "<table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              "    <tr style=\"text-align: right;\">\n",
+              "      <th></th>\n",
+              "      <th>essay_id</th>\n",
+              "      <th>essay_set</th>\n",
+              "      <th>essay</th>\n",
+              "      <th>domain1_predictionid</th>\n",
+              "      <th>domain2_predictionid</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <th>0</th>\n",
+              "      <td>2383</td>\n",
+              "      <td>1</td>\n",
+              "      <td>I believe that computers have a positive effec...</td>\n",
+              "      <td>2383</td>\n",
+              "      <td>NaN</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>1</th>\n",
+              "      <td>2384</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear @CAPS1, I know some problems have came up...</td>\n",
+              "      <td>2384</td>\n",
+              "      <td>NaN</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>2</th>\n",
+              "      <td>2385</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear to whom it @MONTH1 concern, Computers are...</td>\n",
+              "      <td>2385</td>\n",
+              "      <td>NaN</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>3</th>\n",
+              "      <td>2386</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear @CAPS1 @CAPS2, @CAPS3 has come to my atte...</td>\n",
+              "      <td>2386</td>\n",
+              "      <td>NaN</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>4</th>\n",
+              "      <td>2387</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear Local newspaper, I think that people have...</td>\n",
+              "      <td>2387</td>\n",
+              "      <td>NaN</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n",
+              "</div>"
+            ],
+            "text/plain": [
+              "   essay_id  essay_set  ... domain1_predictionid  domain2_predictionid\n",
+              "0      2383          1  ...                 2383                   NaN\n",
+              "1      2384          1  ...                 2384                   NaN\n",
+              "2      2385          1  ...                 2385                   NaN\n",
+              "3      2386          1  ...                 2386                   NaN\n",
+              "4      2387          1  ...                 2387                   NaN\n",
+              "\n",
+              "[5 rows x 5 columns]"
+            ]
+          },
+          "metadata": {
+            "tags": []
+          },
+          "execution_count": 18
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "k-Y0cEu8650v",
+        "outputId": "3a208166-8286-4f23-fe61-6840da1b3816"
+      },
+      "source": [
+        "test_data.shape"
+      ],
+      "execution_count": 19,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/plain": [
+              "(4254, 5)"
+            ]
+          },
+          "metadata": {
+            "tags": []
+          },
+          "execution_count": 19
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 204
+        },
+        "id": "UyhgfBgk60Vh",
+        "outputId": "53805d71-89e5-438d-a55c-f2f2048db8c4"
+      },
+      "source": [
+        "training_data.head()"
+      ],
+      "execution_count": 20,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/html": [
+              "<div>\n",
+              "<style scoped>\n",
+              "    .dataframe tbody tr th:only-of-type {\n",
+              "        vertical-align: middle;\n",
+              "    }\n",
+              "\n",
+              "    .dataframe tbody tr th {\n",
+              "        vertical-align: top;\n",
+              "    }\n",
+              "\n",
+              "    .dataframe thead th {\n",
+              "        text-align: right;\n",
+              "    }\n",
+              "</style>\n",
+              "<table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              "    <tr style=\"text-align: right;\">\n",
+              "      <th></th>\n",
+              "      <th>essay_id</th>\n",
+              "      <th>essay_set</th>\n",
+              "      <th>essay</th>\n",
+              "      <th>domain1_score</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <th>0</th>\n",
+              "      <td>1</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear local newspaper, I think effects computer...</td>\n",
+              "      <td>8</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>1</th>\n",
+              "      <td>2</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear @CAPS1 @CAPS2, I believe that using compu...</td>\n",
+              "      <td>9</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>2</th>\n",
+              "      <td>3</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear, @CAPS1 @CAPS2 @CAPS3 More and more peopl...</td>\n",
+              "      <td>7</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>3</th>\n",
+              "      <td>4</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear Local Newspaper, @CAPS1 I have found that...</td>\n",
+              "      <td>10</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>4</th>\n",
+              "      <td>5</td>\n",
+              "      <td>1</td>\n",
+              "      <td>Dear @LOCATION1, I know having computers has a...</td>\n",
+              "      <td>8</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n",
+              "</div>"
+            ],
+            "text/plain": [
+              "   essay_id  ...  domain1_score\n",
+              "0         1  ...              8\n",
+              "1         2  ...              9\n",
+              "2         3  ...              7\n",
+              "3         4  ...             10\n",
+              "4         5  ...              8\n",
+              "\n",
+              "[5 rows x 4 columns]"
+            ]
+          },
+          "metadata": {
+            "tags": []
+          },
+          "execution_count": 20
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "lIo08YSV64G_",
+        "outputId": "70658373-5015-4ea6-cd22-274224309911"
+      },
+      "source": [
+        "training_data.shape"
+      ],
+      "execution_count": 21,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/plain": [
+              "(12976, 4)"
+            ]
+          },
+          "metadata": {
+            "tags": []
+          },
+          "execution_count": 21
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "fmt-Jt9u6qqY"
+      },
+      "source": [
+        "test_data.dropna(axis=1,inplace=True)"
+      ],
+      "execution_count": 22,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "v9Cvw9XM6wR0"
+      },
+      "source": [
+        "\n",
+        "y = training_data['domain1_score']\n",
+        "X = training_data.copy()\n"
+      ],
+      "execution_count": 23,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "YLIUc7pe7TnY"
+      },
+      "source": [
+        "def essay_to_wordlist(essay_v, remove_stopwords):\n",
+        "    #Remove the tagged labels and word tokenize the sentence.\n",
+        "    essay_v = re.sub(\"[^a-zA-Z]\", \" \", essay_v)\n",
+        "    words = essay_v.lower().split()\n",
+        "    if remove_stopwords:\n",
+        "        stops = set(stopwords.words(\"english\"))\n",
+        "        words = [w for w in words if not w in stops]\n",
+        "    return (words)\n",
+        "\n",
+        "def essay_to_sentences(essay_v, remove_stopwords):\n",
+        "    \"\"\"Sentence tokenize the essay and call essay_to_wordlist() for word tokenization.\"\"\"\n",
+        "    tokenizer = nltk.data.load('tokenizers/punkt/english.pickle')\n",
+        "    raw_sentences = tokenizer.tokenize(essay_v.strip())\n",
+        "    sentences = []\n",
+        "    for raw_sentence in raw_sentences:\n",
+        "        if len(raw_sentence) > 0:\n",
+        "            sentences.append(essay_to_wordlist(raw_sentence, remove_stopwords))\n",
+        "    return sentences\n",
+        "\n",
+        "def makeFeatureVec(words, model, num_features):\n",
+        "    \"\"\"Make ar from the words list of an Essay.\"\"\"\n",
+        "    featureVec = np.zeros((num_features,),dtype=\"float32\")\n",
+        "    num_words = 0.\n",
+        "    index2word_set = set(model.wv.index2word)\n",
+        "    for word in words:\n",
+        "        if word in index2word_set:\n",
+        "            num_words += 1\n",
+        "            featureVec = np.add(featureVec,model[word])        \n",
+        "    featureVec = np.divide(featureVec,num_words)\n",
+        "    return featureVec\n",
+        "\n",
+        "def getAvgFeatureVecs(essays, model, num_features):\n",
+        "    \"\"\"Main function to generate the word vectors for word2vec model.\"\"\"\n",
+        "    counter = 0\n",
+        "    essayFeatureVecs = np.zeros((len(essays),num_features),dtype=\"float32\")\n",
+        "    for essay in essays:\n",
+        "        essayFeatureVecs[counter] = makeFeatureVec(essay, model, num_features)\n",
+        "        counter = counter + 1\n",
+        "    return essayFeatureVecs"
+      ],
+      "execution_count": 24,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "poBfr2pm7b1c"
+      },
+      "source": [
+        "from keras.layers import Embedding, LSTM, Dense, Dropout, Lambda, Flatten\n",
+        "from keras.models import Sequential, load_model, model_from_config\n",
+        "import keras.backend as K\n",
+        "\n",
+        "def get_model():\n",
+        "    \"\"\"Define the model.\"\"\"\n",
+        "    model = Sequential()\n",
+        "    model.add(LSTM(300, dropout=0.4, recurrent_dropout=0.4, input_shape=[1, 300], return_sequences=True))\n",
+        "    model.add(LSTM(64, recurrent_dropout=0.4))\n",
+        "    model.add(Dropout(0.5))\n",
+        "    model.add(Dense(1, activation='relu'))\n",
+        "\n",
+        "    model.compile(loss='mean_squared_error', optimizer='rmsprop', metrics=['mae'])\n",
+        "    model.summary()\n",
+        "\n",
+        "    return model"
+      ],
+      "execution_count": 25,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "j3T0MKXk7gti",
+        "outputId": "c6022e85-0b13-4c42-f133-3449ee989b5c"
+      },
+      "source": [
+        "cv = KFold(n_splits = 8, shuffle = True)\n",
+        "results = []\n",
+        "y_pred_list = []\n",
+        "\n",
+        "count = 1\n",
+        "for traincv, testcv in cv.split(X):\n",
+        "    print(\"\\n--------Fold {}--------\\n\".format(count))\n",
+        "    X_test, X_train, y_test, y_train = X.iloc[testcv], X.iloc[traincv], y.iloc[testcv], y.iloc[traincv]\n",
+        "    \n",
+        "    train_essays = X_train['essay']\n",
+        "    test_essays = X_test['essay']\n",
+        "    \n",
+        "    sentences = []\n",
+        "    \n",
+        "    for essay in train_essays:\n",
+        "            # Obtaining all sentences from the training essays.\n",
+        "            sentences += essay_to_sentences(essay, remove_stopwords = True)\n",
+        "            \n",
+        "    # Initializing variables for word2vec model.\n",
+        "    num_features = 300\n",
+        "    min_word_count = 40\n",
+        "    num_workers = 8\n",
+        "    context = 10\n",
+        "    downsampling = 1e-3\n",
+        "\n",
+        "    \n",
+        "    print(\"Training Word2Vec Model...\")\n",
+        "    model = Word2Vec(sentences, workers=num_workers, size=num_features, min_count = min_word_count, window = context, sample = downsampling)\n",
+        "\n",
+        "    model.init_sims(replace=True)\n",
+        "    model.wv.save_word2vec_format('word2vecmodel.bin', binary=True)\n",
+        "\n",
+        "    clean_train_essays = []\n",
+        "    \n",
+        "    # Generate training and testing data word vectors.\n",
+        "    for essay_v in train_essays:\n",
+        "        clean_train_essays.append(essay_to_wordlist(essay_v, remove_stopwords=True))\n",
+        "    trainDataVecs = getAvgFeatureVecs(clean_train_essays, model, num_features)\n",
+        "    \n",
+        "    clean_test_essays = []\n",
+        "    for essay_v in test_essays:\n",
+        "        clean_test_essays.append(essay_to_wordlist( essay_v, remove_stopwords=True ))\n",
+        "    testDataVecs = getAvgFeatureVecs( clean_test_essays, model, num_features )\n",
+        "    \n",
+        "    trainDataVecs = np.array(trainDataVecs)\n",
+        "    testDataVecs = np.array(testDataVecs)\n",
+        "    # Reshaping train and test vectors to 3 dimensions. (1 represnts one timestep)\n",
+        "    trainDataVecs = np.reshape(trainDataVecs, (trainDataVecs.shape[0], 1, trainDataVecs.shape[1]))\n",
+        "    testDataVecs = np.reshape(testDataVecs, (testDataVecs.shape[0], 1, testDataVecs.shape[1]))\n",
+        "    \n",
+        "    lstm_model = get_model()\n",
+        "    lstm_model.fit(trainDataVecs, y_train, batch_size=64, epochs=2)\n",
+        "    #lstm_model.load_weights('./model_weights/final_lstm.h5')\n",
+        "    y_pred = lstm_model.predict(testDataVecs)\n",
+        "    \n",
+        "    # Save any one of the 5 models.\n",
+        "    if count == 5:\n",
+        "         lstm_model.save_weights('final_lstm.h5')\n",
+        "    \n",
+        "    # Round y_pred to the nearest integer.\n",
+        "    y_pred = np.around(y_pred)\n",
+        "    \n",
+        "    # Evaluate the model on the evaluation metric. \"Quadratic mean averaged Kappa\"\n",
+        "    result = cohen_kappa_score(y_test.values,y_pred,weights='quadratic')\n",
+        "    print(\"Kappa Score: {}\".format(result))\n",
+        "    results.append(result)\n",
+        "\n",
+        "    count += 1    "
+      ],
+      "execution_count": 26,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "\n",
+            "--------Fold 1--------\n",
+            "\n",
+            "Training Word2Vec Model...\n"
+          ],
+          "name": "stdout"
+        },
+        {
+          "output_type": "stream",
+          "text": [
+            "/usr/local/lib/python3.7/dist-packages/ipykernel_launcher.py:28: DeprecationWarning: Call to deprecated `__getitem__` (Method will be removed in 4.0.0, use self.wv.__getitem__() instead).\n"
+          ],
+          "name": "stderr"
+        },
+        {
+          "output_type": "stream",
+          "text": [
+            "Model: \"sequential\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm (LSTM)                  (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_1 (LSTM)                (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout (Dropout)            (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense (Dense)                (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 34s 26ms/step - loss: 80.0289 - mae: 5.0009\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 26ms/step - loss: 42.6830 - mae: 3.6584\n",
+            "Kappa Score: 0.7903575237442636\n",
+            "\n",
+            "--------Fold 2--------\n",
+            "\n",
+            "Training Word2Vec Model...\n",
+            "Model: \"sequential_1\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm_2 (LSTM)                (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_3 (LSTM)                (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout_1 (Dropout)          (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense_1 (Dense)              (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 13s 26ms/step - loss: 80.4811 - mae: 4.9985\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 26ms/step - loss: 41.0250 - mae: 3.5642\n",
+            "Kappa Score: 0.7576200645615898\n",
+            "\n",
+            "--------Fold 3--------\n",
+            "\n",
+            "Training Word2Vec Model...\n",
+            "Model: \"sequential_2\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm_4 (LSTM)                (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_5 (LSTM)                (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout_2 (Dropout)          (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense_2 (Dense)              (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 12s 26ms/step - loss: 86.8164 - mae: 5.1346\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 25ms/step - loss: 42.9669 - mae: 3.6482\n",
+            "Kappa Score: 0.7750784192913241\n",
+            "\n",
+            "--------Fold 4--------\n",
+            "\n",
+            "Training Word2Vec Model...\n",
+            "Model: \"sequential_3\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm_6 (LSTM)                (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_7 (LSTM)                (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout_3 (Dropout)          (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense_3 (Dense)              (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 12s 26ms/step - loss: 84.9276 - mae: 5.1270\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 26ms/step - loss: 41.1146 - mae: 3.5898\n",
+            "Kappa Score: 0.7666838457375764\n",
+            "\n",
+            "--------Fold 5--------\n",
+            "\n",
+            "Training Word2Vec Model...\n",
+            "Model: \"sequential_4\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm_8 (LSTM)                (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_9 (LSTM)                (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout_4 (Dropout)          (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense_4 (Dense)              (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 13s 27ms/step - loss: 82.9046 - mae: 5.0942\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 27ms/step - loss: 44.5824 - mae: 3.7365\n",
+            "Kappa Score: 0.7679175647531018\n",
+            "\n",
+            "--------Fold 6--------\n",
+            "\n",
+            "Training Word2Vec Model...\n",
+            "Model: \"sequential_5\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm_10 (LSTM)               (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_11 (LSTM)               (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout_5 (Dropout)          (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense_5 (Dense)              (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 12s 26ms/step - loss: 82.4743 - mae: 5.0568\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 26ms/step - loss: 41.3642 - mae: 3.6533\n",
+            "Kappa Score: 0.7668898538505264\n",
+            "\n",
+            "--------Fold 7--------\n",
+            "\n",
+            "Training Word2Vec Model...\n",
+            "Model: \"sequential_6\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm_12 (LSTM)               (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_13 (LSTM)               (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout_6 (Dropout)          (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense_6 (Dense)              (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 12s 26ms/step - loss: 77.7445 - mae: 4.8427\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 26ms/step - loss: 41.1949 - mae: 3.6313\n",
+            "Kappa Score: 0.7526492043229287\n",
+            "\n",
+            "--------Fold 8--------\n",
+            "\n",
+            "Training Word2Vec Model...\n",
+            "Model: \"sequential_7\"\n",
+            "_________________________________________________________________\n",
+            "Layer (type)                 Output Shape              Param #   \n",
+            "=================================================================\n",
+            "lstm_14 (LSTM)               (None, 1, 300)            721200    \n",
+            "_________________________________________________________________\n",
+            "lstm_15 (LSTM)               (None, 64)                93440     \n",
+            "_________________________________________________________________\n",
+            "dropout_7 (Dropout)          (None, 64)                0         \n",
+            "_________________________________________________________________\n",
+            "dense_7 (Dense)              (None, 1)                 65        \n",
+            "=================================================================\n",
+            "Total params: 814,705\n",
+            "Trainable params: 814,705\n",
+            "Non-trainable params: 0\n",
+            "_________________________________________________________________\n",
+            "Epoch 1/2\n",
+            "178/178 [==============================] - 13s 27ms/step - loss: 85.8951 - mae: 5.1660\n",
+            "Epoch 2/2\n",
+            "178/178 [==============================] - 5s 26ms/step - loss: 41.5336 - mae: 3.6033\n",
+            "Kappa Score: 0.789614734201678\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "1uVCRjAG-CMF",
+        "outputId": "f3edc244-db77-4e9d-c2cc-f61d0db6e099"
+      },
+      "source": [
+        "print(\"Average Kappa score after a 5-fold cross validation: \",np.around(np.array(results).mean(),decimals=4))"
+      ],
+      "execution_count": 27,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Average Kappa score after a 5-fold cross validation:  0.7709\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "5IVKdy1d7j2q",
+        "outputId": "ef6d01d4-64f6-4bcd-8cd6-ee4803fb1ac8"
+      },
+      "source": [
+        "# Splitting dataset into training and test set and generating word embeddings for other models other than\n",
+        "# neural networks\n",
+        "\n",
+        "indep_train, indep_test, dep_train, dep_test = train_test_split(X, scores, test_size = 0.25)\n",
+        "\n",
+        "train_essays2 = indep_train['essay']\n",
+        "test_essays2 = indep_test['essay']\n",
+        "    \n",
+        "sentences2 = []\n",
+        "\n",
+        "\n",
+        "for essay2 in train_essays2:\n",
+        "            # Obtaining all sentences from the training set of essays.\n",
+        "            sentences2 += essay_to_sentences(essay2,remove_stopwords = True)\n",
+        "            \n",
+        "# Initializing variables for word2vec model.\n",
+        "num_features = 300 \n",
+        "min_word_count = 40\n",
+        "num_workers = 4\n",
+        "context = 10\n",
+        "downsampling = 1e-3\n",
+        "\n",
+        "print(\"Training Word2Vec Model...\")\n",
+        "model = Word2Vec(sentences, workers=num_workers, size=num_features, min_count = min_word_count, window = context, sample = downsampling)\n",
+        "\n",
+        "model.init_sims(replace=True)\n",
+        "model.wv.save_word2vec_format('word2vecmodel.bin', binary=True)\n",
+        "\n",
+        "clean_train_essays2 = []\n",
+        "    \n",
+        "# Generate training and testing data word vectors.\n",
+        "for essay_text2 in train_essays2:\n",
+        "    clean_train_essays2.append(essay_to_wordlist(essay_text2,remove_stopwords = True))\n",
+        "trainDataVecs2 = getAvgFeatureVecs(clean_train_essays2, model, num_features)\n",
+        "    \n",
+        "clean_test_essays2 = []\n",
+        "for essay_text2 in test_essays2:\n",
+        "    clean_test_essays2.append(essay_to_wordlist(essay_text2,remove_stopwords = True))\n",
+        "testDataVecs2 = getAvgFeatureVecs(clean_test_essays2, model, num_features)\n",
+        "    \n",
+        "trainDataVecs2 = np.array(trainDataVecs2)\n",
+        "testDataVecs2 = np.array(testDataVecs2)"
+      ],
+      "execution_count": 28,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Training Word2Vec Model...\n"
+          ],
+          "name": "stdout"
+        },
+        {
+          "output_type": "stream",
+          "text": [
+            "/usr/local/lib/python3.7/dist-packages/ipykernel_launcher.py:28: DeprecationWarning: Call to deprecated `__getitem__` (Method will be removed in 4.0.0, use self.wv.__getitem__() instead).\n"
+          ],
+          "name": "stderr"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "cCDipn8i9zee",
+        "outputId": "7a19bca9-8523-4f51-8a9c-4edf9838e2a1"
+      },
+      "source": [
+        "# Generating scores using Linear Regression Model\n",
+        "\n",
+        "linear_regressor = LinearRegression()\n",
+        "\n",
+        "linear_regressor.fit(trainDataVecs2, dep_train)\n",
+        "\n",
+        "dep_pred = linear_regressor.predict(testDataVecs2)\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "#print('Cohen\\'s kappa score: %.2f' % cohen_kappa_score(dep_pred, dep_test))\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": 29,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 20.85\n",
+            "Variance score: 0.72\n",
+            "Kappa Score: 0.85\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "VSsXfIkpUmTe"
+      },
+      "source": [
+        "ksr = (\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "RD9X4cplAJm3",
+        "outputId": "6ece1d9b-d7f2-45c1-a465-380e410c2b6f"
+      },
+      "source": [
+        "#Generating scores using Gradient Boosting regressor\n",
+        "\n",
+        "'''from sklearn.model_selection import GridSearchCV\n",
+        "params = {'n_estimators':[100, 1000], 'max_depth':[2], 'min_samples_split': [2],\n",
+        "          'learning_rate':[3, 1, 0.1, 0.3], 'loss': ['ls']}\n",
+        "\n",
+        "gbr = ensemble.GradientBoostingRegressor()\n",
+        "\n",
+        "grid = GridSearchCV(gbr, params)\n",
+        "grid.fit(trainDataVecs2, dep_train)\n",
+        "\n",
+        "y_pred = grid.predict(testDataVecs2)\n",
+        "\n",
+        "# summarize the results of the grid search\n",
+        "print(grid.best_score_)\n",
+        "print(grid.best_estimator_)'''\n",
+        "\n",
+        "#USING THE PARAMS FOUND OUT USING GRID SEARCH CV\n",
+        "gbr = ensemble.GradientBoostingRegressor(alpha=0.9, criterion='friedman_mse', init=None,\n",
+        "             learning_rate=0.1, loss='ls', max_depth=2, max_features=None,\n",
+        "             max_leaf_nodes=None, min_impurity_decrease=0.0,\n",
+        "             min_impurity_split=None, min_samples_leaf=1,\n",
+        "             min_samples_split=2, min_weight_fraction_leaf=0.0,\n",
+        "             n_estimators=1000, presort='auto', random_state=None,\n",
+        "             subsample=1.0, verbose=0, warm_start=False)\n",
+        "gbr.fit(trainDataVecs2, dep_train)\n",
+        "dep_pred = gbr.predict(testDataVecs2)\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": 30,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "/usr/local/lib/python3.7/dist-packages/sklearn/ensemble/_gb.py:1342: FutureWarning: The parameter 'presort' is deprecated and has no effect. It will be removed in v0.24. You can suppress this warning by not passing any value to the 'presort' parameter. We also recommend using HistGradientBoosting models instead.\n",
+            "  FutureWarning)\n"
+          ],
+          "name": "stderr"
+        },
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 9.14\n",
+            "Variance score: 0.88\n",
+            "Kappa Score: 0.94\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "_K6BGP2OAraH",
+        "outputId": "5585d00c-8c5c-4ead-97c2-9468ab167714"
+      },
+      "source": [
+        "# Generating scores using Support Vector Regression\n",
+        "svr = SVR()\n",
+        "\n",
+        "'''parameters = {'kernel':['linear', 'rbf'], 'C':[1, 100], 'gamma':[0.1, 0.001]}\n",
+        "\n",
+        "grid = GridSearchCV(svr, parameters)\n",
+        "grid.fit(trainDataVecs2, dep_train)\n",
+        "\n",
+        "y_pred = grid.predict(testDataVecs2)\n",
+        "\n",
+        "# summarize the results of the grid search\n",
+        "print(grid.best_score_)\n",
+        "print(grid.best_estimator_)'''\n",
+        "\n",
+        "#USING THE PARAMS FOUND OUT USING GRID SEARCH CV\n",
+        "svr = SVR(C=100, cache_size=200, coef0=0.0, degree=3, epsilon=0.1, gamma=0.1,kernel='rbf', max_iter=-1, shrinking=True, tol=0.001, verbose=False)\n",
+        "svr.fit(trainDataVecs2, dep_train)\n",
+        "dep_pred = svr.predict(testDataVecs2)\n",
+        "\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "#Cohen's Kappa score\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": 31,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 34.61\n",
+            "Variance score: 0.55\n",
+            "Kappa Score: 0.65\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "pzwT3hDvBIxU",
+        "outputId": "f031d8ff-8a08-4d29-a62c-0cdc69a59352"
+      },
+      "source": [
+        "# Generating scores using XGBClassifier\n",
+        "from xgboost import XGBClassifier\n",
+        "xgb=XGBClassifier(colsample_bytree=0.4,gamma=0,learning_rate=0.01,max_depth=4,min_child_weight=0.5,n_estimators=100,                                                                    reg_alpha=0.75,reg_lambda=0.45,\n",
+        "                 subsample=0.6,seed=42)\n",
+        "xgb.fit(trainDataVecs2, dep_train)\n",
+        "dep_pred = xgb.predict(testDataVecs2)\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "#print('Cohen\\'s kappa score: %.2f' % cohen_kappa_score(dep_pred, dep_test))\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": 32,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 17.12\n",
+            "Variance score: 0.77\n",
+            "Kappa Score: 0.88\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "auYVWNYdDkTS",
+        "outputId": "2bc380e5-3760-4abd-cde5-72a21e9811ff"
+      },
+      "source": [
+        "# Generating scores using Logistic Regression\n",
+        "lr = LogisticRegression(random_state=1, max_iter=1000)\n",
+        "lr.fit(trainDataVecs2, dep_train)\n",
+        "dep_pred = lr.predict(testDataVecs2)\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "#print('Cohen\\'s kappa score: %.2f' % cohen_kappa_score(dep_pred, dep_test))\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": 33,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 40.63\n",
+            "Variance score: 0.48\n",
+            "Kappa Score: 0.66\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "WcV-obvrH8ES",
+        "outputId": "974ce7e2-4b24-41bb-fe1d-3fac293548e0"
+      },
+      "source": [
+        "# Generating scores using K-Nearest Neighbor\n",
+        "knn = KNeighborsClassifier(n_neighbors=1)\n",
+        "knn.fit(trainDataVecs2, dep_train)\n",
+        "dep_pred = knn.predict(testDataVecs2)\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "#print('Cohen\\'s kappa score: %.2f' % cohen_kappa_score(dep_pred, dep_test))\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))\n"
+      ],
+      "execution_count": 34,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 15.10\n",
+            "Variance score: 0.81\n",
+            "Kappa Score: 0.91\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "R1w0mbbAIOEw",
+        "outputId": "5ab17902-79b9-4597-f3f5-59bd54d8ec30"
+      },
+      "source": [
+        "# Generating scores using Desion Tree Classifier\n",
+        "dt = DecisionTreeClassifier(criterion = 'entropy',random_state=0,max_depth = 30)\n",
+        "dt.fit(trainDataVecs2, dep_train)\n",
+        "dep_pred = dt.predict(testDataVecs2)\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "#print('Cohen\\'s kappa score: %.2f' % cohen_kappa_score(dep_pred, dep_test))\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": 35,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 21.12\n",
+            "Variance score: 0.72\n",
+            "Kappa Score: 0.86\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "8MW8TGHBIbbx",
+        "outputId": "0b33a055-d8e1-4e9e-aea9-f2aa6b178b0f"
+      },
+      "source": [
+        "# Generating scores using Random Forest Classifier\n",
+        "rf = RandomForestClassifier(n_estimators=200, random_state=0,max_depth=12)\n",
+        "rf.fit(trainDataVecs2, dep_train)\n",
+        "dep_pred = rf.predict(testDataVecs2)\n",
+        "\n",
+        "# The mean squared error\n",
+        "print(\"Mean squared error: %.2f\" % mean_squared_error(dep_test, dep_pred))\n",
+        "\n",
+        "# Explained variance score: 1 is perfect prediction\n",
+        "print('Variance score: %.2f' % explained_variance_score(dep_test,dep_pred))\n",
+        "\n",
+        "#print('Cohen\\'s kappa score: %.2f' % cohen_kappa_score(dep_pred, dep_test))\n",
+        "print(\"Kappa Score: {0:.2f}\".format(cohen_kappa_score(dep_test.values,np.around(dep_pred),weights='quadratic')))"
+      ],
+      "execution_count": 36,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Mean squared error: 10.44\n",
+            "Variance score: 0.86\n",
+            "Kappa Score: 0.93\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "cxJwnPuvterS"
+      },
+      "source": [
+        "**Comparison of Kappa Score of different algorithms**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 350
+        },
+        "id": "SbIeCEVHYkg8",
+        "outputId": "afafb246-f0c2-4540-bc52-3bf7139918ef"
+      },
+      "source": [
+        "\n",
+        "\n",
+        "import numpy as np\n",
+        "import matplotlib.pyplot as plt\n",
+        "\n",
+        "data = {'LR': 85, 'GBR': 94, 'SVR': 65, 'XGB':88, 'LR':66, 'KNN':91,'Decision Tree':86, 'RF':93  }\n",
+        "courses = list(data.keys())\n",
+        "values = list(data.values())\n",
+        " \n",
+        "ks =[ks_lr, ks_gb]\n",
+        "  \n",
+        "fig = plt.figure(figsize = (10, 5))\n",
+        " \n",
+        "# creating the bar plot\n",
+        "plt.bar(courses, values, color ='teal',width = 0.4)\n",
+        " \n",
+        "plt.xlabel(\"Algorithm\")\n",
+        "plt.ylabel(\"Kappa Score\")\n",
+        "plt.title(\"Coparison of Kappa Score for different algoriths\")\n",
+        "plt.show()"
+      ],
+      "execution_count": 104,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "image/png": "iVBORw0KGgoAAAANSUhEUgAAAl4AAAFNCAYAAADRi2EuAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4yLjIsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy+WH4yJAAAgAElEQVR4nO3deZhkZX238fsbhl0CKCOiIJsEBQ0EUTSiILhv4C4vMYAo7uKWiAZFDTFoVFCDIq64IURFcEPAgLvooLgAGnFkFWRYBRUQ+L1/nKe1pu3uqZ6ZOr3M/bmuurrqrL966nTXt5/z1KlUFZIkSRq9v5npAiRJklYVBi9JkqSeGLwkSZJ6YvCSJEnqicFLkiSpJwYvSZKknhi8pJUoyT2T3JRktZmuZUySw5NcneTKma5lvhl12yY5K8lz2/19k5w2MO8hSX7Zjre9k2yc5BtJbkzyjlHUMypJdk9y2Qi3f1OSraaYf1GSR4xq/9Igg5fmhST/L8mi9gf2iiRfSbJr33VU1SVVdaequr3vfU8kyT2BVwHbVdXdJpi/1BtekjWSfC7Jt5P8bZ+1TiXJpkk+20LODUl+lmT/Ga5pyrZd2arqk1X1qIFJbwb+ux1vnwcOAq4G/raqXjXqegYl2T/Jt/rc53S0NloMkOSjSQ6f6Zq06jJ4ac5L8krgKOAtwMbAPYH3Anv1XMeCPvc3pHsC11TVVctaMMmawOeADYBHVdXvRl3cNHwcuBTYHLgL8GzgtytzB8vx+g3dtithXxPZHDhv3OPzazmuij1Lj90VNl+fl+a4qvLmbc7egPWBm4CnT7HMmnTB7DftdhSwZpu3O3AZ8Dq63oKLgH0H1n088CPgd3Rv/G8cmLcFUMCBwCXANwamLWjL7A8sBm4Efj22bbp/eg4FLgauAj4GrD9uu/u17V4N/Nsy2uBjwJK2vUPb9h8B/BG4o7XRRydYd+z5rwOcBpwKrD0w/wDgglb/YuD5E6w7Wdt9FDgGOL2t/3Vg84H572pt+jvgHOChUzzHm4Adp5i/K/Ad4Pq2zf2napuB1+bbwJHANcDh7Vh5e2v337b6155gfxO2LfAkujB0PXAWcJ+BdS4CXgP8BLhl7BgZt91HAj8HbgD+u7XZcwfq/Va7/6u27z+2/R8P/Am4tT1+RDsGDmnLXgOcCNx5smO3TX9Oe72vA7467vUq4AXAL9vzOxoIcB/gZuD2tu/rJ3mNlnksDTzeie737kbgf4ATgMMH5j8PuBC4FjgFuPu4Ol/c6vz1wLR70fUKDrbTFwZem1e31+aGtr+12ryNgC+253wt8E3aMeTN2/LcZrwAb95W5AY8BrhtojexgWXeDHwPuCuwkO4N+t/bvN3b+u+ke9PdDfg9sO3A/Pu1N7G/p3sz3rvNG3vz+hiwLrD2wLQFbdrvBra1CbB9u/+c9saxFXAnup6mj4/b7gfaNnege6O+zyTP72PAycB6bd3/Aw4cqP+yKdpmd7pQ8vX2BrbmuPmPB7ame4PdDfgDsNOQbfdRujfOh7X576IFhzb/n+h6rxbQnbK7cuzNboI6z6ALSc8C7jlu3uZtP/sAq7dt7jhE2+zf6n9pq2FtuhB2CnDnts4XgP+cou0Gw8Lftef/yFbHv7bXeI02/yLgXGAzJg5zG7Xn8bS2/itafX8VvAa294iBxx9l6XByMN1xv2lr//cDx09x7O7V6r1Pa49Dge8MbK/oAsgGdL19S4DHTFTbJO21rGPpsnZ/DbqQfHBrh6fQBaXD2/w96IL+Tu15vYcWHAfqPL29hmsPTLvXRO000JbfB+7e1rsAeEGb9590AXz1dnsokJn+2+dt7t5mvABv3lbkBuwLXLmMZX4FPG7g8aOBi9r93dub27oD808EXj/Jto4Cjmz3x968thqYPzZtLHhdDzyVcW+0wNeAFw083pbuP/EFA9vYdGD+94FnTVDPau1NabuBac8Hzhp4fssKXje3bTx1iPb+PHDwMG3X3uA+PTDvTnS9IptNsu3rgB0mmbchcARdb9LtdAHmAW3ea4GTlqNt9gcuGZgXuuC09cC0B9N6TSZpu8Hg9XrgxIHHfwNcDuzeHl8EPGeKtv1n4Hvj6rmM5Q9eFwB7DjzeZIJjbPDY/QotlA7U/wdar1dbftdxr/UhE9U25O/u+GNpLHg9rLVbBpb9Fn8JXh8C3jbuuPoTsMVAnXuM29cwweufBh6/DTim3X8zXXi/13Senzdvk90c46W57hpgo2WM5bg73X/QYy5u08ZcV1W/n2h+kl2SnJlkSZIb6E61bDRu+5dOtNO2zWe2da5I8qUk956ipgV0Y9TGDH5S7g90bzDjbUT3X/j4bd1jopomcTVdT9JxSR49OCPJY5N8L8m1Sa4HHsfSz3/Stmv+3DZVdRPdqZqxtn11kgvaYPnr6U4Ljm/bsXWvq6pDqmp7ujY6F/h8ktD1IP1qgtWGaZvB124h3SnXc5Jc32o6tU0fxlKvaVXd0bY/2f4mWn+wvWoZyy/L5sBJA8/lArrQOniMXTpu+XcNLH8tXfgbrH+YY3JCQxxLY+4OXN6e/0R1jm/nm+j+DgzbzpOZ7Ln9F11P4GlJFic5ZDm2Lf2ZwUtz3XfpTsPtPcUyv6F7UxlzzzZtzIZJ1p1k/qfoTj1tVlXr051yyLjtF5Ooqq9W1SPpeht+Tnf6cLKabmP6A8avpvtvf/y2Lp/ORqrqc3TjZj6T5OHw58H2n6Ub87RxVW0AfJmln/9UbQddKKJt7050p3F+k+ShdKfingFs2LZ9A3/dthPVenWraey00KV0p7DGG6Ztatzyf6Q7HbxBu61fVcOGi6Ve04FQONn+xruCpdsrg4+Xw6XAYweeywZVtVZVTVbPpXTjrgaXX7uqvjPEvqZ6XsMeS2OuAO7Rnv+YwXYY387r0p1eHradp6z1rxauurGqXlVVW9GN4Xtlkj2nsw1pkMFLc1pV3QC8ATi6XctonSSrt/+u39YWOx44NMnCJBu15T8xblNvapdSeCjwBLoBvdCN87m2qm5O8kDg/w1bW7uu0l7tjeEWusG8dwzU9IokW7ZA8hbghKq6bZrP/3a6Uz7/kWS9JJsDr5zg+Q2zreOBlwAnJ3kI3VibNenG8tyW5LHAoyZYdbK2A3hckl2TrAH8O92ptEvp2vW2tu0FSd4ATHr5iiRvTXLfJAuSrAe8ELiwqq4BPgk8Iskz2vy7JNlxum3Teqg+AByZ5K5tv/cY3ws4hROBxyfZM8nqdOPWbqEbUziMLwHbJ3lK68F9GbAil6k4hu65bw7Qjv+pPul7DPDaJNu35ddP8vQh9/VbYNP2Ok9k2GMJun+mbgde0l7PvYAHDsw/HjggyY4t0L0FOLuqLppGrZNe02u8JE9Icq8WBG9otd2xjNWkSRm8NOdV1Tvo3lAPpfvDfildgPh8W+RwYBHdJ5Z+CvywTRtzJd34ot/QvYm/oKp+3ua9CHhzkhvpAtuJ0yjtb1pdv6E7bbMbXWAA+DDdJRK+Qfdpx5vpBnkvj5fSjU1aTDcW5lNt+9NWVcfRBYYv0Q2yfhndc76OLnSeMm6VqdqOVsthdM///nQD6qH7xNypdIPdL6Z7/lOdHloHOIluzNxiuh6PJ7WaL6E7bfWqtp9z6T6QANNvm9fQnVb6XpLf0Q3q33aK5f+sqn7Rnt976HrPngg8sapuHXL9q4Gn041luwbYhu4DBcvrXXSv12nt+P0esMsU+z8JeCvw6fbcfwY8dsh9/S/d+Lsrk1w9wbZvZNnH0tiyt9INqD+Q7vX+J7pB/be0+WfQjaf7LF3v2NZ0p8qH9SFgu3ZK9fPLXLp7Hc6g+8fpu8B7q+rMaexPWkqWPo0urVqS7A58oqo2nela5ppltV2Sj9INmD60z7o0/yQ5m26w+0dmuhZpRdnjJUmaVZLsluRu7VTjfnSXcjl1puuSVgav6itJmm22pTstuS7daeKnVdUVM1uStHJ4qlGSJKknnmqUJEnqicFLkiSpJ3NijNdGG21UW2yxxUyXIUmStEznnHPO1VU14bdezIngtcUWW7Bo0aKZLkOSJGmZklw82TxPNUqSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk/mxHc1anbLm940o/uvww6b0f1LkjQse7wkSZJ6YvCSJEnqiacaJUlSb2ZyeMpsGJpij5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUEwfXS9IqyOvvSTPDHi9JkqSeGLwkSZJ6YvCSJEnqicFLkiSpJwYvSZKknhi8JEmSemLwkiRJ6onX8ZI0Z3ktKklzjT1ekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST3xU42SJE2Dn6bVirDHS5IkqScGL0mSpJ4YvCRJknpi8JIkSeqJwUuSJKknBi9JkqSeGLwkSZJ6YvCSJEnqicFLkiSpJwYvSZKknhi8JEmSemLwkiRJ6slIg1eSVyQ5L8nPkhyfZK0kWyY5O8mFSU5IssYoa5AkSZotRha8ktwDeBmwc1XdF1gNeBbwVuDIqroXcB1w4KhqkCRJmk1GfapxAbB2kgXAOsAVwB7AZ9r844C9R1yDJEnSrDCy4FVVlwNvBy6hC1w3AOcA11fVbW2xy4B7TLR+koOSLEqyaMmSJaMqU5IkqTejPNW4IbAXsCVwd2Bd4DHDrl9Vx1bVzlW188KFC0dUpSRJUn9GearxEcCvq2pJVf0J+BzwEGCDduoRYFPg8hHWIEmSNGuMMnhdAjwoyTpJAuwJnA+cCTytLbMfcPIIa5AkSZo1RjnG62y6QfQ/BH7a9nUs8BrglUkuBO4CfGhUNUiSJM0mC5a9yPKrqsOAw8ZNXgw8cJT7lSRJmo28cr0kSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8WzHQBs0Xe9KYZ3X8ddtiM7l+SJI2ePV6SJEk9MXhJkiT1xFON0gybydPcnuKWpH7Z4yVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1JORBq8kGyT5TJKfJ7kgyYOT3DnJ6Ul+2X5uOMoaJEmSZotR93i9Czi1qu4N7ABcABwCfK2qtgG+1h5LkiTNeyMLXknWBx4GfAigqm6tquuBvYDj2mLHAXuPqgZJkqTZZKjglWTXJAe0+wuTbDnEalsCS4CPJPlRkg8mWRfYuKquaMtcCWy8PIVLkiTNNcsMXkkOA14DvLZNWh34xBDbXgDsBLyvqv4B+D3jTitWVQE1yX4PSrIoyaIlS5YMsTtJkqTZbZgerycDT6ILTlTVb4D1hljvMuCyqjq7Pf4MXRD7bZJNANrPqyZauaqOraqdq2rnhQsXDrE7SZKk2W2Y4HXrYM9UO124TFV1JXBpkm3bpD2B84FTgP3atP2Ak6dVsSRJ0hy1YIhlTkzyfmCDJM8DngN8YMjtvxT4ZJI1gMXAAXRh78QkBwIXA8+YftmSJElzz5TBK0mAE4B7A78DtgXeUFWnD7PxqjoX2HmCWXtOs05JkqQ5b8rgVVWV5MtVdT9gqLAlSZKkiQ0zxuuHSR4w8kokSZLmuWHGeO0C7JvkYrpPNoauM+zvR1qZJEnSPDNM8Hr0yKuQJElaBSzzVGNVXQxsADyx3TZo0yRJkjQNw1y5/mDgk8Bd2+0TSV466sIkSZLmm2FONR4I7FJVvwdI8lbgu8B7RlmYJEnSfDPMpxoD3D7w+PY2TZIkSdMwTI/XR4Czk5zUHu8NfGh0JUmSJM1PywxeVfXOJGcBu7ZJB1TVj0ZalSRJ0jy0zOCV5EHAeVX1w/b4b5PsUlVnj7w6SZKkeWSYMV7vA24aeHxTmyZJkqRpGGpwfVXV2IOquoPhxoZJkiRpwDDBa3GSlyVZvd0OBhaPujBJkqT5Zpjg9QLgH4HL220X4KBRFiVJkjQfDfOpxquAZ/VQiyRJ0rw2aY9Xkucl2abdT5IPJ7khyU+S7NRfiZIkSfPDVKcaDwYuavf3AXYAtgJeCbxrtGVJkiTNP1MFr9uq6k/t/hOAj1XVNVV1BrDu6EuTJEmaX6YKXnck2STJWsCewBkD89YebVmSJEnzz1SD698ALAJWA06pqvMAkuyGl5OQJEmatkmDV1V9McnmwHpVdd3ArEXAM0demSRJ0jwz5eUkquo24Lpx034/0ookSZLmqWEuoCpJkqSVwOAlSZLUk6G+7DrJhsA2wFpj06rqG6MqSpIkaT5aZvBK8ly6i6luCpwLPAj4LrDHaEuTJEmaX4Y51Xgw8ADg4qp6OPAPwPUjrUqSJGkeGiZ43VxVNwMkWbOqfg5sO9qyJEmS5p9hxnhdlmQD4PPA6UmuAy4ebVmSJEnzzzKDV1U9ud19Y5IzgfWBU0dalSRJ0jw07KcadwJ2BQr4dlXdOtKqJEmS5qFljvFK8gbgOOAuwEbAR5IcOurCJEmS5ptherz2BXYYGGB/BN1lJQ4fZWGSJEnzzTCfavwNAxdOBdYELh9NOZIkSfPXMD1eNwDnJTmdbozXI4HvJ3k3QFW9bIT1SZIkzRvDBK+T2m3MWaMpRZIkaX4b5nISxyVZA7g3XY/XL/xUoyRJ0vQN812NjwPeD/wKCLBlkudX1VdGXZwkSdJ8MsypxncCD6+qCwGSbA18CTB4SZIkTcMwn2q8cSx0NYuBG0dUjyRJ0rw1TI/XoiRfBk6kG+P1dOAHSZ4CUFWfG2F9kiRJ88YwwWst4LfAbu3xEmBt4Il0QczgJUmSNIRhPtV4QB+FSJIkzXfDfKpxLeBAYHsGrmBfVc8ZYV2SJEnzzjCD6z8O3A14NPB1YFMcXC9JkjRtwwSve1XV64HfV9VxwOOBXYbdQZLVkvwoyRfb4y2TnJ3kwiQntIuzSpIkzXvDBK8/tZ/XJ7kvsD5w12ns42DggoHHbwWOrKp7AdfRncaUJEma94YJXscm2RA4FDgFOJ8uPC1Tkk3pesg+2B4H2AP4TFvkOGDvadYsSZI0J00avJJsBlBVH6yq66rqG1W1VVXdFbh8yO0fBfwrcEd7fBfg+qq6rT2+DLjH8pUuSZI0t0zV43V6ki3GT0xyAPCuZW04yROAq6rqnOUpLMlBSRYlWbRkyZLl2YQkSdKsMlXweiVwWpJtxiYkeW2bvtuka/3FQ4AnJbkI+DTdKcZ3ARskGbuMxaZM0ntWVcdW1c5VtfPChQuH2J0kSdLsNmnwqqovAy8EvpLkvkmOorta/cOq6rJlbbiqXltVm1bVFsCzgP+tqn2BM4GntcX2A05ewecgSZI0J0w5uL6qvgYcAJwFbAXsUVXXreA+XwO8MsmFdGO+PrSC25MkSZoTJr1yfZIb6b6LMcCawJ7AVe2TiVVVfzvsTqrqLLrwRlUtBh64/CVLkiTNTZMGr6par89CJEmS5rthruMlSZKklcDgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1ZGTBK8lmSc5Mcn6S85Ic3KbfOcnpSX7Zfm44qhokSZJmk1H2eN0GvKqqtgMeBLw4yXbAIcDXqmob4GvtsSRJ0rw3suBVVVdU1Q/b/RuBC4B7AHsBx7XFjgP2HlUNkiRJs0kvY7ySbAH8A3A2sHFVXdFmXQls3EcNkiRJM23kwSvJnYDPAi+vqt8NzquqAmqS9Q5KsijJoiVLloy6TEmSpJEbafBKsjpd6PpkVX2uTf5tkk3a/E2AqyZat6qOraqdq2rnhQsXjrJMSZKkXozyU40BPgRcUFXvHJh1CrBfu78fcPKoapAkSZpNFoxw2w8Bng38NMm5bdrrgCOAE5McCFwMPGOENUiSJM0aIwteVfUtIJPM3nNU+5UkSZqtvHK9JElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9MXhJkiT1xOAlSZLUE4OXJElSTwxekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXE4CVJktQTg5ckSVJPDF6SJEk9mZHgleQxSX6R5MIkh8xEDZIkSX3rPXglWQ04GngssB2wT5Lt+q5DkiSpbzPR4/VA4MKqWlxVtwKfBvaagTokSZJ6NRPB6x7ApQOPL2vTJEmS5rVUVb87TJ4GPKaqntsePxvYpapeMm65g4CD2sNtgV/0Wuj0bQRcPdNFzFG23Yqx/Zafbbf8bLvlZ9utmLnQfptX1cKJZizouxLgcmCzgcebtmlLqapjgWP7KmpFJVlUVTvPdB1zkW23Ymy/5WfbLT/bbvnZditmrrffTJxq/AGwTZItk6wBPAs4ZQbqkCRJ6lXvPV5VdVuSlwBfBVYDPlxV5/VdhyRJUt9m4lQjVfVl4Mszse8RmjOnRWch227F2H7Lz7Zbfrbd8rPtVsycbr/eB9dLkiStqvzKIEmSpJ4YvJZDkpsmmPbGJJcnOTfJ+Un2mYnaZpskGyf5VJLFSc5J8t0kT06ye5IbWnv9JMkZSe7a1tk/yZI27+dJXjHTz2OmJPm3JOe1Njo3yWFJ/nPcMjsmuaDdvyjJT9vyX0+y+cxUPnOSbJbk10nu3B5v2B5vkWSbJF9M8qt2PJ6Z5GFtucHj7rwkn0myzsw+m/4N/n1L8rgk/5dk8/Y37g9jv6cTLFtJ3jHw+NVJ3thb4dOQ5PaB1/nHSV6VZLneD5O8Ockjppj/giT/vPzVQpL7tXrPTXJtO57PTXLGimx3tht4nX6W5AtJNmjTt0jyx4E2Obd9WG9OMHitXEdW1Y50V+J/f5LVZ7qgmZQkwOeBb1TVVlV1f7pPsW7aFvlmVe1YVX9P92nXFw+sfkJry4cA/5Zk8BIkq4QkDwaeAOzU2ugRwJnAM8ct+izg+IHHD2/LnwUc2kOps0pVXQq8DziiTTqCbkzIlcCXgGOraut2PL4U2Gpg9RPaMbk9cCt/3darjCR7Au8GHltVF7fJVwOvmmSVW4CnJNmoj/pW0B8HXudH0n2F3WHLs6GqekNVTRqAquqYqvrYctY5to2ftnp3pLsKwL+0x38OfElmZMz2iI29TvcFrmXp94hfjbVJu906QzVOm8FrBKrql8AfgA1nupYZtgdwa1UdMzahqi6uqvcMLtQC2nrAdeM3UFXXABcCm4y41tloE+DqqroFoKqurqpvANcl2WVguWewdPAa811W3W+FOBJ4UJKXA7sCbwf2Bb5bVX++fE1V/ayqPjp+5fYmti4THJOrgtYL+AHgCVX1q4FZHwaeOdabOM5tdAF3TvVQV9VVdBfrfkk6qyX5ryQ/aD3Hzx9bNslrWo/yj5Mc0aZ9NN2FwUlyRDvj8ZMkb2/T3pjk1e3+jkm+1+aflGTDNv2sJG9N8v3Ww/jQYWpv6x2VZBFwcJL7t57uc5J8Nckmbbmtk5zapn8zyb1XYhP2Zd78PTN4jUCSnYBftl/oVdn2wA+nmP/QJOcCl9D15nx4/AJJ7gmsBfxkJBXObqcBm7U/xO9NslubfjxdLxdJHgRc28L+eI+h63Fc5VTVn4B/oQtgL2+Pl3U8QhcqzqW7qPOdgS+MtNDZaU2642bvqvr5uHk30f2eHjzJukcD+yZZf4T1rXRVtZju8kZ3BQ4EbqiqBwAPAJ6X7rqTj6U7m7FLVe0AvG1wG0nuAjwZ2L71OB8+wa4+Brymzf8pS/eyLaiqBwIvZ3q9b2u0i4m+G3gP8LTWm/th4D/aMscCL23TXw28dxrbn3FJVgP2ZOlrfm49cJrx6BkqbbkYvFauVyQ5DzibvxzwapIc3f5T/EGbNHaqcTPgIyz9h+yZSX5C19v13qq6ue96Z1pV3QTcn+6/8SXACUn2B04AntbGpIw/zQhwZpLL6U6fTNQTtqp4LHAFcN+JZrYeh58l+dzA5LFT3Heje2P8l9GXOev8CfgOXQCZyLuB/ZKsN35GVf2OLly8bHTljdyjgH9uAfxs4C7ANnT/HH6kqv4AUFXXjlvvBuBm4ENJnkJ31uPPWhjdoKq+3iYdBzxsYJGx4/AcYItp1HtC+7kt3bF+eqv9UGDTJHcC/hH4nzb9/cydMwhrt5qvBDYGTh+YN3iq8cUTrz47GbxWriPbmIGn0v3yrTXTBc2w84Cdxh60X449gYm+v+oUlv4jdEL7r/AfgSOS3G2Uhc5WVXV7VZ1VVYcBLwGe2sYw/RrYje5YO2Hcag8HNgfOBd7UZ72zRZId6cbuPIjuH6JN+Ovj8cnA/nQ9W0up7jo7X2DpY3JVcQfd6esHJnnd+JlVdT3wKZYebzPoKLrQtu7IKlzJkmwF3A5cBYSud5bckJYAAATESURBVGjsTX3LqjptWduoqtuABwKfoRubeeo0y7il/byd6V1j8/ftZ4DzBuq+X1U9iu59/vpx46HuM83aZsof2z9Cm9M9vzkVsCZj8BqBNoZkEbDfTNcyw/4XWCvJCwemTfYpsV2BX42fWFWLgI8z+amNeSvJtkm2GZi0IzA2yPl4utNoi6vqsvHrtjeBl9P95z7ReJx5q40ZfB/dKcZLgP+iG+P1KeAhSZ40sPhUn1qc8JhcFbRencfTnTacqOfrncDzmSAgtJ6gE5m8x2xWSbIQOAb47xa4vwq8cOzDUUn+Lsm6dL0tB6R90nX871XrWVq/XSD8FcAOg/Or6ga68Zlj47eeDXydlecXwML2oRySrJ5k+9YL+eskT2/Tk2SHqTY027Tj8WXAq+bDhwjm/BOYIeskGXyze+cEy7wZ+FSSD1TVHT3VNatUVSXZGzgyyb/SnS77PfCatsjYGK/QddM/d5JNvRX4YZK3VNWNo657FrkT8J50H6G+je6060Ft3v/QnfJ56WQrV9UVSY6n+y/x30dc62zyPOCSqho7LfFe4AC63ognAO9MchTwW+BGlh6L88wku9L9U3oZXY/YKqmqrk3yGOAbSZaMm3d1kpOYfCD9O+h6aGersVNYq9P9bn2cv/wd/yDdqb4fthC/hG6826mtJ3VRklvpvn1lsEdwPeDkdqYjwCsn2O9+wDEtvC2mOy5Xiqq6tQ3yf3c7rbmArvfxPLoPlrwvyaHtOX8a+PHK2ncfqupHbfjJPsA3Z7qeFeGV6yVJknriqUZJkqSeGLwkSZJ6YvCSJEnqicFLkiSpJwYvSZKknhi8JM1qSfZOUmPfL5dkiyQ/W4nb/2CS7dr91w1MX6n7kSQweEma/fYBvtV+rlRJVquq51bV+W3SX12pXZJWJoOXpFmrXQ18V7qroD9rgvnrJDkxyfntuxfPTrJzm7dPkp+272N868A6NyV5R5IfAw9OclaSnZMcQbuwZpJPtsVXS/KBJOclOS3J2m0bZyU5MsmiJBckeUCSzyX5ZZKJvhxZkgCDl6TZbS/g1Kr6P+CaJPcfN/9FwHVVtR3werovFSfJ3em+8WAPuq9aekD7FgXovkPw7Kraoaq+NbahqjqE9t1wVbVvm7wNcHT7Dtbr6b4bc8ytVbUz3dfNnEz3DQH3BfZPcpeV9PwlzTMGL0mz2T50X29C+zn+dOOuY/Or6mfAT9r0BwBnVdWS9r2Vn+QvX3h9O/DZIff/66o6t90/h+6rZMac0n7+lO7Lia+oqlvovgpmsyG3L2kV43c1SpqV2pcQ7wHcL0kBqwEFHL2Cm765qm4fctlbBu7fDqw9wbw7xi13B/5tlTQJe7wkzVZPAz5eVZtX1RZVtRnwa5buTfo28AyA9snE+7Xp3wd2S7JRktXoesq+PsQ+/5Rk9ZX2DCRpHIOXpNlqH+CkcdM+C7x24PF7gYVJzgcOB84DbqiqK4BDgDOBHwPnVNXJQ+zzWOAnA4PrJWmlSlXNdA2StFxab9bqVXVzkq2BM4Btq+rWGS5NkibkOARJc9k6wJnt9GCAFxm6JM1m9nhJkiT1xDFekiRJPTF4SZIk9cTgJUmS1BODlyRJUk8MXpIkST0xeEmSJPXk/wMDLtSbyvTPBwAAAABJRU5ErkJggg==\n",
+            "text/plain": [
+              "<Figure size 720x360 with 1 Axes>"
+            ]
+          },
+          "metadata": {
+            "tags": [],
+            "needs_background": "light"
+          }
+        }
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "LfIe5758PeG_"
+      },
+      "source": [
+        "* Gradient Boosting regressor gives highest cohen kappa score (0.95) \n",
+        "* We made our final prediction with Gradient Boosting Regressor Model"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "TkAilMekTwOi"
+      },
+      "source": [
+        "## Prediction by best Model"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/"
+        },
+        "id": "b0b7vb8FTqD4",
+        "outputId": "c083c493-c6ad-4966-c88c-b9bb8f2342e7"
+      },
+      "source": [
+        "gbr = ensemble.GradientBoostingRegressor(alpha=0.9, criterion='friedman_mse', init=None,\n",
+        "             learning_rate=0.1, loss='ls', max_depth=2, max_features=None,\n",
+        "             max_leaf_nodes=None, min_impurity_decrease=0.0,\n",
+        "             min_impurity_split=None, min_samples_leaf=1,\n",
+        "             min_samples_split=2, min_weight_fraction_leaf=0.0,\n",
+        "             n_estimators=1000, presort='auto', random_state=None,\n",
+        "             subsample=1.0, verbose=0, warm_start=False)\n",
+        "gbr.fit(trainDataVecs2, dep_train)\n",
+        "predicted_scores = gbr.predict(testDataVecs2)"
+      ],
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "/usr/local/lib/python3.7/dist-packages/sklearn/ensemble/_gb.py:1342: FutureWarning: The parameter 'presort' is deprecated and has no effect. It will be removed in v0.24. You can suppress this warning by not passing any value to the 'presort' parameter. We also recommend using HistGradientBoosting models instead.\n",
+            "  FutureWarning)\n"
+          ],
+          "name": "stderr"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 202
+        },
+        "id": "S6_0WOLVMLwL",
+        "outputId": "a172a169-14b6-4c32-b703-7b64a28be425"
+      },
+      "source": [
+        "predicted_score = predicted_scores\n",
+        "# predicted_score = pd.Series([score for sublist in predicted_scores for score in sublist])\n",
+        "predicted_score=pd.DataFrame(predicted_score,columns=['Predicted_Score']).round()\n",
+        "predicted_score.head()"
+      ],
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/html": [
+              "<div>\n",
+              "<style scoped>\n",
+              "    .dataframe tbody tr th:only-of-type {\n",
+              "        vertical-align: middle;\n",
+              "    }\n",
+              "\n",
+              "    .dataframe tbody tr th {\n",
+              "        vertical-align: top;\n",
+              "    }\n",
+              "\n",
+              "    .dataframe thead th {\n",
+              "        text-align: right;\n",
+              "    }\n",
+              "</style>\n",
+              "<table border=\"1\" class=\"dataframe\">\n",
+              "  <thead>\n",
+              "    <tr style=\"text-align: right;\">\n",
+              "      <th></th>\n",
+              "      <th>Predicted_Score</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <th>0</th>\n",
+              "      <td>3.0</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>1</th>\n",
+              "      <td>2.0</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>2</th>\n",
+              "      <td>3.0</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>3</th>\n",
+              "      <td>2.0</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <th>4</th>\n",
+              "      <td>16.0</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n",
+              "</div>"
+            ],
+            "text/plain": [
+              "   Predicted_Score\n",
+              "0              3.0\n",
+              "1              2.0\n",
+              "2              3.0\n",
+              "3              2.0\n",
+              "4             16.0"
+            ]
+          },
+          "metadata": {
+            "tags": []
+          },
+          "execution_count": 26
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "bZgNaf5PMOEu",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 164
+        },
+        "outputId": "9ca8f68c-fe9a-430c-fe1d-58cd8d7d3bef"
+      },
+      "source": [
+        "final_scores = pd.concat([test_data, predicted_score], axis = 1).rename(columns = {0:\"predicted_score\"})\n"
+      ],
+      "execution_count": 37,
+      "outputs": [
+        {
+          "output_type": "error",
+          "ename": "NameError",
+          "evalue": "ignored",
+          "traceback": [
+            "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+            "\u001b[0;31mNameError\u001b[0m                                 Traceback (most recent call last)",
+            "\u001b[0;32m<ipython-input-37-c6eda3cc4f0b>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0mfinal_scores\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mpd\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mconcat\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0mtest_data\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mpredicted_score\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0maxis\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;36m1\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrename\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcolumns\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0;34m{\u001b[0m\u001b[0;36m0\u001b[0m\u001b[0;34m:\u001b[0m\u001b[0;34m\"predicted_score\"\u001b[0m\u001b[0;34m}\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m",
+            "\u001b[0;31mNameError\u001b[0m: name 'predicted_score' is not defined"
+          ]
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "WnaKTQw2MOGW"
+      },
+      "source": [
+        "final_scores.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    }
+  ]
+}
\ No newline at end of file