# Source: "Lab 15 Savemodel.R" (main branch) from the repository
# BI-course/BBT4206-PHP-Lab15of15-ConsumePlumberAPIOutput-acers_team
# *****************************************************************************
# Lab 11: Saving the Model ----
#
# Course Code: BBT4206
# Course Name: Business Intelligence II
# Semester Duration: 21st August 2023 to 28th November 2023
#
# Lecturer: Allan Omondi
# Contact: aomondi [at] strathmore.edu
#
# Note: The lecture contains both theory and practice. This file forms part of
#       the practice. It has required lab work submissions that are graded for
#       coursework marks.
#
# License: GNU GPL-3.0-or-later
# See LICENSE file for licensing information.
# *****************************************************************************

# **[OPTIONAL] Initialization: Install and use renv ----
# The R Environment ("renv") package helps you create reproducible environments
# for your R projects. This is helpful when working in teams because it makes
# your R projects more isolated, portable and reproducible.

# Further reading:
#   Summary: https://rstudio.github.io/renv/
#   More detailed article: https://rstudio.github.io/renv/articles/renv.html

# "renv" can be installed as follows:
# if (!is.element("renv", installed.packages()[, 1])) {
# install.packages("renv", dependencies = TRUE,
# repos = "https://cloud.r-project.org") # nolint
# }
# require("renv") # nolint

# Once installed, you can then use renv::init() to initialize renv in a new
# project.

# The prompt received after executing renv::init() is as shown below:
# This project already has a lockfile. What would you like to do?

# 1: Restore the project from the lockfile.
# 2: Discard the lockfile and re-initialize the project.
# 3: Activate the project without snapshotting or installing any packages.
# 4: Abort project initialization.

# Select option 1 to restore the project from the lockfile
# renv::init() # nolint

# This will set up a project library, containing all the packages you are
# currently using. The packages (and all the metadata needed to reinstall
# them) are recorded into a lockfile, renv.lock, and a .Rprofile ensures that
# the library is used every time you open the project.

# Consider a library as the location where packages are stored.
# Execute the following command to list all the libraries available in your
# computer:
.libPaths()

# If you are using renv, one of the libraries printed above should be a folder
# inside the project.

# Next, list the contents of every library folder. The result has one element
# per library path, each holding the names found in that folder:
lapply(X = .libPaths(), FUN = list.files)

# This can also be configured using the RStudio GUI when you click the project
# file, e.g., "BBT4206-R.Rproj" in the case of this project. Then
# navigate to the "Environments" tab and select "Use renv with this project".

# As you continue to work on your project, you can install and upgrade
# packages, using either:
# install.packages() and update.packages or
# renv::install() and renv::update()

# You can also clean up a project by removing unused packages using the
# following command: renv::clean()

# After you have confirmed that your code works as expected, use
# renv::snapshot(), AT THE END, to record the packages and their
# sources in the lockfile.

# Later, if you need to share your code with someone else or run your code on
# a new machine, your collaborator (or you) can call renv::restore() to
# reinstall the specific package versions recorded in the lockfile.

# [OPTIONAL]
# Execute the following code to reinstall the specific package versions
# recorded in the lockfile (restart R after executing the command):
# renv::restore() # nolint

# [OPTIONAL]
# If you get several errors setting up renv and you prefer not to use it, then
# you can deactivate it using the following command (restart R after executing
# the command):
# renv::deactivate() # nolint

# If renv::restore() did not install the "languageserver" package (required to
# use R for VS Code), then it can be installed manually as follows (restart R
# after executing the command):

# Install "languageserver" only when it is missing. requireNamespace() checks
# for the package without attaching it, so the check has no side effects.
if (!requireNamespace("languageserver", quietly = TRUE)) {
  install.packages("languageserver", dependencies = TRUE,
                   repos = "https://cloud.r-project.org")
}

# "languageserver" is optional editor tooling, so attach it when it is
# available (including right after a fresh install) but do not abort the lab
# if the installation did not succeed.
if (requireNamespace("languageserver", quietly = TRUE)) {
  library("languageserver")
}

# Introduction ----
# What do you do after you have designed a model that is accurate enough to use?
# This is a critical question whose answer enables the gap between research and
# practice to be addressed.

# It is possible to discover the key internal representation of a model found
# by an algorithm (e.g., the coefficients in a linear model) and use
# them in a new implementation of the prediction algorithm in another
# program developed using a programming language other than R.

# This is easier to do for simpler algorithms that use a simple representation,
# e.g., a linear model, than for algorithms that use more complex
# representations.

# "caret" provides access to "the best" model from a training run in the
# "finalModel" variable.
# The "predict()" function in the "caret" package automatically uses the
# "finalModel" to make predictions on a new dataset. The data provided as the
# "new dataset" can be stored in a separate file and loaded as a data frame.

# STEP 1. Install and Load the Required Packages ----
# Each package below is installed only when it is missing and is then ALWAYS
# attached with library(). library() stops with an error if the package is
# still unavailable, so a failed installation is reported here rather than as
# a confusing "could not find function" error later in the script.

## caret ----
if (!requireNamespace("caret", quietly = TRUE)) {
  install.packages("caret", dependencies = TRUE,
                   repos = "https://cloud.r-project.org")
}
library("caret")

## mlbench ----
if (!requireNamespace("mlbench", quietly = TRUE)) {
  install.packages("mlbench", dependencies = TRUE,
                   repos = "https://cloud.r-project.org")
}
library("mlbench")

## plumber ----
if (!requireNamespace("plumber", quietly = TRUE)) {
  install.packages("plumber", dependencies = TRUE,
                   repos = "https://cloud.r-project.org")
}
library("plumber")

# STEP 2. Load the Dataset ----
# Load the "Satellite" dataset into the workspace. The outcome column used
# below is `classes`; every other column is used as a predictor.
data(Satellite)

# STEP 3. Train the Model ----
# Create a 70%/30% data split for the training and testing datasets
# respectively (p = 0.7 is the proportion of rows placed in training).
# NOTE(review): this comment previously said 80%/20%, which does not match
# p = 0.7. Confirm which split was intended before changing the code.
# The seed is fixed so that the same rows are selected on every run.
set.seed(7)
train_index <- createDataPartition(Satellite$classes,
                                   p = 0.7, list = FALSE)
# Rows listed in train_index form the training set; all remaining rows form
# the testing set.
satellite_training <- Satellite[train_index, ]
satellite_testing <- Satellite[-train_index, ]

# Re-seed before training so that the cross-validation folds are reproducible.
set.seed(7)
# Resampling scheme: cross-validation with 10 folds.
train_control <- trainControl(method = "cv", number = 10)
# Fit an LDA classifier that predicts `classes` from all other columns and is
# evaluated on "Accuracy".
satellite_model_lda <- train(classes ~ ., data = satellite_training,
                             method = "lda", metric = "Accuracy",
                             trControl = train_control)

# We print a summary of what caret has done
print(satellite_model_lda)

# We then print the details of the model that has been created
print(satellite_model_lda$finalModel)

# STEP 4. Test the Model ----
# We can test the model by predicting the class of every row in the testing
# dataset and comparing the predictions against the known classes.
# NOTE(review): the seed below is presumably not needed for the prediction
# itself — confirm before removing it.
set.seed(9)
predictions <- predict(satellite_model_lda, newdata = satellite_testing)
confusionMatrix(predictions, satellite_testing$classes)

# STEP 5. Save and Load your Model ----
# Saving a model into a file allows you to load it later and use it to make
# predictions. Saved models can be loaded by calling the `readRDS()` function.

# saveRDS() does not create missing folders, so make sure that "./models"
# exists before writing. Nothing happens if the folder is already there.
dir.create("./models", showWarnings = FALSE, recursive = TRUE)
saveRDS(satellite_model_lda, "./models/saved_satellite_model_lda.rds")

# The saved model can then be loaded later as follows:
loaded_satellite_model_lda <- readRDS("./models/saved_satellite_model_lda.rds")
print(loaded_satellite_model_lda)

# Repeat the test from STEP 4 using the model that was read back from disk.
predictions_with_loaded_model <-
  predict(loaded_satellite_model_lda, newdata = satellite_testing)
confusionMatrix(predictions_with_loaded_model, satellite_testing$classes)


# STEP 6. Creating Functions in R ----

# Plumber requires functions. An example of the syntax for creating a function
# in R is:

# Syntax template only: a function is created by assigning `function(...)` to
# a name. This example never uses `arg` and always returns NULL.
name_of_function <- function(arg) {
  # Do something with the argument called `arg`
  NULL
}

# STEP 7. Make Predictions on New Data using the Saved Model ----
# We can also create and use our own data frame as follows:
# Build a one-row data frame whose columns are named x.1, x.2, ..., x.36.
# The values are listed in column order, nine per line.
to_be_predicted <- as.data.frame(as.list(setNames(
  c(
    50, 100, 100, 67, 79, 80, 86, 76, 34,    # x.1  to x.9
    20, 33, 34, 56, 78, 55, 24, 33, 20,      # x.10 to x.18
    19, 40, 60, 80, 54, 36, 78, 108, 117,    # x.19 to x.27
    98, 80, 9, 11, 22, 44, 33, 22, 40        # x.28 to x.36
  ),
  paste0("x.", seq_len(36))
)))

# The loaded model is then asked to classify that single new observation
predict(loaded_satellite_model_lda, newdata = to_be_predicted)

# STEP 8. Make predictions using the model through a function ----
# An alternative is to create a function and then use the function to make
# predictions

# Predict the class of new observations using the saved LDA model.
#
# Arguments:
#   arg_x.1, ..., arg_x.36: the values of the predictors x.1 to x.36, in that
#     order. Each value is converted with as.numeric(), so numbers supplied as
#     text (e.g. "86") are accepted as well as plain numbers.
#
# Returns:
#   The result of predict() applied to `loaded_satellite_model_lda` and the
#   data frame built from the arguments.
#
# Note: the function reads `loaded_satellite_model_lda` from the enclosing
# (global) environment, so the model must be loaded before the function is
# called.
predict_satellite <-
  function(arg_x.1, arg_x.2, arg_x.3, arg_x.4, arg_x.5, arg_x.6,
           arg_x.7, arg_x.8, arg_x.9, arg_x.10, arg_x.11, arg_x.12,
           arg_x.13, arg_x.14, arg_x.15, arg_x.16, arg_x.17, arg_x.18,
           arg_x.19, arg_x.20, arg_x.21, arg_x.22, arg_x.23, arg_x.24,
           arg_x.25, arg_x.26, arg_x.27, arg_x.28, arg_x.29, arg_x.30,
           arg_x.31, arg_x.32, arg_x.33, arg_x.34, arg_x.35, arg_x.36) {
    # Collect the arguments in predictor order. Evaluating them here also
    # raises the usual "argument is missing" error if one was not supplied.
    inputs <- list(
      arg_x.1, arg_x.2, arg_x.3, arg_x.4, arg_x.5, arg_x.6,
      arg_x.7, arg_x.8, arg_x.9, arg_x.10, arg_x.11, arg_x.12,
      arg_x.13, arg_x.14, arg_x.15, arg_x.16, arg_x.17, arg_x.18,
      arg_x.19, arg_x.20, arg_x.21, arg_x.22, arg_x.23, arg_x.24,
      arg_x.25, arg_x.26, arg_x.27, arg_x.28, arg_x.29, arg_x.30,
      arg_x.31, arg_x.32, arg_x.33, arg_x.34, arg_x.35, arg_x.36
    )

    # Name the columns x.1 ... x.36, matching the column names used when the
    # example data frame for this model is built by hand.
    names(inputs) <- paste0("x.", seq_along(inputs))

    # Create a data frame using the arguments, forcing every column to be
    # numeric so that text input does not produce character columns.
    to_be_predicted <- as.data.frame(lapply(inputs, as.numeric))

    # Make a prediction based on the data frame
    predict(loaded_satellite_model_lda, to_be_predicted)
  }


# From here on, predict_satellite() can be used in place of a direct call to
# predict(). The 36 values are passed in predictor order (x.1 to x.36).

predict_satellite(
  86, 148, 72, 35, 100, 33, 78, 50, 80,
  102, 34, 56, 74, 87, 90, 11, 84, 56,
  78, 90, 44, 34, 24, 78, 88, 100, 43,
  22, 11, 30, 54, 66, 44, 33, 20, 98
)

# Second example: the values 1, 2, ..., 36 supplied as the 36 positional
# arguments.
do.call(predict_satellite, as.list(as.numeric(1:36)))


# [OPTIONAL] **Deinitialization: Create a snapshot of the R environment ----
# Lastly, as a follow-up to the initialization step, record the packages
# installed and their sources in the lockfile so that other team-members can
# use renv::restore() to re-install the same package version in their local
# machine during their initialization step.
# renv::snapshot() # nolint