-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathEDA.R
More file actions
53 lines (49 loc) · 1.59 KB
/
EDA.R
File metadata and controls
53 lines (49 loc) · 1.59 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
# Exploratory Data Analysis
library(corrplot)
# Build a per-game team-season table from the raw team_season file and write
# it to updatedStatsFrom79OAndD.csv.
#
# NOTE(review): columns are selected by position throughout, so every index
# below depends on the column order of team_season.txt and on the steps that
# precede it -- confirm against the file header before reordering anything.
df <- read.csv("NBA Dataset/team_season.txt")

# Keep only seasons after 1978. A logical mask is used instead of
# `-which(...)`: when no row matches, `which()` returns integer(0) and
# `df[-integer(0), ]` selects zero rows, silently emptying the table.
# Rows whose year is NA are kept, exactly as `-which(...)` kept them.
keep_row <- is.na(df$year) | df$year > 1978
df <- df[keep_row, ]

# Drop the 17th and 32nd raw columns.
df <- df[c(1:16, 18:31, 33:36)]

# `subset` is the working copy; the name (which masks base::subset as a
# variable) is kept because the disabled code further down refers to it.
subset <- df

# Shooting ratios (made / attempted) for the o_* and d_* column families.
# The 3-point ratios are intentionally not computed here.
subset$o_fgp <- subset$o_fgm / subset$o_fga
subset$o_ftp <- subset$o_ftm / subset$o_fta
subset$d_fgp <- subset$d_fgm / subset$d_fga
subset$d_ftp <- subset$d_ftm / subset$d_fta

# Drop positions 4-7 and 18-21; the four ratio columns appended above sit at
# positions 35-38 and are kept.
# NOTE(review): presumably 4-7 and 18-21 are the raw made/attempted counts
# that the ratios replace -- confirm against the header.
subset <- subset[c(1:3, 8:17, 22:38)]

# Scale columns 4-22 by the number of games (won + lost). The divisor is
# computed once up front so it cannot change while columns are rewritten.
games_played <- subset$won + subset$lost
per_game_cols <- 4:22
subset[per_game_cols] <- lapply(
  subset[per_game_cols],
  function(stat) stat / games_played
)

# Remove positions 6 and 16 in one step (same result as dropping 6 and then
# dropping 15 from what remains).
subset <- subset[-c(6, 16)]

write.csv(subset, file = "updatedStatsFrom79OAndD.csv", row.names = FALSE)
# M <- cor(subset[4:16])
# corrplot(M, method="square")
# ====================================
#
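# # Exploratory Data Analysis -- disabled variant of the script above:
# # keeps seasons after 1998 and writes updatedStatsFrom99.csv.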
# library(corrplot)
# df <- read.csv("NBA Dataset/team_season.txt")
# df <- df[-which(df$year <= 1998),]
# df <- df[c(1:18,34:36)]
# #
# subset <- df
# # # subset <- df[c(1:17,19:20)]
# subset$o_fgp <- subset$o_fgm/subset$o_fga
# subset$o_3pp <- subset$o_3pm/subset$o_3pa
# subset$o_ftp <- subset$o_ftm/subset$o_fta
# # subset$d_fgp <- subset$d_fgm/subset$d_fga
# # # # subset$o_3pp <- subset$o_3pm/subset$o_3pa
# # subset$d_ftp <- subset$d_ftm/subset$d_fta
# #
# subset <- subset[c(1:3,8:15,18:24)]
# for(i in 4:13) {
# subset[i] <- subset[i]/(subset$won+subset$lost)
# }
# subset <- subset[-6]
# # subset <- subset[-15]
# #
# write.csv(subset, file="updatedStatsFrom99.csv", row.names = FALSE)
# # # M <- cor(subset[4:16])
# # # corrplot(M, method="square")