-
Notifications
You must be signed in to change notification settings - Fork 1
Expand file tree
/
Copy pathcluster_quality_vis.R
More file actions
52 lines (46 loc) · 1.93 KB
/
cluster_quality_vis.R
File metadata and controls
52 lines (46 loc) · 1.93 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
rm(list = ls())
cat("Loading packages...\n")
suppressMessages(library(readxl))
suppressMessages(library(dplyr))
suppressMessages(library(ggplot2))
suppressMessages(library(tidyr))
suppressMessages(library(stringr))
suppressMessages(library(viridis))
suppressMessages(library(ggpubr))
suppressMessages(library(ggrepel))
suppressMessages(library(viridis))
suppressMessages(library(EnhancedVolcano))
suppressMessages(library(gridExtra))
suppressMessages(library(survival))
suppressMessages(library(survminer))
suppressMessages(library(scales))
suppressMessages(library(rstatix))
suppressMessages(library(broom))
suppressMessages(library(boot))
suppressMessages(library(table1))
suppressMessages(library(colorspace))
suppressMessages(library(ggforce))
suppressMessages(library(ComplexHeatmap))
suppressMessages(library(circlize))
clst_dir <- "/mnt/sda1/OAI_Data/kmean_cluster_12252020/"
data_dir <- "/mnt/sda1/OAI_Data/data_summary/"
exp_id <- "kmean_pca_umap"
input_id <- "12112020_data_clean"
clean_co <- 'v25'
input_prefix <- paste(clst_dir, 'clean_', clean_co, '_', sep = "")
output_prefix <- paste(input_prefix, "final_", sep = "")
score_df <- as.data.frame(read_excel(paste(clst_dir, "kmeans_metric_pca_score_direct_knn2imp_", input_id, "241016_updated.xlsx", sep = "")))
colnames(score_df)[1] <- "cluster"
score_df$c <- as.numeric(str_split_fixed(score_df$cluster, "_C", n = 2)[,2])
print(head(score_df))
print(unique(score_df$cluster))
print(colnames(score_df))
gath_df <- gather(score_df, "metric", "value", colnames(score_df)[3:(ncol(score_df)-1)])
print(head(gath_df))
gg <- ggplot(gath_df, aes(x = c, y = value)) +
geom_point() +
geom_vline(xintercept = 4, linetype = "dotdash") +
facet_wrap(~metric, nrow = 3, scales = "free") +
labs(x = "Cluster", y = "Metric values", title = "Cluster quality") +
theme_bw()
ggsave(paste(clst_dir, "kmeans_metric_pca_score_direct_knn2imp_", input_id, "241016_updated.png", sep = ""), dpi = 300, width = 9, height = 6)