computational-metabolomics
diff --git a/‎DESCRIPTION‎
Lines changed: 1 addition & 0 deletions b/‎DESCRIPTION‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎NAMESPACE‎
Lines changed: 3 additions & 0 deletions b/‎NAMESPACE‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎R/hca_class.R‎
Lines changed: 113 additions & 0 deletions b/‎R/hca_class.R‎
Lines changed: 113 additions & 0 deletions
diff --git a/‎man/HCA-class.Rd‎
Lines changed: 10 additions & 0 deletions b/‎man/HCA-class.Rd‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎man/hca_dendrogram-class.Rd‎
Lines changed: 10 additions & 0 deletions b/‎man/hca_dendrogram-class.Rd‎
Lines changed: 10 additions & 0 deletions
diff --git a/‎man/structToolbox.Rd‎
Lines changed: 1 addition & 1 deletion b/‎man/structToolbox.Rd‎
Lines changed: 1 addition & 1 deletion
@@ -35,6 +35,7 @@ Collate:
     'ggplot_theme_pub.R'
     'glog_class.R'
     'grid_search_1d_class.R'
+    'hca_class.R'
     'kfold_xval_class.R'
     'kfold_xval_charts.R'
     'knn_impute_class.R'
 
@@ -1,6 +1,7 @@
 # Generated by roxygen2: do not edit by hand
 
 export(ANOVA)
+export(HCA)
 export(HSD)
 export(HSDEM)
 export(PCA)
@@ -35,6 +36,7 @@ export(fs_line)
 export(glog_transform)
 export(grid_search_1d)
 export(gs_line)
+export(hca_dendrogram)
 export(kfold_xval)
 export(kfoldxcv_grid)
 export(kfoldxcv_metric)
@@ -84,6 +86,7 @@ exportMethods(run)
 import(agricolae)
 import(car)
 import(emmeans)
+import(ggdendro)
 import(ggplot2)
 import(ggthemes)
 import(grid)
 
@@ -0,0 +1,113 @@
+#' HCA method class
+#'
+#' Hierarchical Cluster Analysis (HCA) method class. When applied to a dataset
+#' a pairwise distance object is computed from the data with \code{dist} and
+#' a hierarchical clustering of that object is computed with \code{hclust}.
+#'
+#' Input parameters:
+#' \describe{
+#'   \item{dist_method}{distance measure passed to \code{dist}
+#'   (default "euclidean")}
+#'   \item{cluster_method}{agglomeration method passed to \code{hclust}
+#'   (default "complete")}
+#'   \item{minkowski_power}{value passed to \code{dist} as \code{p}
+#'   (default 2)}
+#'   \item{factor_name}{name of the sample_meta column stored alongside the
+#'   clustering for use when plotting}
+#' }
+#'
+#' Outputs:
+#' \describe{
+#'   \item{dist_matrix}{the object returned by \code{dist}}
+#'   \item{hclust}{the object returned by \code{hclust}}
+#'   \item{factor_df}{data.frame holding the selected factor column}
+#' }
+#'
+#' @export HCA
+HCA<-setClass(
+    "HCA",
+    contains=c('method'),
+    slots=c(
+        # INPUTS
+        params.dist_method='enum',
+        params.cluster_method='enum',
+        params.minkowski_power='numeric',
+        params.factor_name='character',
+        # OUTPUTS
+        outputs.dist_matrix='entity',
+        outputs.hclust='entity',
+        outputs.factor_df='data.frame'
+    ),
+    prototype = list(name='Hierarchical Cluster Analysis',
+        description='Applies hierarchical clustering to a dataset.',
+        # NOTE(review): the clustering uses all columns of the data jointly;
+        # confirm that "univariate" is the intended value here.
+        type="univariate",
+        predicted='dist_matrix',
+
+
+        params.dist_method=enum(name='Distance method',
+            value='euclidean',
+            type='character',
+            description='The distance measure to be used. This must be one of "euclidean", "maximum", "manhattan", "canberra", "binary" or "minkowski"',
+            list=c("euclidean", "maximum", "manhattan", "canberra", "binary", "minkowski")
+        ),
+        params.cluster_method=enum(name='Clustering method',
+            value='complete',
+            type='character',
+            description='The agglomeration method to be used. This should be one of "ward.D", "ward.D2", "single", "complete", "average", "mcquitty", "median" or "centroid"',
+            list=c("ward.D", "ward.D2", "single", "complete", "average", "mcquitty", "median", "centroid")
+        ),
+        # Without a prototype value this slot is numeric(0), which is then
+        # handed to dist() as p. Use 2, the default p of stats::dist.
+        params.minkowski_power=2,
+
+        outputs.dist_matrix=entity(name='distance structure',
+            type='dist',
+            description='An object containing pairwise distance information between samples'
+        ),
+        outputs.hclust=entity(name='clustering object',
+            type='hclust',
+            description='An object of class hclust which describes the tree produced by the clustering process'
+        )
+    )
+)
+
+#' @export
+setMethod(f="method.apply",
+    signature=c("HCA",'dataset'),
+    definition=function(M,D)
+    {
+        # Applies the HCA method M to dataset D and returns M with its
+        # dist_matrix, hclust and factor_df outputs populated.
+
+        # distance object for the data, using the configured distance method
+        M$dist_matrix <- dist(D$data, method = M$dist_method, diag = FALSE, upper = FALSE, p = M$minkowski_power)
+
+        # hierarchical clustering of the distance object
+        M$hclust <- hclust(M$dist_matrix, method = M$cluster_method, members = NULL)
+
+        # keep the chosen factor column together with the original row order
+        # and the data row names, so the chart can relate leaves to groups
+        meta <- D$sample_meta[, M$factor_name, drop = FALSE]
+        meta$orig_order <- seq_len(nrow(meta))
+        meta$label <- rownames(D$data)
+        M$factor_df <- meta
+        return(M)
+    }
+)
+
+
+
+#' hca_dendrogram class
+#'
+#' Chart class used to draw a dendrogram from an HCA object.
+#'
+#' @export hca_dendrogram
+#' @import ggdendro
+#' @include hca_class.R
+hca_dendrogram <- setClass(
+    Class = "hca_dendrogram",
+    contains = c("chart")
+)
+
+#' @export
+setMethod(f="chart.plot",
+    signature=c("hca_dendrogram",'HCA'),
+    definition=function(obj,dobj)
+    {
+        # Draws the dendrogram stored in dobj$hclust and returns the plot.
+        # Leaf points are coloured by the first column of dobj$factor_df.
+
+        # segment and label tables for plotting the tree
+        hcdata <- dendro_data(dobj$hclust)
+
+        # one row per leaf, with its plotting position and its label
+        leaves <- label(hcdata)
+
+        # Look up the group of every leaf by its label. The previous code
+        # reordered the leaf table using an ordering computed on factor_df and
+        # discarded the reordered factor_df, so groups were attached to the
+        # wrong leaves. as.character() guards against factor-typed labels.
+        factor_df <- dobj$factor_df
+        idx <- match(as.character(leaves$label), as.character(factor_df$label))
+        leaves$group <- factor_df[idx, 1]
+
+        g <- ggplot() +
+            geom_segment(data=segment(hcdata), aes(x=x, y=y, xend=xend, yend=yend)) +
+            geom_point(data=leaves, aes(x=x, y=y,color=group))+
+            structToolbox:::scale_colour_Publication() +
+            structToolbox:::theme_Publication(base_size = 12) +
+            labs(color = colnames(factor_df)[1]) +
+            theme(axis.title.x=element_blank(),
+                axis.text.x=element_blank(),
+                axis.ticks.x=element_blank()) +
+            ylab('dissimilarity')
+
+        return(g)
+    }
+)
+
+
+
+
+