StatFunGen
diff --git a/‎.DS_Store‎
-6 KB b/‎.DS_Store‎
-6 KB
diff --git a/‎R/colocboost.R‎
Lines changed: 14 additions & 14 deletions b/‎R/colocboost.R‎
Lines changed: 14 additions & 14 deletions
diff --git a/‎R/colocboost_init.R‎
Lines changed: 9 additions & 9 deletions b/‎R/colocboost_init.R‎
Lines changed: 9 additions & 9 deletions
diff --git a/‎R/colocboost_onecausal.R‎ ‎R/colocboost_one_causal.R‎R/colocboost_onecausal.R renamed to R/colocboost_one_causal.R
Lines changed: 54 additions & 54 deletions b/‎R/colocboost_onecausal.R‎ ‎R/colocboost_one_causal.R‎R/colocboost_onecausal.R renamed to R/colocboost_one_causal.R
Lines changed: 54 additions & 54 deletions
@@ -30,7 +30,7 @@
 #' @param dict_sumstatLD A L by 2 matrix of dictionary for \code{sumstat} and \code{LD} if there exist subsets of traits corresponding to the same sumstat.
 #'                  The first column should be 1:L for L sumstat The second column should be the index of \code{LD} corresponding to the sumstat.
 #'                  The innovation: do not provide the same matrix in \code{LD} to reduce the computational burden.
-#' @param traits_names The names of traits, which has the same order for Y.
+#' @param outcome_names The names of outcomes, in the same order as Y.
 #' @param target_idx The index of the target trait if perform targeted ColocBoost
 #' @param effect_est Matrix of snp regression coefficients (i.e. regression beta values) in the genomic region
 #' @param effect_se Matrix of standard errors associated with the beta values
@@ -108,7 +108,7 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
                        ###### - index dict for X match multiple Y / LD match multiple sumstat
                        dict_YX = NULL, # Y index for 1st column, X index for 2nd column
                        dict_sumstatLD = NULL, # sumstat index for 1st column, LD index for 2nd column
-                       traits_names = NULL, # the names of traits
+                       outcome_names = NULL, # the names of outcomes
                        ###### - HyPrColoc input
                        effect_est = NULL, # same as HyPrColoc, beta hat matrix: with rowname of snp names
                        effect_se = NULL, # same as HyPrColoc, sebeta hat matrix with rowname of snp names
@@ -140,7 +140,7 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
                        median_abs_corr = NULL,
                        between_purity = 0.8, # minimum LD between two csets
                        tol = 1e-9, # tol for LD
-                       merging = TRUE, # if merge two sets for one trait
+                       merging = TRUE, # if merge two sets for one outcome
                        coverage_singlew = 0.8,
                        lambda = 0.5, # the ratio for z^2 and z in weight penalty
                        lambda_target = 1,
@@ -244,10 +244,10 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
                     for (i in 1:length(Y)){
                         tmp <- unique(dict_YX[dict_YX[,1]==i,2])
                         if (length(tmp) == 0){
-                            warning(paste("Error: You don't provide matched X for trait", i))
+                            warning(paste("Error: You don't provide matched X for outcome", i))
                             return(NULL)
                         } else if (length(tmp) != 1){
-                            warning(paste("Error: You provide different matched X for trait", i))
+                            warning(paste("Error: You provide different matched X for outcome", i))
                             return(NULL)
                         } else {
                             yx_dict[i] <- tmp
@@ -338,7 +338,7 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
         if ( !is.null(sumstat) ){
             if (is.data.frame(sumstat)){ sumstat <- list(sumstat) }
             if (!is.list(sumstat)){
-              warning("Error: Input sumstat must be the list containing summary level data for all traits!")
+              warning("Error: Input sumstat must be the list containing summary level data for all outcomes!")
               return(NULL)
             }
             # --- check if variants names in summary data
@@ -359,7 +359,7 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
 
           # if no LD input, set diagonal matrix to LD
           warning("Providing the LD for summary statistics data is highly recommended. ",
-                  "Without LD, only a single iteration will be performed under the assumption of one causal variant per trait. ",
+                  "Without LD, only a single iteration will be performed under the assumption of one causal variant per outcome. ",
                   "Additionally, the purity of CoS cannot be evaluated!")
 
           p.sumstat <- sapply(keep.snp.sumstat, length)
@@ -431,7 +431,7 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
             warning("Providing the sample size (n), or even a rough estimate of n, ",
                     "is highly recommended. Without n, the implicit assumption is ",
                     "n is large (Inf) and the effect sizes are small (close to zero).",
-                    "Trait ", paste(p_no, collapse = ","), " in sumstat don't contain 'n'!")
+                    "outcome ", paste(p_no, collapse = ","), " in sumstat don't contain 'n'!")
         }
 
         Z <- N_sumstat <- Var_y <- SeBhat <- vector(mode='list', length=length(sumstat))
@@ -500,20 +500,20 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
     min_variants <- min(sapply(keep.snps, length))
     if (min_variants < 100){
       warning("Warning message about the number of variants.\n",
-              "The smallest number of variants across traits is ", min_variants, " <100. ",
+              "The smallest number of variants across outcomes is ", min_variants, " <100. ",
               "If this is what you expected, this is not a problem.",
               "If this is not you expected, please check input data.")
     }
     if (length(overlapp_snps)<=1){
-      warning("Error: No or only 1 overlapping variants were found across all traits, colocalization cannot be performed. ",
-           "Please verify the variant names across different traits.")
+      warning("Error: No or only 1 overlapping variants were found across all outcomes, colocalization cannot be performed. ",
+           "Please verify the variant names across different outcomes.")
       return(NULL)
     } else if ( (length(overlapp_snps)/mean_variants)<0.1 ){
       warning("Warning message about the overlapped variants.\n",
-              "The average number of variants across traits is ", mean_variants, 
+              "The average number of variants across outcomes is ", mean_variants, 
               ". But only ", length(overlapp_snps), " number of variants overlapped (<10%).\n",
               "If this is what you expected, this is not a problem.\n",
-              "If this is not you expected, please check if the variant name matched across traits.")
+              "If this is not you expected, please check if the variant name matched across outcomes.")
     }
     cb_data <- colocboost_init_data(X = X, Y = Y, dict_YX = yx_dict,
                                     Z = Z, LD = LD, N_sumstat = N_sumstat, dict_sumstatLD = sumstatLD_dict,
@@ -550,7 +550,7 @@ colocboost <- function(X = NULL, Y = NULL, # individual data
                                    coloc_thres = coloc_thres,
                                    LD_obj = LD_obj,
                                    target_idx = target_idx,
-                                   traits_names = traits_names)
+                                   outcome_names = outcome_names)
 
     # --- post-processing of the colocboost updates
     message("Starting post-hoc analyses and results summary.")
 
@@ -51,7 +51,7 @@ colocboost_init_data <- function(X, Y, dict_YX,
     }
     if (target_variants & !is.null(target_idx)){
         if (target_idx > length(keep.snps)){
-          stop("Target trait index is over the total number of traits! please check!")
+          stop("Target outcome index is over the total number of outcomes! please check!")
         }
         keep.snp.names <- keep.snps[[dict[target_idx]]]
         if (overlap_varaints){
@@ -122,7 +122,7 @@ colocboost_init_data <- function(X, Y, dict_YX,
                 tmp$X <- x_stand
             }
             cb_data$data[[flag]] <- tmp
-            names(cb_data$data)[flag] <- paste0("ind_trait_",i)
+            names(cb_data$data)[flag] <- paste0("ind_outcome_",i)
             flag = flag + 1
         }
         cb_data$dict = c(dict_YX_final)
@@ -223,7 +223,7 @@ colocboost_init_data <- function(X, Y, dict_YX,
 
             }
             cb_data$data[[flag]] <- tmp
-            names(cb_data$data)[flag] <- paste0("sumstat_trait_",i)
+            names(cb_data$data)[flag] <- paste0("sumstat_outcome_",i)
             flag = flag + 1
 
         }
@@ -337,7 +337,7 @@ colocboost_init_para <- function(cb_data, cb_model,tau=0.01,
                                  multicorrection_cut=1,
                                  func_multicorrection = "lfdr",
                                  LD_obj = FALSE,
-                                 traits_names = NULL,
+                                 outcome_names = NULL,
                                  target_idx = NULL){
 
 
@@ -346,16 +346,16 @@ colocboost_init_para <- function(cb_data, cb_model,tau=0.01,
     N <- sapply(cb_data$data, function(dt) dt$N)
     # - number of SNPs
     P <- if (!is.null(cb_data$data[[1]]$X)) ncol(cb_data$data[[1]]$X) else length(cb_data$data[[1]]$XtY)
-    # - number of traits
+    # - number of outcomes
     L <- length(cb_data$data)
     # - initial profile loglikelihood
     profile_loglike <- sum(sapply(1:length(cb_model), function(i) tail(cb_model[[i]]$profile_loglike_each, n=1)))
-    # - check initial update trait
+    # - check initial update outcome
     stop_null <- sapply(cb_model, function(tmp) min(tmp$multi_correction_univariate))
     pos_stop <- which(stop_null >= multicorrection_cut)
     update_y = rep(1, L)
     if (length(pos_stop) != 0){ update_y[pos_stop] <- 0 } else {pos_stop = NULL}
-    if (!is.null(traits_names)){ traits_names = traits_names } else {traits_names = paste0("Y", 1:L)}
+    if (!is.null(outcome_names)){ outcome_names = outcome_names } else {outcome_names = paste0("Y", 1:L)}
 
     cb_model_para = list("L" = L,
                          "P" = P,
@@ -371,8 +371,8 @@ colocboost_init_para <- function(cb_data, cb_model,tau=0.01,
                          "true_stop" = pos_stop,
                          "LD_obj" = LD_obj,
                          "real_update_jk" = c(),
-                         "traits_names" = traits_names,
-                         "snp_names" = cb_data$snp.names,
+                         "outcome_names" = outcome_names,
+                         "variables" = cb_data$snp.names,
                          "target_idx" = target_idx)
     class(cb_model_para) = "colocboost"
 
 
@@ -1,25 +1,25 @@
 
 
-colocboost_onecausal <- function(cb_model, cb_model_para, cb_data,
-                                 jk_equiv_cor = 0.8,
-                                 jk_equiv_loglik = 1,
-                                 tau = 0.01,
-                                 decayrate = 1,
-                                 func_prior = "z2z",
-                                 lambda = 0.5,
-                                 lambda_target = 1,
-                                 LD_obj = FALSE){
+colocboost_one_causal <- function(cb_model, cb_model_para, cb_data,
+                                  jk_equiv_cor = 0.8,
+                                  jk_equiv_loglik = 1,
+                                  tau = 0.01,
+                                  decayrate = 1,
+                                  func_prior = "z2z",
+                                  lambda = 0.5,
+                                  lambda_target = 1,
+                                  LD_obj = FALSE){
 
   if (jk_equiv_cor != 0){
-    cb_obj <- colocboost_oneiteration(cb_model, cb_model_para, cb_data,
-                                      jk_equiv_cor = jk_equiv_cor,
-                                      jk_equiv_loglik = jk_equiv_loglik,
-                                      tau = tau,
-                                      decayrate = decayrate,
-                                      func_prior = func_prior,
-                                      lambda = lambda,
-                                      lambda_target = lambda_target,
-                                      LD_obj = LD_obj)
+    cb_obj <- colocboost_one_iteration(cb_model, cb_model_para, cb_data,
+                                       jk_equiv_cor = jk_equiv_cor,
+                                       jk_equiv_loglik = jk_equiv_loglik,
+                                       tau = tau,
+                                       decayrate = decayrate,
+                                       func_prior = func_prior,
+                                       lambda = lambda,
+                                       lambda_target = lambda_target,
+                                       LD_obj = LD_obj)
   } else {
     cb_obj <- colocboost_diagLD(cb_model, cb_model_para, cb_data,
                                 jk_equiv_cor = jk_equiv_cor,
@@ -39,24 +39,24 @@ colocboost_onecausal <- function(cb_model, cb_model_para, cb_data,
 
 
 # under one causal per trait assumption with one iteration
-colocboost_oneiteration <- function(cb_model, cb_model_para, cb_data,
-                                    jk_equiv_cor = 0.8,
-                                    jk_equiv_loglik = 1,
-                                    tau = 0.01,
-                                    decayrate = 1,
-                                    func_prior = "z2z",
-                                    lambda = 0.5,
-                                    lambda_target = 1,
-                                    LD_obj = FALSE){
+colocboost_one_iteration <- function(cb_model, cb_model_para, cb_data,
+                                     jk_equiv_cor = 0.8,
+                                     jk_equiv_loglik = 1,
+                                     tau = 0.01,
+                                     decayrate = 1,
+                                     func_prior = "z2z",
+                                     lambda = 0.5,
+                                     lambda_target = 1,
+                                     LD_obj = FALSE){
 
 
     if (sum(cb_model_para$update_y == 1) != 0){
 
       ######## - some traits updated
       # - step 1: check update clusters
-      real_update <- boost_check_update_jk_onecausal(cb_model, cb_model_para, cb_data,
-                                                     jk_equiv_cor = jk_equiv_cor,
-                                                     jk_equiv_loglik = jk_equiv_loglik)
+      real_update <- boost_check_update_jk_one_causal(cb_model, cb_model_para, cb_data,
+                                                      jk_equiv_cor = jk_equiv_cor,
+                                                      jk_equiv_loglik = jk_equiv_loglik)
 
       # - step 2: boost update
       for (i_update in 1:length(real_update)){
@@ -66,13 +66,13 @@ colocboost_oneiteration <- function(cb_model, cb_model_para, cb_data,
           cb_model_para$update_status <- cbind(cb_model_para$update_status, as.matrix(real_update[[i_update]]$update_status))
           cb_model_para$real_update_jk <- rbind(cb_model_para$real_update_jk, real_update[[i_update]]$real_update_jk)
           # - update cb_model
-          cb_model <- boost_joint(cb_model, cb_model_para, cb_data,
-                                  tau = tau,
-                                  decayrate = decayrate,
-                                  func_prior = func_prior,
-                                  lambda = lambda,
-                                  lambda_target = lambda_target,
-                                  LD_obj = LD_obj)
+          cb_model <- colocboost_update(cb_model, cb_model_para, cb_data,
+                                        tau = tau,
+                                        decayrate = decayrate,
+                                        func_prior = func_prior,
+                                        lambda = lambda,
+                                        lambda_target = lambda_target,
+                                        LD_obj = LD_obj)
       }
     }
     # -- remove redundant parameters
@@ -92,10 +92,10 @@ colocboost_oneiteration <- function(cb_model, cb_model_para, cb_data,
 
 
 
-boost_check_update_jk_onecausal <- function(cb_model, cb_model_para, cb_data,
-                                            prioritize_jkstar = TRUE, 
-                                            jk_equiv_cor = 0.8,
-                                            jk_equiv_loglik = 1){
+boost_check_update_jk_one_causal <- function(cb_model, cb_model_para, cb_data,
+                                             prioritize_jkstar = TRUE, 
+                                             jk_equiv_cor = 0.8,
+                                             jk_equiv_loglik = 1){
 
     pos.update <- which(cb_model_para$update_y == 1)
     update_jk <- rep(NA, cb_model_para$L+1)
@@ -195,9 +195,9 @@ colocboost_diagLD <- function(cb_model, cb_model_para, cb_data,
     cb_model_para$jk <- rbind(cb_model_para$jk, update_jk)
     cb_model_para$update_status <- cbind(cb_model_para$update_status, as.matrix(update_status))
     cb_model_para$real_update_jk <- rbind(cb_model_para$real_update_jk, real_update_jk)
-    cb_model <- boost_joint(cb_model, cb_model_para, cb_data,
-                            tau = tau, decayrate = decayrate, func_prior = func_prior,
-                            lambda = lambda, lambda_target = lambda_target, LD_obj = LD_obj)
+    cb_model <- colocboost_update(cb_model, cb_model_para, cb_data,
+                                  tau = tau, decayrate = decayrate, func_prior = func_prior,
+                                  lambda = lambda, lambda_target = lambda_target, LD_obj = LD_obj)
 
   }
 
@@ -225,9 +225,9 @@ colocboost_diagLD <- function(cb_model, cb_model_para, cb_data,
         cb_model_para$update_temp <- list("update_status" = update_status, 
                                           "real_update_jk" = real_update_jk)
         # - update cb_model
-        cb_model_tmp <- boost_joint(cb_model_tmp, cb_model_para, cb_data,
-                                    tau = tau, decayrate = decayrate, func_prior = func_prior,
-                                    lambda = lambda, lambda_target = lambda_target, LD_obj = LD_obj)
+        cb_model_tmp <- colocboost_update(cb_model_tmp, cb_model_para, cb_data,
+                                          tau = tau, decayrate = decayrate, func_prior = func_prior,
+                                          lambda = lambda, lambda_target = lambda_target, LD_obj = LD_obj)
         weights <- rbind(weights, cb_model_tmp[[iy]]$weights_path)
     }
     ###### overlap weights
@@ -275,13 +275,13 @@ colocboost_diagLD <- function(cb_model, cb_model_para, cb_data,
       cb_model_para$update_status <- cbind(cb_model_para$update_status, as.matrix(real_update[[i_update]]$update_status))
       cb_model_para$real_update_jk <- rbind(cb_model_para$real_update_jk, real_update[[i_update]]$real_update_jk)
       # - update cb_model
-      cb_model <- boost_joint(cb_model, cb_model_para, cb_data,
-                              tau = tau,
-                              decayrate = decayrate,
-                              func_prior = func_prior,
-                              lambda = lambda,
-                              lambda_target = lambda_target,
-                              LD_obj = LD_obj)
+      cb_model <- colocboost_update(cb_model, cb_model_para, cb_data,
+                                    tau = tau,
+                                    decayrate = decayrate,
+                                    func_prior = func_prior,
+                                    lambda = lambda,
+                                    lambda_target = lambda_target,
+                                    LD_obj = LD_obj)
     }
   }
   # -- remove redundant parameters