Needs more tests.

snoweye · snoweye · commit 04c23200bba5 · 2017-06-18T12:12:47.000-04:00
diff --git a/R/00_pmclust_reduceK.r b/R/00_pmclust_reduceK.r
@@ -1,94 +1,100 @@
 ### For automatically reducing K methods.
 
-pmclust.reduceK <- function(X = NULL, K = 2, MU = NULL,
-    algorithm = .PMC.CT$algorithm, RndEM.iter = .PMC.CT$RndEM.iter,
-    CONTROL = .PMC.CT$CONTROL, method.own.X = .PMC.CT$method.own.X,
-    rank.own.X = .pbd_env$SPMD.CT$rank.source, comm = .pbd_env$SPMD.CT$comm){
-  if(algorithm[1] == "kmeans"){
+### Dispatch on algorithm[1] to the gbd/spmd or dmat K-reduction routine. X is
+### not an argument: it should be set beforehand (.pmclustEnv or so), as in pmclust().
+pmclust.reduceK <- function(K = 2, algorithm = .PMC.CT$algorithm){
+  if(any(algorithm[1] %in% c("kmeans", "kmeans.dmat"))){
     stop("kmeans/pkmeans is not supported in reduceK.")
   }
 
-  # Run through original pmclust().
-  ret <- pmclust(X = X, K = K, MU = MU, algorithm = algorithm,
-                 RndEM.iter = RndEM.iter, CONTROL = CONTROL,
-                 method.own.X = method.own.X, rank.own.X = rank.own.X,
-                 comm = comm)
+  if(algorithm[1] %in% .PMC.CT$algorithm.gbd){
+    ret <- pmclust.reduce.spmd(K = K, algorithm = algorithm)
+  } else if(algorithm[1] %in% .PMC.CT$algorithm.dmat){
+    ret <- pmclust.reduce.dmat(K = K, algorithm = algorithm)
+  } else{
+    comm.stop("The algorithm is not found.")
+  }
+
+  ret
+} # End of pmclust.reduceK().
+
+
+pmclust.reduce.spmd <- function(K = 2, algorithm = .PMC.CT$algorithm){
+  # gbd/spmd K-reduction: get an initial start, then drop clusters while fitting fails.
+  PARAM.org <- set.global(K = K)
+  PARAM.org <- try(initial.em(PARAM.org))
+
+  # Retry until the initialization succeeds. Warning: this may never terminate!
+  repeat{
+    if(inherits(PARAM.org, "try-error")){
+      PARAM.org <- set.global(K = K)
+      PARAM.org <- try(initial.em(PARAM.org))
+    } else{
+      break
+    }
+  }
+
+  # Update steps.
+  method.step <- switch(algorithm[1],
+                        "em" = em.step,
+                        "aecm" = aecm.step,
+                        "apecm" = apecm.step,
+                        "apecma" = apecma.step,
+                        NULL)
+  if(comm.all(is.null(method.step))){
+    comm.stop("Algorithm is not found.")
+  }
+  PARAM.new <- try(method.step(PARAM.org))
+  em.update.class()
+  N.CLASS <- get.N.CLASS(K)
 
-  # Repeat if error occurs.
+
+  # Reduce K while the step errors or reports convergence code 99, and K > 1.
   repeat{
-    if(ret$check$convergence == 99 && K > 1){
+    failed <- inherits(PARAM.new, "try-error")
+    if((failed || .pmclustEnv$CHECK$convergence == 99) && K > 1){
+      if(failed) PARAM.new <- PARAM.org  # Step failed: reuse its valid input.
       # Drop specific i.k if available or
       # drop the smallest class or
       # drop the class with the smallest eta among all small classes or
       # drop all classes with 0 elements.
-      PARAM.new <- ret$param
       if(.pmclustEnv$CONTROL$stop.at.fail && .pmclustEnv$FAIL.i.k > 0){
         i.k <- .pmclustEnv$FAIL.i.k
       } else{
-        i.k <- which(ret$n.class == min(ret$n.class))
+        i.k <- which(N.CLASS == min(N.CLASS))
       }
-      if(i.k > 1 && min(ret$n.class) > 0){
+      if(length(i.k) > 1 && min(N.CLASS) > 0){
         i.k <- i.k[which.min(PARAM.new$ETA[i.k])]
       }
       K <- K - length(i.k)
+      comm.cat("- Reduce: ", K, "\n")
 
       # Initial global storage.
-      if(algorithm[1] %in% .PMC.CT$algorithm.gbd){
-        PARAM.org <- set.global(K = K)
-      } else if(algorithm[1] %in% .PMC.CT$algorithm.dmat){
-        PARAM.org <- set.global.dmat(K = K)
-      } else{
-        comm.stop("The algorithm is not found.")
-      }
+      PARAM.org <- set.global(K = K)
 
       # Replacing PARAM.org by previous PARAM.new.
-      PARAM.org$ETA <- PARAM.new$ETA[-i.k] / sum(PARAM.org$ETA[-i.k])
+      PARAM.org$ETA <- PARAM.new$ETA[-i.k] / sum(PARAM.new$ETA[-i.k])
       PARAM.org$log.ETA <- log(PARAM.org$ETA)
       PARAM.org$MU <- matrix(PARAM.new$MU[, -i.k], ncol = K)
       PARAM.org$SIGMA <- PARAM.new$SIGMA[-i.k]
 
-      # Need one e-step to initial storage.
-      if(algorithm[1] %in% .PMC.CT$algorithm.gbd){
-        e.step.spmd(PARAM.org)
-      } else if(algorithm[1] %in% .PMC.CT$algorithm.dmat){
-        e.step.dmat(PARAM.org)
-      } else{
-        comm.stop("The algorithm is not found.")
-      }
-
       # Update steps.
-      method.step <- switch(algorithm[1],
-                            "em" = em.step,
-                            "aecm" = aecm.step,
-                            "apecm" = apecm.step,
-                            "apecma" = apecma.step,
-                            NULL)
-      PARAM.new <- method.step(PARAM.org)
-
-      # Obtain classifications.
+      e.step.spmd(PARAM.org)
+      PARAM.new <- try(method.step(PARAM.org))
       em.update.class()
-
-      # Get class numbers.
-      if(algorithm[1] %in% .PMC.CT$algorithm.gbd){
-        N.CLASS <- get.N.CLASS(K)
-      } else if(algorithm[1] %in% .PMC.CT$algorithm.dmat){
-        N.CLASS <- get.N.CLASS.dmat(K)
-      } else{
-        comm.stop("The algorithm is not found.")
-      }
-
-
-      # For return.
-      ret <- list(algorithm = algorithm[1],
-                  param = PARAM.new,
-                  class = .pmclustEnv$CLASS.spmd,
-                  n.class = N.CLASS,
-                  check = .pmclustEnv$CHECK)
+      N.CLASS <- get.N.CLASS(K)
     } else{
       break
     }
   }
 
+  # Return the algorithm name, parameters, classification, class sizes, and checks.
+  ret <- list(algorithm = algorithm[1],
+              param = PARAM.new,
+              class = .pmclustEnv$CLASS.spmd,
+              n.class = N.CLASS,
+              check = .pmclustEnv$CHECK)
+
   ret
-} # end of pmclust.reduceK().
+} # End of pmclust.reduce.spmd().
 
diff --git a/R/00_pmclust_reduceK_dmat.r b/R/00_pmclust_reduceK_dmat.r
@@ -0,0 +1,81 @@
+### A dmat version for automatically reducing K methods.
+
+pmclust.reduce.dmat <- function(K = 2, algorithm = .PMC.CT$algorithm){
+  # dmat K-reduction: get an initial start, then drop clusters while fitting fails.
+  PARAM.org <- set.global.dmat(K = K)
+  PARAM.org <- try(initial.em.dmat(PARAM.org))
+
+  # Retry until the initialization succeeds. Warning: this may never terminate!
+  repeat{
+    if(inherits(PARAM.org, "try-error")){
+      PARAM.org <- set.global.dmat(K = K)
+      PARAM.org <- try(initial.em.dmat(PARAM.org))
+    } else{
+      break
+    }
+  }
+
+  # Update steps.
+  method.step <- switch(algorithm[1],
+                        "em.dmat" = em.step,  # NOTE(review): confirm em.step (not a dmat variant) is intended.
+                        # "aecm.dmat" = aecm.step,
+                        # "apecm.dmat" = apecm.step,
+                        # "apecma.dmat" = apecma.step,
+                        NULL)
+  if(comm.all(is.null(method.step))){
+    comm.stop("Algorithm is not found.")
+  }
+  PARAM.new <- try(method.step(PARAM.org))
+  em.update.class.dmat()
+  N.CLASS <- get.N.CLASS.dmat(K)
+
+
+  # Reduce K while the step errors or reports convergence code 99, and K > 1.
+  repeat{
+    failed <- inherits(PARAM.new, "try-error")
+    if((failed || .pmclustEnv$CHECK$convergence == 99) && K > 1){
+      if(failed) PARAM.new <- PARAM.org  # Step failed: reuse its valid input.
+      # Drop specific i.k if available or
+      # drop the smallest class or
+      # drop the class with the smallest eta among all small classes or
+      # drop all classes with 0 elements.
+      if(.pmclustEnv$CONTROL$stop.at.fail && .pmclustEnv$FAIL.i.k > 0){
+        i.k <- .pmclustEnv$FAIL.i.k
+      } else{
+        i.k <- which(N.CLASS == min(N.CLASS))
+      }
+      if(length(i.k) > 1 && min(N.CLASS) > 0){
+        i.k <- i.k[which.min(PARAM.new$ETA[i.k])]
+      }
+      K <- K - length(i.k)
+      comm.cat("- Reduce: ", K, "\n")
+
+      # Initial global storage.
+      PARAM.org <- set.global.dmat(K = K)
+
+      # Replacing PARAM.org by previous PARAM.new.
+      PARAM.org$ETA <- PARAM.new$ETA[-i.k] / sum(PARAM.new$ETA[-i.k])
+      PARAM.org$log.ETA <- log(PARAM.org$ETA)
+      PARAM.org$MU <- matrix(PARAM.new$MU[, -i.k], ncol = K)
+      PARAM.org$SIGMA <- PARAM.new$SIGMA[-i.k]
+
+      # Update steps.
+      e.step.dmat(PARAM.org)
+      PARAM.new <- try(method.step(PARAM.org))
+      em.update.class.dmat()
+      N.CLASS <- get.N.CLASS.dmat(K)
+    } else{
+      break
+    }
+  }
+
+  # Return the algorithm name, parameters, classification, class sizes, and checks.
+  ret <- list(algorithm = algorithm[1],
+              param = PARAM.new,
+              class = .pmclustEnv$CLASS.spmd,  # NOTE(review): confirm CLASS.spmd is the right slot for dmat.
+              n.class = N.CLASS,
+              check = .pmclustEnv$CHECK)
+
+  ret
+} # End of pmclust.reduce.dmat().
+