
Commit c467ba2 (1 parent: c6015aa)
Author: Joshua Loftus

Beginning cvlar implementation

File tree: 2 files changed, +103 −0 lines changed

forLater/josh/selectiveInference/R/cv.R

Lines changed: 45 additions & 0 deletions
@@ -130,3 +130,48 @@ cvfs <- function(x, y, index = 1:ncol(x), maxsteps, sigma = NULL, intercept = TR
invisible(fit)
}


cvlar <- function(x, y, maxsteps) { # other args
  folds <- cvMakeFolds(x)
  models <- lapply(folds, function(fold) {
    # zero-pad the held-out fold so the training fit ignores those rows
    x.train <- x
    y.train <- y
    x.train[fold, ] <- 0
    y.train[fold] <- 0
    x.test <- x[fold, ]
    y.test <- y[fold]
    larpath.train <- lar(x.train, y.train, maxsteps = maxsteps, intercept = FALSE, normalize = FALSE)
    return(larpath.train)
  })

  active.sets <- lapply(models, function(model) model$action)
  lambdas <- lapply(models, function(model) model$lambda)
  lmin <- min(unlist(lambdas))

  # Interpolate lambda grid or parametrize by steps?
  # Interpolation probably requires re-writing cvRSSquads for
  # penalized fits in order to make sense.

  # Do steps for now just to have something that works.

  # Quadratic form giving the CV RSS at each step
  RSSquads <- list()
  for (s in 1:maxsteps) {
    initial.active <- lapply(active.sets, function(a) a[1:s])
    RSSquads[[s]] <- cvRSSquad(x, folds, initial.active)
  }

  RSSs <- sapply(RSSquads, function(Q) t(y) %*% Q %*% y)
  sstar <- which.min(RSSs)
  quadstar <- RSSquads[[sstar]]

  # Differences of quadratics encode the event that step sstar won the CV comparison
  RSSquads <- lapply(RSSquads, function(quad) quad - quadstar)
  RSSquads[[sstar]] <- NULL # remove the all-zeroes case

  # Refit on the full data for the CV-selected number of steps
  fit <- lar(x, y, maxsteps = sstar, intercept = FALSE, normalize = FALSE)

  # Very tall Gamma encoding all cv-model paths
  Gamma <- do.call(rbind, lapply(models, function(model) model$Gamma))

  # more to do here
}
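The helper cvRSSquad is not shown in this commit. For orientation, here is a minimal sketch of the quantity it appears to compute, assuming least-squares refits on each training fold: with a fixed active set, the training coefficients are linear in y, so each fold's test residual is a linear map R_k of y, and the total CV RSS is the quadratic form t(y) %*% (sum_k t(R_k) %*% R_k) %*% y. The name cvRSSquadSketch and its signature are hypothetical.

# Hypothetical sketch (not the commit's cvRSSquad): build Q so that
# t(y) %*% Q %*% y equals the CV RSS for the given per-fold active sets.
cvRSSquadSketch <- function(x, folds, active.sets) {
  n <- nrow(x)
  Q <- matrix(0, n, n)
  for (k in seq_along(folds)) {
    fold <- folds[[k]]
    A <- active.sets[[k]]
    xA.train <- x[-fold, A, drop = FALSE]
    # least-squares coefficients on the training rows are linear in y
    coef.map <- matrix(0, length(A), n)
    coef.map[, -fold] <- solve(crossprod(xA.train), t(xA.train))
    # test residuals y[fold] - x[fold, A] %*% betahat.train, also linear in y
    R <- matrix(0, length(fold), n)
    R[cbind(seq_along(fold), fold)] <- 1
    R <- R - x[fold, A, drop = FALSE] %*% coef.map
    Q <- Q + crossprod(R)  # accumulate t(R) %*% R
  }
  Q
}

Under this reading, the differences quad - quadstar formed above encode the selection event that step sstar minimized the CV RSS: t(y) %*% (Q_s - Q_sstar) %*% y >= 0 for every other s.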

forLater/josh/sim.cvlar.R

Lines changed: 58 additions & 0 deletions
@@ -0,0 +1,58 @@
# Choices

# RSS: least-squares or penalized beta?
# depends on final model. Go with least-squares for now

# fixed vs lar? (lar, apparently)
# fixed probably slower, but advantage of same lambda grid?
# is same lambda grid necessary? -- doesn't the lar algorithm give all possible models anyway?
# i.e. for a non-knot lambda, just find where it sits in the lar path and take the corresponding model
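# [illustration only, not part of this commit] Re: the question above -- the
# active set is piecewise constant in lambda, so the model at a non-knot
# lambda can be read off the path's knots; a hypothetical helper:
#   activeAt <- function(path, lam) path$action[seq_len(sum(path$lambda > lam))]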

# groups? later

# TODO

# copy larInf or groupfsInf?
# larInf: add CV quadratic constraints* & break/fix p-value computation
# -------- *but can we even use the ydecomp we use for quadratic?
# groupfsInf: some ugly rewriting, no cumprojs etc, but straightforward
# -------- downside: need to implement larInf basically

# larInf
# [ ] is.null(sigma) don't estimate it

# plan:
# expand Gamma for [-fold] indices?
# stack all the Gammas? or iterate through them?
# work backward from poly.pval <- larInf
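# [illustration only, not part of this commit] One way to expand a Gamma
# computed from x[-fold, ] into a constraint on the full-length y is to
# insert zero columns at the held-out indices:
#   G.full <- matrix(0, nrow(G), n); G.full[, -fold] <- G
# Zero-padding the training data, as cv.R does, yields n columns directly.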

# big picture / long term
# what kind of OOP design would lend itself to easily implementing more cv things?

# Gamma: something x n
# Gamma %*% y >= 0

# pass 0-padded x[-fold] and y[-fold] to lar?

library(selectiveInference)
setwd("/Users/joftius/Dropbox/work/R-software/forLater/josh")
source("selectiveInference/R/cv.R")

set.seed(1)
n <- 100
p <- 50
maxsteps <- 10
sparsity <- 3
snr <- 2
rho <- 0.1
nfolds <- 5

x <- matrix(rnorm(n*p), nrow=n)
y <- rnorm(n)
beta <- rep(0, p)
beta[1:sparsity] <- 2 * sqrt(2*log(p)/n) * sample(c(-1,1), sparsity, replace=TRUE)
y <- y + x %*% beta
my <- mean(y)
y <- y - my
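A hedged sketch of how the script might continue, exercising the selection event noted above. The Gamma component is returned by this repo's lar (cv.R relies on model$Gamma), while the cvlar call is only indicative, since its return value is still unfinished in this commit:

# Hypothetical continuation (not part of this commit):
fit <- lar(x, y, maxsteps = maxsteps, intercept = FALSE, normalize = FALSE)
# The polyhedral selection event from the notes: Gamma is (something x n)
# and the observed response satisfies Gamma %*% y >= 0 up to numerical error.
stopifnot(all(fit$Gamma %*% y >= -1e-8))

# cvlar(x, y, maxsteps)  # draft; body still ends with "more to do here"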
