exporting function to construct polyhedral constraints of LASSO

jonathan-taylor · jonathan-taylor · commit 3d8b2481a998 · 2017-08-31T14:05:21.000-07:00
diff --git a/selectiveInference/NAMESPACE b/selectiveInference/NAMESPACE
@@ -14,7 +14,8 @@ export(lar,fs,
        TG.pvalue, 
        TG.limits, 
        TG.interval,
-       debiasingMatrix
+       debiasingMatrix,
+       fixedLassoPoly
     )
 
 S3method("coef", "lar")
diff --git a/selectiveInference/R/funs.fixed.R b/selectiveInference/R/funs.fixed.R
@@ -93,14 +93,14 @@ fixedLassoInf <- function(x, y, beta, lambda, family=c("gaussian","binomial","co
                     "'thresh' parameter, for a more accurate convergence."))
     
     # Get lasso polyhedral region, of form Gy >= u
-    if (type == 'full' & p > n) out = fixedLasso.poly(x,y,beta,lambda,vars,inactive=TRUE)
-    else out = fixedLasso.poly(x,y,beta,lambda,vars)
-    G = out$G
-    u = out$u
+    if (type == 'full' & p > n) out = fixedLassoPoly(x,y,lambda,beta,vars,inactive=TRUE)
+    else out = fixedLassoPoly(x,y,lambda,beta,vars)
+    A = out$A
+    b = out$b
     
     # Check polyhedral region
     tol.poly = 0.01
-    if (min(G %*% y - u) < -tol.poly * sqrt(sum(y^2)))
+    if (max(A %*% y - b) > tol.poly * sqrt(sum(y^2)))
       stop(paste("Polyhedral constraints not satisfied; you must recompute beta",
                  "more accurately. With glmnet, make sure to use exact=TRUE in coef(),",
                  "and check whether the specified value of lambda is too small",
@@ -191,7 +191,7 @@ fixedLassoInf <- function(x, y, beta, lambda, family=c("gaussian","binomial","co
     sign[j] = sign(sum(vj*y))
     vj = sign[j] * vj
 
-    limits.info = TG.limits(y, -G, -u, vj, Sigma=diag(rep(sigma^2, n)))
+    limits.info = TG.limits(y, A, b, vj, Sigma=diag(rep(sigma^2, n)))
     a = TG.pvalue.base(limits.info, null_value=null_value[j], bits=bits)
     pv[j] = a$pv
     vlo[j] = a$vlo * mj # Unstandardize (mult by norm of vj)
@@ -221,45 +221,39 @@ fixedLassoInf <- function(x, y, beta, lambda, family=c("gaussian","binomial","co
 #############################
 
 
-fixedLasso.poly=
-  function(x, y, beta, lambda, a, inactive = FALSE) {
-    xa = x[,a,drop=F]
-    xac = x[,!a,drop=F]
-    xai = pinv(crossprod(xa))
-    xap = xai %*% t(xa)
-    za = sign(beta[a])
+fixedLassoPoly =
+  function(X, y, lambda, beta, active, inactive = FALSE) {
+    Xa = X[,active,drop=F]
+    Xac = X[,!active,drop=F]
+    Xai = pinv(crossprod(Xa))
+    Xap = Xai %*% t(Xa)
+
+    za = sign(beta[active])
     if (length(za)>1) dz = diag(za)
     if (length(za)==1) dz = matrix(za,1,1)
     
-    if (inactive) {
-      P = diag(1,nrow(xa)) - xa %*% xap
+    if (inactive) { # should we include the inactive constraints?
+      R = diag(1,nrow(Xa)) - Xa %*% Xap # R is residual forming matrix of selected model
       
-      G = -rbind(
-        1/lambda * t(xac) %*% P,
-        -1/lambda * t(xac) %*% P,
-        -dz %*% xap
+      A = rbind(
+        1/lambda * t(Xac) %*% R,
+        -1/lambda * t(Xac) %*% R,
+        -dz %*% Xap
       )
       lambda2=lambda
-      if(length(lambda)>1) lambda2=lambda[a]
-      u = -c(
-        1 - t(xac) %*% t(xap) %*% za,
-        1 + t(xac) %*% t(xap) %*% za,
-        -lambda2 * dz %*% xai %*% za)
+      if(length(lambda)>1) lambda2=lambda[active]
+      b = c(
+        1 - t(Xac) %*% t(Xap) %*% za,
+        1 + t(Xac) %*% t(Xap) %*% za,
+        -lambda2 * dz %*% Xai %*% za)
     } else {
-      G = -rbind(
-        #   1/lambda * t(xac) %*% P,
-        # -1/lambda * t(xac) %*% P,
-        -dz %*% xap
-      )
+      A = -dz %*% Xap
       lambda2=lambda
-      if(length(lambda)>1) lambda2=lambda[a]
-      u = -c(
-        #   1 - t(xac) %*% t(xap) %*% za,
-        #   1 + t(xac) %*% t(xap) %*% za,
-        -lambda2 * dz %*% xai %*% za)
+      if(length(lambda)>1) lambda2=lambda[active]
+      b = -lambda2 * dz %*% Xai %*% za
     }
     
-    return(list(G=G,u=u))
+    return(list(A=A, b=b))
   }
 
 ##############################
diff --git a/selectiveInference/man/fixedLassoPoly.Rd b/selectiveInference/man/fixedLassoPoly.Rd
@@ -0,0 +1,80 @@
+\name{fixedLassoPoly}
+\alias{fixedLassoPoly}
+
+\title{
+Compute polyhedral constraints for a LASSO problem with
+a fixed value of lambda.
+}
+\description{
+Compute polyhedral representation of the selection region of Lee et al. (2016).
+By construction, y should satisfy A \%*\% y <= b, elementwise.
+}
+\usage{
+fixedLassoPoly(X, y, lambda, beta, active, inactive = FALSE)
+}
+\arguments{
+\item{X}{
+Design matrix of LASSO problem.
+}
+\item{y}{
+Response of LASSO problem.
+}
+\item{lambda}{
+Value of regularization parameter.
+}      
+\item{beta}{
+Solution of LASSO problem with regularization parameter set to lambda.
+}      
+\item{active}{
+Active set of the LASSO problem as a boolean vector. Should correspond
+to the non-zeros of beta.
+} 
+\item{inactive}{
+Form the inactive constraints as well?
+} 
+}
+\details{
+This function computes
+the  polyhedral representation of the selection region of Lee et al. (2016).
+}
+
+\value{  
+\item{A}{Linear part of the affine inequalities.}
+\item{b}{Right-hand side offset of the affine inequalities.}
+}
+
+\references{
+Jason Lee, Dennis Sun, Yuekai Sun, and Jonathan Taylor (2016). 
+Exact post-selection inference, with application to the lasso. Annals of Statistics, 44(3), 907-927.
+
+Jonathan Taylor and Robert Tibshirani (2017) Post-selection inference for L1-penalized likelihood models.
+Canadian Journal of Statistics, xx, 1-21. (Volume still not posted)
+}
+\author{Ryan Tibshirani, Rob Tibshirani, Jonathan Taylor, Joshua Loftus, Stephen Reid}
+
+\examples{
+
+set.seed(43)
+n = 50
+p = 10
+sigma = 1
+
+x = matrix(rnorm(n*p),n,p)
+x = scale(x,TRUE,TRUE)
+
+beta = c(3,2,rep(0,p-2))
+y = x\%*\%beta + sigma*rnorm(n)
+
+# first run glmnet
+gfit = glmnet(x,y,standardize=FALSE)
+
+# extract coef for a given lambda; note the 1/n factor!
+# (and we don't save the intercept term)
+lambda = .8
+beta = coef(gfit, s=lambda/n, exact=TRUE)[-1]
+active = (beta != 0)
+
+fixedLassoPoly(x, y, lambda, beta, active)
+
+}
+ 

Original file line number	Diff line number	Diff line change
`@@ -14,7 +14,8 @@ export(lar,fs,`
`14`	`14`	`TG.pvalue,`
`15`	`15`	`TG.limits,`
`16`	`16`	`TG.interval,`
`17`		`- debiasingMatrix`
	`17`	`+ debiasingMatrix,`
	`18`	`+ fixedLassoPoly`
`18`	`19`	`)`
`19`	`20`
`20`	`21`	`S3method("coef", "lar")`