selective-inference
diff --git a/‎selectiveInference/R/funs.fixed.R
Lines changed: 8 additions & 5 deletions b/‎selectiveInference/R/funs.fixed.R
Lines changed: 8 additions & 5 deletions
diff --git a/‎selectiveInference/man/debiasingMatrix.Rd
Lines changed: 2 additions & 2 deletions b/‎selectiveInference/man/debiasingMatrix.Rd
Lines changed: 2 additions & 2 deletions
diff --git a/‎tests/debiased_lasso/comparison_scaled.R
Lines changed: 78 additions & 0 deletions b/‎tests/debiased_lasso/comparison_scaled.R
Lines changed: 78 additions & 0 deletions
diff --git a/‎tests/debiased_lasso/comparison_unscaled.R
Lines changed: 78 additions & 0 deletions b/‎tests/debiased_lasso/comparison_unscaled.R
Lines changed: 78 additions & 0 deletions
@@ -8,7 +8,7 @@ fixedLassoInf <- function(x, y, beta,
                           sigma=NULL, alpha=0.1,
                           type=c("partial", "full"), tol.beta=1e-5, tol.kkt=0.1,
                           gridrange=c(-100,100), bits=NULL, verbose=FALSE, 
-                          linesearch.try=10) {
+                          linesearch.try=10, offset_correction=TRUE) {
 
   family = match.arg(family)
   this.call = match.call()
@@ -197,6 +197,9 @@ fixedLassoInf <- function(x, y, beta,
         M = M[-1,] # remove intercept row
         null_value = null_value[-1] # remove intercept element
       }
+      if (!offset_correction) {
+        null_value = 0 * null_value
+      }
     } else if (type=="partial" || p > n) {
       xa = x[,vars,drop=F]
       M = pinv(crossprod(xa)) %*% t(xa)
@@ -325,13 +328,13 @@ debiasingMatrix = function(Xinfo,               # could be X or t(X) %*% X / n d
 			   max_active=NULL,     # how big can active set get?
 			   max_try=10,          # how many steps in linesearch?
 			   warn_kkt=FALSE,      # warn if KKT does not seem to be satisfied?
-			   max_iter=100,        # how many iterations for each optimization problem
+			   max_iter=50,         # how many iterations for each optimization problem
                            kkt_stop=TRUE,       # stop based on KKT conditions?
                            parameter_stop=TRUE, # stop based on relative convergence of parameter?
 			   objective_stop=TRUE, # stop based on relative decrease in objective?
                            kkt_tol=1.e-4,       # tolerance for the KKT conditions
                            parameter_tol=1.e-4, # tolerance for relative convergence of parameter
-			   objective_tol=1.e-8  # tolerance for relative decrease in objective
+			   objective_tol=1.e-4  # tolerance for relative decrease in objective
                            ) {
 
 
@@ -399,13 +402,13 @@ debiasingRow = function (Xinfo,               # could be X or t(X) %*% X / n dep
 		         max_active=NULL,     # how big can active set get?
 			 max_try=10,          # how many steps in linesearch?
 			 warn_kkt=FALSE,      # warn if KKT does not seem to be satisfied?
-			 max_iter=100,        # how many iterations for each optimization problem
+			 max_iter=50,         # how many iterations for each optimization problem
                          kkt_stop=TRUE,       # stop based on KKT conditions?
                          parameter_stop=TRUE, # stop based on relative convergence of parameter?
                          objective_stop=TRUE, # stop based on relative decrease in objective?
                          kkt_tol=1.e-4,       # tolerance for the KKT conditions
 			 parameter_tol=1.e-4, # tolerance for relative convergence of parameter
-			 objective_tol=1.e-8  # tolerance for relative decrease in objective
+			 objective_tol=1.e-4  # tolerance for relative decrease in objective
                          ) {
 
   p = ncol(Xinfo)
 
@@ -22,13 +22,13 @@ debiasingMatrix(Xinfo,
 		max_active=NULL,    
 		max_try=10,         
 		warn_kkt=FALSE,     
-		max_iter=100,       
+		max_iter=50,       
 		kkt_stop=TRUE,
 		parameter_stop=TRUE,
 		objective_stop=TRUE,
                 kkt_tol=1.e-4,      
 		parameter_tol=1.e-4,
-		objective_tol=1.e-8)
+		objective_tol=1.e-4)
 }
 \arguments{
 \item{Xinfo}{
 
@@ -0,0 +1,78 @@
+source('javanmard_montanari.R')
+
+##############################################
+
+# Runs nsim simulations under the global null, computing p-values
+# using both the old code (the slow one, using Adel's code) and the new
+# code (the faster one, using Jon's code), and plots the ECDF of each.
+# Running 50 sims takes about 10-15 mins because the old code is slow, so
+# feel free to lower nsim if you want.
+
+
+library(selectiveInference)
+library(glmnet)
+
+# set.seed(424)
+
+n=100
+p=200
+
+sigma=.5
+
+theor_lambda = sigma * sqrt(2 * log(p))
+lambda=c(0.25, 0.5, 1, 0.8 * theor_lambda, theor_lambda)
+
+for (j in c(3,4,5,1,2)) {
+
+thresh = 1e-10
+
+beta=rep(0,p)
+type="full"
+
+nsim = 20
+
+scaling = sqrt(n)
+pvs_old = c()
+pvs_new <- c()
+pvs_old_0 = c()   # don't add the offset correction
+pvs_new_0 = c()   # don't add the offset correction
+for (i in 1:nsim) {
+  cat(i,fill=T)
+  x = matrix(rnorm(n*p),n,p)
+  x = scale(x,T,T) / scaling
+  mu = x%*%beta 
+  y=mu+sigma*rnorm(n)
+
+  # first run  glmnet
+  gfit=glmnet(x,y,intercept=F,standardize=F,thresh=thresh)
+
+  bhat = coef(gfit, s=lambda[j]/(sqrt(n) * scaling), exact=TRUE,x=x,y=y)[-1]
+
+  if(sum(bhat != 0) > 0) {
+
+  # compute fixed lambda p-values and selection intervals
+
+  aa = fixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type)
+  bb = oldFixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type)
+  cc = fixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type, offset_correction=FALSE)
+  dd = oldFixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type, offset_correction=FALSE)
+  pvs_new <- c(pvs_new, aa$pv, recursive=TRUE)
+  pvs_old <- c(pvs_old, bb$pv,recursive=TRUE)
+  pvs_new_0 <- c(pvs_new_0, cc$pv, recursive=TRUE)
+  pvs_old_0 <- c(pvs_old_0, dd$pv, recursive=TRUE)
+
+  cat()
+  }
+}
+
+#check uniformity 
+
+png(paste('comparison_scaled', j, '.png', sep=''))
+plot(ecdf(pvs_old), pch=23, col='green', xlim=c(0,1), ylim=c(0,1), main='ECDF of p-values')
+plot(ecdf(pvs_new), pch=24, col='purple', add=TRUE)
+plot(ecdf(pvs_old_0), pch=23, col='red', add=TRUE)
+plot(ecdf(pvs_new_0), pch=24, col='black', add=TRUE)
+abline(0,1)
+legend("bottomright", legend=c("Old","New", "Old 0", "New 0"), pch=c(23,24,23,24), pt.bg=c("green","purple","red","black"))
+dev.off()
+}
@@ -0,0 +1,78 @@
+source('javanmard_montanari.R')
+
+##############################################
+
+# Runs nsim simulations under the global null, computing p-values
+# using both the old code (the slow one, using Adel's code) and the new
+# code (the faster one, using Jon's code), and plots the ECDF of each.
+# Running 50 sims takes about 10-15 mins because the old code is slow, so
+# feel free to lower nsim if you want.
+
+
+library(selectiveInference)
+library(glmnet)
+
+# set.seed(424)
+
+n=100
+p=200
+
+sigma=.5
+
+theor_lambda = sigma * sqrt(2 * log(p))
+lambda=c(0.25, 0.5, 1, 0.8 * theor_lambda, theor_lambda)
+
+for (j in c(3,4,5,1,2)) {
+
+thresh = 1e-10
+
+beta=rep(0,p)
+type="full"
+
+nsim = 20
+
+scaling = sqrt(n)
+pvs_old = c()
+pvs_new <- c()
+pvs_old_0 = c()   # don't add the offset correction
+pvs_new_0 = c()   # don't add the offset correction
+for (i in 1:nsim) {
+  cat(i,fill=T)
+  x = matrix(rnorm(n*p),n,p)
+  x = scale(x,T,T) / scaling
+  mu = x%*%beta 
+  y=mu+sigma*rnorm(n)
+
+  # first run  glmnet
+  gfit=glmnet(x,y,intercept=F,standardize=F,thresh=thresh)
+
+  bhat = coef(gfit, s=lambda[j]/(sqrt(n) * scaling), exact=TRUE,x=x,y=y)[-1]
+
+  if(sum(bhat != 0) > 0) {
+
+  # compute fixed lambda p-values and selection intervals
+
+  aa = fixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type)
+  bb = oldFixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type)
+  cc = fixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type, offset_correction=FALSE)
+  dd = oldFixedLassoInf(x,y,bhat,lambda[j]*sqrt(n) / scaling,intercept=F,sigma=sigma,type=type, offset_correction=FALSE)
+  pvs_new <- c(pvs_new, aa$pv, recursive=TRUE)
+  pvs_old <- c(pvs_old, bb$pv,recursive=TRUE)
+  pvs_new_0 <- c(pvs_new_0, cc$pv, recursive=TRUE)
+  pvs_old_0 <- c(pvs_old_0, dd$pv, recursive=TRUE)
+
+  cat()
+  }
+}
+
+#check uniformity 
+
+png(paste('comparison_unscaled', j, '.png', sep=''))
+plot(ecdf(pvs_old), pch=23, col='green', xlim=c(0,1), ylim=c(0,1), main='ECDF of p-values')
+plot(ecdf(pvs_new), pch=24, col='purple', add=TRUE)
+plot(ecdf(pvs_old_0), pch=23, col='red', add=TRUE)
+plot(ecdf(pvs_new_0), pch=24, col='black', add=TRUE)
+abline(0,1)
+legend("bottomright", legend=c("Old","New", "Old 0", "New 0"), pch=c(23,24,23,24), pt.bg=c("green","purple","red","black"))
+dev.off()
+}