Merge pull request #18 from jonathan-taylor/master

tibshirani · web-flow · commit 2bd33e81aa2a · 2017-08-16T09:04:07.000-07:00
comparing test
diff --git a/selectiveInference/R/funs.fixed.R b/selectiveInference/R/funs.fixed.R
@@ -159,7 +159,8 @@ sigma=NULL, alpha=0.1,
       hsigmaSinv <- solve(hsigmaS) # pinv(hsigmaS)
 
       # Approximate inverse covariance matrix for when (n < p) from lasso_Inference.R
-      htheta <- InverseLinfty(hsigma, n, length(S), verbose=FALSE)
+      useC = TRUE
+      htheta <- InverseLinfty(hsigma, n, length(S), verbose=FALSE, useC=useC)
       # htheta <- InverseLinfty(hsigma, n, verbose=FALSE)
       
       FS = rbind(diag(length(S)),matrix(0,pp-length(S),length(S)))
@@ -269,7 +270,7 @@ fixedLasso.poly=
 ### Functions borrowed and slightly modified from lasso_inference.R
 
 ## Approximates inverse covariance matrix theta
-InverseLinfty <- function(sigma, n, e, resol=1.5, mu=NULL, maxiter=50, threshold=1e-2, verbose = TRUE) {
+InverseLinfty <- function(sigma, n, e, resol=1.5, mu=NULL, maxiter=50, threshold=1e-2, verbose = TRUE, useC = FALSE) {
   # InverseLinfty <- function(sigma, n, resol=1.5, mu=NULL, maxiter=50, threshold=1e-2, verbose = TRUE) {
     isgiven <- 1;
   if (is.null(mu)){
@@ -294,7 +295,11 @@ InverseLinfty <- function(sigma, n, e, resol=1.5, mu=NULL, maxiter=50, threshold
     incr <- 0;
     while ((mu.stop != 1)&&(try.no<10)){
       last.beta <- beta
-      output <- InverseLinftyOneRow(sigma, i, mu, maxiter=maxiter, threshold=threshold)
+      if (useC == FALSE) {
+            output <- InverseLinftyOneRow(sigma, i, mu, maxiter=maxiter, threshold=threshold)
+      } else {
+            output <- InverseLinftyOneRowC(sigma, i, mu, maxiter=maxiter)
+      }
       beta <- output$optsol
       iter <- output$iter
       if (isgiven==1){
@@ -334,17 +339,46 @@ InverseLinfty <- function(sigma, n, e, resol=1.5, mu=NULL, maxiter=50, threshold
   return(M)
 }
 
+InverseLinftyOneRowC <- function (Sigma, i, mu, maxiter=50) {
+         # Computes row i through the compiled routine "find_one_row", using mu as the bound and a zero start for theta.
+         p = nrow(Sigma)		
+         basis_vector = rep(0, p)
+	 basis_vector[i] = 1.
+         theta = rep(0, p)     
+         # Sigma_theta and theta are both passed as zero vectors; row and coord are passed 0-based (i-1).
+	 val = .C("find_one_row",
+          	 Sigma=as.double(Sigma),
+		 Sigma_diag=as.double(diag(Sigma)),
+		 Sigma_theta=as.double(rep(0, p)),
+		 nrow=as.integer(p),
+   		 bound=as.double(mu),
+		 theta=as.double(theta),
+		 maxiter=as.integer(50), # NOTE(review): literal 50 -- the maxiter argument of this function is never used
+		 row=as.integer(i-1),
+		 coord=as.integer(i-1), # NOTE(review): the find_one_row definition in debiasing_matrix.c lists no coord parameter -- confirm
+		 dup=FALSE, # NOTE(review): .C documents upper-case DUP= and PACKAGE=; these lower-case names are presumably forwarded as ordinary arguments -- confirm
+		 package="selectiveInference")
+
+	# Check feasibility: warn when max |Sigma theta - e_i| exceeds 1.01 * mu
+
+	if (max(abs(Sigma %*% val$theta - basis_vector)) > 1.01 * mu) {
+	   warning("Solution for row of M does not seem to be feasible")
+	}
+
+	return(val$theta) # NOTE(review): bare vector; the call site in InverseLinfty reads output$optsol and output$iter -- confirm
+}
+
 InverseLinftyOneRow <- function ( sigma, i, mu, maxiter=50, threshold=1e-2 ) {
   p <- nrow(sigma);
   rho <- max(abs(sigma[i,-i])) / sigma[i,i];
   mu0 <- rho/(1+rho);
   beta <- rep(0,p);
   
-  if (mu >= mu0){
-    beta[i] <- (1-mu0)/sigma[i,i];
-    returnlist <- list("optsol" = beta, "iter" = 0);
-    return(returnlist);
-  }
+  #if (mu >= mu0){
+  #  beta[i] <- (1-mu0)/sigma[i,i];
+  #  returnlist <- list("optsol" = beta, "iter" = 0);
+  #  return(returnlist);
+  #}
   
   diff.norm2 <- 1;
   last.norm2 <- 1;
diff --git a/selectiveInference/src/debiasing_matrix.c b/selectiveInference/src/debiasing_matrix.c
@@ -0,0 +1,186 @@
+#include <stdio.h>
+#include <math.h> // for fabs
+
+// Find an approximate row of \hat{Sigma}^{-1}
+
+// Solves a dual version of problem (4) of https://arxiv.org/pdf/1306.3171.pdf
+
+// Dual problem: \text{min}_{\theta} 1/2 \theta^T \Sigma \theta - e_i^T\theta + \mu \|\theta\|_1
+
+// This is the "negative" of the problem as in https://gist.github.com/jonathan-taylor/07774d209173f8bc4e42aa37712339bf
+// Therefore we don't have to negate the answer to get theta.
+// Helpers: evaluate the objective, then update one coordinate
+
+double objective(double *Sigma,       /* A covariance matrix: X^TX/n */
+		 int nrow,            /* how many rows in Sigma */
+		 int row,             /* which row: 0-based */
+		 double bound,        /* Lagrange multiplier for \ell_1 */
+		 double *theta)       /* current value */
+{ // Accumulates 1/2 theta^T Sigma theta - theta[row] + bound * ||theta||_1 (but see the NOTE(review) in the loop)
+  int irow, icol;
+  double value = 0;
+  double *Sigma_ptr = Sigma;
+  double *theta_row_ptr, *theta_col_ptr;
+
+  theta_row_ptr = theta;
+  theta_col_ptr = theta; // this outer pointer is shadowed by the loop-local declaration below
+
+  for (irow=0; irow<nrow; irow++) {
+    double *theta_col_ptr = theta; // restart at theta[0] for every row
+    if (*theta_row_ptr != 0) { // NOTE(review): Sigma_ptr advances only inside this branch, so after a row with theta[irow] == 0 it is no longer at the start of row irow -- confirm
+      for (icol=0; icol<nrow; icol++) {
+        value += 0.5 * (*Sigma_ptr) * (*theta_row_ptr) * (*theta_col_ptr);
+        Sigma_ptr++;
+        theta_col_ptr++;
+      }
+    }
+    if (irow == row) {
+      value -= (*theta_row_ptr); // the elementary basis vector term
+    }
+    value = value + bound * fabs((*theta_row_ptr)); // the \ell_1 term
+    theta_row_ptr++;
+  }
+
+  return(value);
+}
+
+
+double update_one_coord(double *Sigma,           /* A covariance matrix: X^TX/n */
+                        double *Sigma_diag,      /* Diagonal entries of Sigma */
+                        double *Sigma_theta,     /* Sigma times theta */
+			int nrow,                /* How many rows in Sigma */
+			double bound,            /* feasibility parameter */
+			double *theta,           /* current value */
+			int row,                 /* which row: 0-based */
+			int coord)               /* which coordinate to update: 0-based */
+{
+  // Soft-thresholds theta[coord] with the other entries held fixed; returns the computed value.
+  double delta;
+  double linear_term = 0;
+  double value = 0;
+  double old_value;
+  double *Sigma_ptr;
+  double *Sigma_theta_ptr;
+  double *theta_ptr;
+  int icol = 0;
+
+  double *quadratic_ptr = ((double *) Sigma_diag + coord);
+  double quadratic_term = *quadratic_ptr;
+
+  Sigma_theta_ptr = ((double *) Sigma_theta + coord);
+  linear_term = *Sigma_theta_ptr;
+
+  theta_ptr = ((double *) theta + coord);
+  old_value = *theta_ptr;
+
+  // The coord entry of Sigma_theta term has a diagonal term in it:
+  // Sigma[coord, coord] * theta[coord]
+  // This removes it. 
+  linear_term -= quadratic_term * old_value;
+
+  if (row == coord) {
+    linear_term -= 1; // the -e_row^T theta term contributes -1 to the linear coefficient
+  }
+
+  // Now soft-threshold the coord entry of theta 
+
+  // Objective is t \mapsto q/2 * t^2 + l * t + bound |t|
+  // with q=quadratic_term and l=linear_term
+
+  // With a negative linear term, solution should be
+  // positive
+
+  if (linear_term < -bound) {
+    value = (-linear_term - bound) / quadratic_term;
+  }
+  else if (linear_term > bound) {
+    value = -(linear_term - bound) / quadratic_term;
+  }
+  // otherwise |linear_term| <= bound and value keeps its initial 0
+  if (fabs(old_value - value) > 1.e-6 * (fabs(value) + fabs(old_value))) { // Write back only when the relative change exceeds 1e-6
+
+    delta = value - old_value;
+    Sigma_ptr = ((double *) Sigma + coord * nrow); // start of the coord-th run of nrow entries of Sigma
+    Sigma_theta_ptr = ((double *) Sigma_theta);
+
+    for (icol=0; icol<nrow; icol++) { // keep Sigma_theta equal to Sigma times the updated theta
+      *Sigma_theta_ptr = *Sigma_theta_ptr + delta * (*Sigma_ptr);
+      Sigma_theta_ptr += 1;
+      Sigma_ptr += 1;
+    }
+
+    theta_ptr = ((double *) theta + coord);
+    *theta_ptr = value;
+
+  }
+
+  return(value); // returned even when the write-back above was skipped
+
+}
+
+void find_one_row(double *Sigma,          /* A covariance matrix: X^TX/n */
+                  double *Sigma_diag,     /* Diagonal entry of covariance matrix */
+                  double *Sigma_theta,    /* Sigma times theta */
+                  int *nrow_ptr,          /* How many rows in Sigma */
+		  double *bound_ptr,      /* feasibility parameter */
+                  double *theta,          /* current value */
+                  int *maxiter_ptr,       /* how many iterations */
+                  int *row_ptr)         /* which row: 0-based */
+{
+  // Runs up to maxiter sweeps of coordinate updates on theta, stopping early once the objective stops decreasing.
+  int maxiter = *maxiter_ptr;
+  int iter = 0;
+  int icoord = 0;
+  int row = *row_ptr;
+  double bound = *bound_ptr;
+  int nrow = *nrow_ptr;
+
+  double old_value = objective(Sigma,
+			       nrow,
+			       row,
+			       bound,
+			       theta);
+  double new_value; 
+  double tol=1.e-10; // relative decrease in the objective below which the loop stops
+
+  for (iter=0; iter<maxiter; iter++) {
+
+    // Update the diagonal (coord == row) first, then sweep every coordinate
+
+    update_one_coord(Sigma,
+		     Sigma_diag,
+		     Sigma_theta,
+		     nrow,
+		     bound,
+		     theta,
+		     row,
+		     row);
+
+    for (icoord=0; icoord<nrow; icoord++) {
+
+      update_one_coord(Sigma,
+		       Sigma_diag,
+		       Sigma_theta,
+		       nrow,
+		       bound,
+		       theta,
+		       row,
+		       icoord);
+    }
+
+    new_value = objective(Sigma,
+			  nrow,
+			  row,
+			  bound,
+			  theta);
+
+    if (((old_value - new_value) < tol * fabs(new_value)) && (iter > 0)) { // never stops on the first sweep
+      break;
+    }
+
+    old_value = new_value;
+  }
+
+  *nrow_ptr = iter-1; // NOTE(review): overwrites the caller's nrow slot with iter-1, presumably to report an iteration count -- confirm
+}
+