Skip to content

Commit eedf0fd

Browse files
created the matrices for the affine transform, wrapper for calling Gaussian density
1 parent e01d8f1 commit eedf0fd

File tree

7 files changed

+308
-3
lines changed

7 files changed

+308
-3
lines changed

selectiveInference/R/funs.fixed.R

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -435,8 +435,7 @@ debiasingRow = function (Xinfo, # could be X or t(X) %*% X / n dep
435435
last_output = NULL
436436

437437
if (is_wide) {
438-
n = nrow(Xinfo)
439-
Xsoln = as.numeric(rep(0, n))
438+
Xsoln = as.numeric(rep(0, nrow(Xinfo)))
440439
}
441440

442441
while (counter_idx < max_try) {

selectiveInference/R/funs.randomized.R

Lines changed: 34 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -37,6 +37,7 @@ randomizedLASSO = function(X,
3737
if (length(lam) == 1) {
3838
lam = rep(lam, p)
3939
}
40+
4041
if (length(lam) != p) {
4142
stop("Lagrange parameter should be single float or of length ncol(X)")
4243
}
@@ -65,5 +66,38 @@ randomizedLASSO = function(X,
6566
objective_stop, # objective_stop
6667
kkt_stop, # kkt_stop
6768
param_stop) # param_stop
69+
70+
71+
sign_soln = sign(result$soln)
72+
73+
unpenalized = lam == 0
74+
active = !unpenalized * (sign_soln != 0)
75+
inactive = !unpenzlied * (sign_soln == 0)
76+
77+
unpenalized_set = which(unpenalized)
78+
active_set = which(active)
79+
inactive_set = which(inactive)
80+
81+
coef_term = t(X) %*% X[,c(unpenalized_set, # the coefficients
82+
active_set)]
83+
coef_term = coef_term %*% diag(c(rep(1, sum(unpenalized)), sign_soln[active])) # coefficients are non-negative
84+
coef_term[active,] = coef_term[active,] + ridge_term * diag(rep(1, sum(active))) # ridge term
85+
86+
subgrad_term = cbind(matrix(0, sum(inactive), sum(active) + sum(unpenalized)),
87+
diag(rep(1, sum(inactive))))
88+
linear_term = rbind(coef_term,
89+
subgrad_term)
90+
91+
offset_term = rep(0, p)
92+
offset_term[active] = lam[active] * sign_soln[active]
93+
94+
95+
96+
list(active_set = active_set,
97+
inactive_set = inactive_set,
98+
unpenalized_set = unpenalized_set,
99+
sign_soln = sign_soln)
100+
101+
68102
return(result)
69103
}
Lines changed: 40 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,40 @@
1+
#include <Rcpp.h>             // Rcpp types (NumericVector, NumericMatrix) and Rcpp::stop
#include <randomized_lasso.h> // C implementation of the log densities

// Vectorized wrapper around the C log_density_gaussian.
//
// Evaluates the (unnormalized) Gaussian randomization log-density at the
// reconstruction A_D D + A_O O + h for each sample.  Matrices are column
// major, so column ipt of a state matrix is the ipt-th sample.
//
// [[Rcpp::export]]
Rcpp::NumericVector log_density_gaussian_(double noise_scale,                      // Scale of randomization
                                          Rcpp::NumericMatrix internal_linear,     // A_D -- linear part for data -- (ndim x ninternal)
                                          Rcpp::NumericMatrix internal_state,      // D -- data states -- matrix of shape (ninternal, npt)
                                          Rcpp::NumericMatrix optimization_linear, // A_O -- linear part for optimization variables -- (ndim x noptimization)
                                          Rcpp::NumericMatrix optimization_state,  // O -- optimization states -- matrix of shape (noptimization, npt)
                                          Rcpp::NumericMatrix offset) {            // h -- offset in affine transform -- "p" dimensional

  int npt = internal_state.ncol(); // Function is vectorized over columns
  if (optimization_state.ncol() != npt) { // Each column is one internal / optimization state (arrays are column major)
    Rcpp::stop("Number of optimization samples should equal the number of (internally represented) data.");
  }

  int ndim = optimization_linear.nrow();
  if (internal_linear.nrow() != ndim) {
    Rcpp::stop("Dimension of optimization range should be the same as the dimension of the data range.");
  }
  int ninternal = internal_linear.ncol();
  int noptimization = optimization_linear.ncol();

  Rcpp::NumericVector result(npt);

  for (int ipt = 0; ipt < npt; ipt++) {
    // Column ipt of each state matrix starts ipt * nrow doubles into the buffer.
    result[ipt] = log_density_gaussian(noise_scale,
                                       ndim,
                                       ninternal,
                                       noptimization,
                                       (double *) internal_linear.begin(),
                                       ((double *) internal_state.begin() + ipt * ninternal),
                                       (double *) optimization_linear.begin(),
                                       ((double *) optimization_state.begin() + ipt * noptimization),
                                       (double *) offset.begin());
  }

  return(result);
}

selectiveInference/src/randomized_lasso.c

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -11,6 +11,8 @@
1111
// Laplace is product of IID Laplace with scale noise_scale
1212
// Also evaluated at A_D D + A_O O + h
1313

14+
// Matrices are assumed in column major order!
15+
1416
double log_density_gaussian(double noise_scale, // Scale of randomization
1517
int ndim, // Number of features -- "p"
1618
int ninternal, // Dimension of internal data representation often 1
Lines changed: 188 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,188 @@
1+
#include <math.h> // for fabs
2+
3+
// Augmented density for randomized LASSO after
4+
// Gaussian randomization
5+
6+
// Described in https://arxiv.org/abs/1609.05609
7+
8+
// Gaussian is product of IID N(0, noise_scale^2) density
9+
// Evaluated at A_D D + A_O O + h
10+
11+
// Laplace is product of IID Laplace with scale noise_scale
12+
// Also evaluated at A_D D + A_O O + h
13+
14+
// Log of the IID N(0, noise_scale^2) density (up to the normalizing
// constant), evaluated at the reconstruction A_D D + A_O O + h.
// All matrices are stored in column major order.
double log_density_gaussian(double noise_scale,          // Scale of randomization
			    int ndim,                    // Number of features -- "p"
			    int ninternal,               // Dimension of internal data representation often 1
			    int noptimization,           // Dimension of optimization variables -- "p"
			    double *internal_linear,     // A_D -- linear part for data
			    double *internal_state,      // D -- data state
			    double *optimization_linear, // A_O -- linear part for optimization variables
			    double *optimization_state,  // O -- optimization state
			    double *offset)              // h -- offset in affine transform -- "p" dimensional
{
  double denom = 2 * noise_scale * noise_scale;
  double value = 0;
  int irow, icol;

  for (irow = 0; irow < ndim; irow++) {

    // irow-th coordinate of A_D D + A_O O + h
    double reconstruction = offset[irow];

    // Data (internal) contribution: row irow of A_D times D
    for (icol = 0; icol < ninternal; icol++) {
      reconstruction += internal_linear[icol * ndim + irow] * internal_state[icol];
    }

    // Optimization contribution: row irow of A_O times O
    for (icol = 0; icol < noptimization; icol++) {
      reconstruction += optimization_linear[icol * ndim + irow] * optimization_state[icol];
    }

    value -= (reconstruction * reconstruction) / denom;
  }

  return value;
}
64+
65+
// Log of the IID Laplace(noise_scale) density (up to the normalizing
// constant), evaluated at the reconstruction A_D D + A_O O + h.
// All matrices are stored in column major order.
double log_density_laplace(double noise_scale,          // Scale of randomization
			   int ndim,                    // Number of features -- "p"
			   int ninternal,               // Dimension of internal data representation often 1
			   int noptimization,           // Dimension of optimization variables -- "p"
			   double *internal_linear,     // A_D -- linear part for data
			   double *internal_state,      // D -- data state
			   double *optimization_linear, // A_O -- linear part for optimization variables
			   double *optimization_state,  // O -- optimization state
			   double *offset)              // h -- offset in affine transform -- "p" dimensional
{
  double value = 0;
  int irow, icol;

  for (irow = 0; irow < ndim; irow++) {

    // irow-th coordinate of A_D D + A_O O + h
    double reconstruction = offset[irow];

    // Data (internal) contribution: row irow of A_D times D
    for (icol = 0; icol < ninternal; icol++) {
      reconstruction += internal_linear[icol * ndim + irow] * internal_state[icol];
    }

    // Optimization contribution: row irow of A_O times O
    for (icol = 0; icol < noptimization; icol++) {
      reconstruction += optimization_linear[icol * ndim + irow] * optimization_state[icol];
    }

    value -= fabs(reconstruction) / noise_scale;
  }

  return value;
}
114+
115+
// Keeping internal (data) state fixed
116+
117+
// Gaussian log-density with the internal (data) state held fixed:
// only the optimization contribution A_O O + h is reconstructed.
// All matrices are stored in column major order.
double log_density_gaussian_conditional(double noise_scale,          // Scale of randomization
					int ndim,                    // Number of features -- "p"
					int noptimization,           // Dimension of optimization variables -- "p"
					double *optimization_linear, // A_O -- linear part for optimization variables
					double *optimization_state,  // O -- optimization state
					double *offset)              // h -- offset in affine transform -- "p" dimensional
{
  double denom = 2 * noise_scale * noise_scale;
  double value = 0;
  int irow, icol;

  for (irow = 0; irow < ndim; irow++) {

    // irow-th coordinate of A_O O + h
    double reconstruction = offset[irow];

    // Optimization contribution: row irow of A_O times O
    for (icol = 0; icol < noptimization; icol++) {
      reconstruction += optimization_linear[icol * ndim + irow] * optimization_state[icol];
    }

    value -= (reconstruction * reconstruction) / denom;
  }

  return value;
}
153+
154+
// Laplace log-density with the internal (data) state held fixed:
// only the optimization contribution A_O O + h is reconstructed.
// All matrices are stored in column major order.
double log_density_laplace_conditional(double noise_scale,          // Scale of randomization
				       int ndim,                    // Number of features -- "p"
				       int noptimization,           // Dimension of optimization variables -- "p"
				       double *optimization_linear, // A_O -- linear part for optimization variables
				       double *optimization_state,  // O -- optimization state
				       double *offset)              // h -- offset in affine transform -- "p" dimensional
{
  double value = 0;
  int irow, icol;

  for (irow = 0; irow < ndim; irow++) {

    // irow-th coordinate of A_O O + h
    double reconstruction = offset[irow];

    // Optimization contribution: row irow of A_O times O
    for (icol = 0; icol < noptimization; icol++) {
      reconstruction += optimization_linear[icol * ndim + irow] * optimization_state[icol];
    }

    value -= fabs(reconstruction) / noise_scale;
  }

  return value;
}

selectiveInference/src/randomized_lasso.h

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -35,7 +35,7 @@ double log_density_laplace_conditional(double noise_scale, // Scale
3535
int noptimization, // Dimension of optimization variables -- "p"
3636
double *optimization_linear, // A_O -- linear part for optimization variables
3737
double *optimization_state, // O -- optimization state
38-
double *offset). // h -- offset in affine transform -- "p" dimensional
38+
double *offset); // h -- offset in affine transform -- "p" dimensional
3939

4040
#ifdef __cplusplus
4141
} /* extern "C" */
Lines changed: 42 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,42 @@
1+
// Declarations of the randomized-LASSO log densities implemented in
// randomized_lasso.c.  Wrapped in extern "C" so they can be called from
// C++ (e.g. the Rcpp wrappers).  All matrices are column major.

#ifdef __cplusplus
extern "C"
{
#endif /* __cplusplus */

double log_density_gaussian(double noise_scale,          // Scale of randomization
                            int ndim,                    // Number of features -- "p"
                            int ninternal,               // Dimension of internal data representation often 1
                            int noptimization,           // Dimension of optimization variables -- "p"
                            double *internal_linear,     // A_D -- linear part for data
                            double *internal_state,      // D -- data state
                            double *optimization_linear, // A_O -- linear part for optimization variables
                            double *optimization_state,  // O -- optimization state
                            double *offset);             // h -- offset in affine transform -- "p" dimensional

double log_density_laplace(double noise_scale,          // Scale of randomization
                           int ndim,                    // Number of features -- "p"
                           int ninternal,               // Dimension of internal data representation often 1
                           int noptimization,           // Dimension of optimization variables -- "p"
                           double *internal_linear,     // A_D -- linear part for data
                           double *internal_state,      // D -- data state
                           double *optimization_linear, // A_O -- linear part for optimization variables
                           double *optimization_state,  // O -- optimization state
                           double *offset);             // h -- offset in affine transform -- "p" dimensional

double log_density_gaussian_conditional(double noise_scale,          // Scale of randomization
                                        int ndim,                    // Number of features -- "p"
                                        int noptimization,           // Dimension of optimization variables -- "p"
                                        double *optimization_linear, // A_O -- linear part for optimization variables
                                        double *optimization_state,  // O -- optimization state
                                        double *offset);             // h -- offset in affine transform -- "p" dimensional

// NOTE: fixed a syntax error here -- the declaration previously ended
// with ")." instead of ");" (same typo corrected in randomized_lasso.h).
double log_density_laplace_conditional(double noise_scale,          // Scale of randomization
                                       int ndim,                    // Number of features -- "p"
                                       int noptimization,           // Dimension of optimization variables -- "p"
                                       double *optimization_linear, // A_O -- linear part for optimization variables
                                       double *optimization_state,  // O -- optimization state
                                       double *offset);             // h -- offset in affine transform -- "p" dimensional

#ifdef __cplusplus
} /* extern "C" */
#endif /* __cplusplus */

0 commit comments

Comments
 (0)