Merge pull request #21 from jonathan-taylor/general_pivot

jonathan-taylor · web-flow · commit e887312a04b3 · 2017-08-04T13:16:48.000-07:00
General pivot -- exposes functions for TG and eliminates poly.* and mypoly.*
diff --git a/selectiveInference/NAMESPACE b/selectiveInference/NAMESPACE
@@ -12,7 +12,10 @@ export(lar,fs,
        estimateSigma,
        manyMeans,print.manyMeans,
        groupfs,groupfsInf,
-       scaleGroups,factorDesign
+       scaleGroups,factorDesign,
+       TG.pvalue, 
+       TG.limits, 
+       TG.interval
     )
 
 S3method("coef", "lar")
diff --git a/selectiveInference/R/funs.fixed.R b/selectiveInference/R/funs.fixed.R
@@ -122,14 +122,19 @@ else{
     vj = vj / mj        # Standardize (divide by norm of vj)
     sign[j] = sign(sum(vj*y))
     vj = sign[j] * vj
-    a = poly.pval(y,G,u,vj,sigma,bits)
+
+    limits.info = TG.limits(y, -G, -u, vj, Sigma=diag(rep(sigma^2, n)))
+    a = TG.pvalue.base(limits.info, bits=bits)
     pv[j] = a$pv
     vlo[j] = a$vlo * mj # Unstandardize (mult by norm of vj)
     vup[j] = a$vup * mj # Unstandardize (mult by norm of vj)
     vmat[j,] = vj * mj * sign[j]  # Unstandardize (mult by norm of vj)
 
-    a = poly.int(y,G,u,vj,sigma,alpha,gridrange=gridrange,
-      flip=(sign[j]==-1),bits=bits)
+    a = TG.interval.base(limits.info, 
+                         alpha=alpha,
+                         gridrange=gridrange,
+			 flip=(sign[j]==-1),
+                         bits=bits)
     ci[j,] = a$int * mj # Unstandardize (mult by norm of vj)
     tailarea[j,] = a$tailarea
   }
diff --git a/selectiveInference/R/funs.fixedCox.R b/selectiveInference/R/funs.fixedCox.R
@@ -62,14 +62,14 @@ b1= -(mydiag(s2)%*%MM)%*%s2*lambda
       vj=rep(0,length(bbar));vj[jj]=s2[jj]
 
 
-      junk=mypoly.pval.lee(bbar,A1,b1,vj,MM)
+      junk=TG.pvalue(bbar, A1, b1, vj,MM)
 
        pv[jj] = junk$pv
       vlo[jj]=junk$vlo
        vup[jj]=junk$vup
        sd[jj]=junk$sd
 
-      junk2=mypoly.int.lee(bbar,vj,vlo[jj],vup[jj],sd[jj],alpha)
+      junk2=TG.interval(bbar, A1, b1, vj, MM, alpha)
        ci[jj,]=junk2$int
        tailarea[jj,] = junk2$tailarea
      
diff --git a/selectiveInference/R/funs.fixedLogit.R b/selectiveInference/R/funs.fixedLogit.R
@@ -89,14 +89,14 @@ fixedLogitLassoInf=function(x,y,beta,lambda,alpha=.1, type=c("partial"), tol.bet
     for(jj in 1:sum(m)){
        vj=c(rep(0,sum(m)+1));vj[jj+1]=s2[jj+1]
       # compute p-values
-      junk=mypoly.pval.lee(bbar,A1,b1,vj,MM)
+      junk=TG.pvalue(bbar, A1, b1, vj, MM)
       pv[jj] = junk$pv
  
    vlo[jj]=junk$vlo
    vup[jj]=junk$vup
        sd[jj]=junk$sd
-  #  junk2=mypoly.int.lee(bbar[-1], A1, b1,vj,MM[-1,-1],alpha=.1)
-     junk2=mypoly.int.lee(bbar,vj,vlo[jj],vup[jj],sd[jj],alpha=alpha)
+
+     junk2=TG.interval(bbar, A1, b1, vj, MM,alpha=alpha)
 
      ci[jj,]=junk2$int
      tailarea[jj,] = junk2$tailarea
diff --git a/selectiveInference/R/funs.fs.R b/selectiveInference/R/funs.fs.R
@@ -299,15 +299,21 @@ fsInf <- function(obj, sigma=NULL, alpha=0.1, k=NULL, type=c("active","all","aic
       vj = vreg[j,]
       mj = sqrt(sum(vj^2)) 
       vj = vj / mj              # Standardize (divide by norm of vj)
-      a = poly.pval(y,Gj,uj,vj,sigma,bits)
+
+      limits.info = TG.limits(y, -Gj, -uj, vj, Sigma=diag(rep(sigma^2, n)))
+      a = TG.pvalue.base(limits.info, bits=bits)
+
       pv[j] = a$pv
       sxj = sx[vars[j]]
       vlo[j] = a$vlo * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       vup[j] = a$vup * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       vmat[j,] = vj * mj / sxj  # Unstandardize (mult by norm of vj / sxj)
   
-      a = poly.int(y,Gj,uj,vj,sigma,alpha,gridrange=gridrange,
-        flip=(sign[j]==-1),bits=bits)
+      a = TG.interval.base(limits.info, 
+                           alpha=alpha,
+			   gridrange=gridrange,
+			   flip=(sign[j]==-1),
+			   bits=bits)
       ci[j,] = a$int * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       tailarea[j,] = a$tailarea
     }
@@ -349,15 +355,19 @@ fsInf <- function(obj, sigma=NULL, alpha=0.1, k=NULL, type=c("active","all","aic
       Gj = rbind(G,vj)
       uj = c(u,0)
 
-      a = poly.pval(y,Gj,uj,vj,sigma,bits)
+      limits.info = TG.limits(y, -Gj, -uj, vj, Sigma=diag(rep(sigma^2, n)))
+      a = TG.pvalue.base(limits.info, bits=bits)
       pv[j] = a$pv
       sxj = sx[vars[j]]
       vlo[j] = a$vlo * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       vup[j] = a$vup * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       vmat[j,] = vj * mj / sxj  # Unstandardize (mult by norm of vj / sxj)
 
-      a = poly.int(y,Gj,uj,vj,sigma,alpha,gridrange=gridrange,
-        flip=(sign[j]==-1),bits=bits)
+      a = TG.interval.base(limits.info,
+                           alpha=alpha,
+                           gridrange=gridrange,
+			   flip=(sign[j]==-1),
+                           bits=bits)
       ci[j,] = a$int * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       tailarea[j,] = a$tailarea
     }
diff --git a/selectiveInference/R/funs.inf.R b/selectiveInference/R/funs.inf.R
@@ -1,48 +1,3 @@
-# Main p-value function
-
-poly.pval <- function(y, G, u, v, sigma, bits=NULL) {
-  z = sum(v*y)
-  vv = sum(v^2)
-  sd = sigma*sqrt(vv)
-  
-  rho = G %*% v / vv
-  vec = (u - G %*% y + rho*z) / rho
-  vlo = suppressWarnings(max(vec[rho>0]))
-  vup = suppressWarnings(min(vec[rho<0]))
-
-  pv = tnorm.surv(z,0,sd,vlo,vup,bits)
-  return(list(pv=pv,vlo=vlo,vup=vup))
-}
-
-# Main confidence interval function
-
-poly.int <- function(y, G, u, v, sigma, alpha, gridrange=c(-100,100),
-                     gridpts=100, griddepth=2, flip=FALSE, bits=NULL) {
-  
-  z = sum(v*y)
-  vv = sum(v^2)
-  sd = sigma*sqrt(vv)
-  
-  rho = G %*% v / vv
-  vec = (u - G %*% y + rho*z) / rho
-  vlo = suppressWarnings(max(vec[rho>0]))
-  vup = suppressWarnings(min(vec[rho<0]))
-  
-  xg = seq(gridrange[1]*sd,gridrange[2]*sd,length=gridpts)
-  fun = function(x) { tnorm.surv(z,x,sd,vlo,vup,bits) }
-
-  int = grid.search(xg,fun,alpha/2,1-alpha/2,gridpts,griddepth)
-  tailarea = c(fun(int[1]),1-fun(int[2]))
-
-  if (flip) {
-    int = -int[2:1]
-    tailarea = tailarea[2:1]
-  }
-  
-  return(list(int=int,tailarea=tailarea))
-}
-
-##############################
 
 # Assuming that grid is in sorted order from smallest to largest,
 # and vals are monotonically increasing function values over the
@@ -247,48 +202,95 @@ aicStop <- function(x, y, action, df, sigma, mult=2, ntimes=2) {
 
 #these next two functions are used by the binomial and Cox options of fixedLassoInf
 
-mypoly.pval.lee=
-function(y, A, b, eta, Sigma, bits=NULL) {
+# Compute the truncation interval and SD of the corresponding Gaussian
+
+TG.limits = function(Z, A, b, eta, Sigma=NULL) {
+    # Truncation interval [vlo, vup], SD and observed value of sum(eta * Z)
+    # for Z with covariance Sigma restricted to A %*% Z <= b (elementwise).
+    # Sigma=NULL means the identity. Returns list(vlo, vup, sd, estimate).
+    Z = as.numeric(Z)
+    n = length(Z)   # must be set before the Sigma default below uses it
+    target_estimate = sum(as.numeric(eta) * Z)
+
+    if (max(A %*% Z - b) > 0) {
+        warning('Constraint not satisfied. A %*% Z should be elementwise less than or equal to b')
+    }
+    if (is.null(Sigma)) Sigma = diag(n)
     # compute pvalues from poly lemma:  full version from Lee et al for full matrix Sigma
-    nn=length(y)
-    eta=as.vector(eta)
-  temp = sum(eta*y)
-   vv=as.numeric(matrix(eta,nrow=1,ncol=nn)%*%Sigma%*%eta)
-   cc = Sigma%*%eta/vv
-   
- z=(diag(nn)-matrix(cc,ncol=1)%*%eta)%*%y
-    rho=A%*%cc
+
+    eta = matrix(eta, ncol=1, nrow=n)
+    b = as.vector(b)
+    cross_cov = Sigma %*% eta                   # covariance of Z with eta'Z
+    var_estimate = sum(t(eta) %*% cross_cov)    # variance of eta'Z
+    # resid below is the part of Z left after removing its regression on eta'Z
    
-  vec = (b- A %*% z)/rho
-  vlo = suppressWarnings(max(vec[rho<0]))
-  vup = suppressWarnings(min(vec[rho>0]))
-  sd=sqrt(vv)
-  pv = tnorm.surv(temp,0,sd,vlo,vup,bits)
-  return(list(pv=pv,vlo=vlo,vup=vup,sd=sd))
+    resid = (diag(n) - (cross_cov / var_estimate) %*% t(eta)) %*% Z
+    rho = A %*% cross_cov / var_estimate
+    vec = (b - as.numeric(A %*% resid)) / rho
+
+    # an empty selection gives -Inf / Inf (the warning is suppressed on purpose)
+    vlo = suppressWarnings(max(vec[rho < 0]))
+    vup = suppressWarnings(min(vec[rho > 0]))
+
+    return(list(vlo=vlo, vup=vup, sd=sqrt(var_estimate), estimate=target_estimate))
+}
+
+TG.pvalue = function(Z, A, b, eta, Sigma=NULL, null_value=0, bits=NULL) {
+    # Step 1: truncation limits, SD and observed value from TG.limits.
+    truncation = TG.limits(Z, A, b, eta, Sigma)
+    # Step 2: p-value at null_value; the result is list(pv, vlo, vup, sd).
+    TG.pvalue.base(truncation, null_value=null_value, bits=bits)
 }
 
+# Confidence interval for eta'Z from Z, the constraints (A, b) and Sigma.
+# Z, A, b, eta, Sigma go to TG.limits; all other arguments are forwarded
+# unchanged to TG.interval.base, whose result (int, tailarea) is returned.
+TG.interval = function(Z, A, b, eta, Sigma=NULL, alpha=0.1, 
+                       gridrange=c(-100,100), gridpts=100, griddepth=2, 
+                       flip=FALSE, bits=NULL) {
+
+    limits.info = TG.limits(Z, A, b, eta, Sigma)
+
+    # gridpts has to be forwarded explicitly: without it a caller-supplied
+    # value is silently replaced by the TG.interval.base default of 100.
+    return(TG.interval.base(limits.info, 
+                            alpha=alpha, 
+                            gridrange=gridrange, gridpts=gridpts,
+                            griddepth=griddepth, flip=flip, bits=bits))
+}
 
+TG.interval.base = function(limits.info, alpha=0.1,   # limits.info: list with estimate, sd, vlo, vup (the fields read below)
+                            gridrange=c(-100,100),    # multiplied by limits.info$sd to give the end points of the search grid
+                            gridpts=100,              # number of grid points; also passed on to grid.search
+                            griddepth=2,              # passed on to grid.search
+                            flip=FALSE,               # TRUE: return the negated interval with swapped end points
+                            bits=NULL) {              # passed on to tnorm.surv
 
-mypoly.int.lee=
-   function(y,eta,vlo,vup,sd, alpha, gridrange=c(-100,100),gridpts=100, griddepth=2, flip=FALSE, bits=NULL) {
     # compute sel intervals from poly lemmma, full version from Lee et al for full matrix Sigma
 
-  temp = sum(eta*y)
-  
-  xg = seq(gridrange[1]*sd,gridrange[2]*sd,length=gridpts)
-  fun = function(x) { tnorm.surv(temp,x,sd,vlo,vup,bits) }
+    param_grid = seq(gridrange[1] * limits.info$sd, gridrange[2] * limits.info$sd, length=gridpts)  # candidate parameter values
 
-  int = grid.search(xg,fun,alpha/2,1-alpha/2,gridpts,griddepth)
-  tailarea = c(fun(int[1]),1-fun(int[2]))
+    pivot = function(param) {  # tnorm.surv at the observed estimate for a candidate param (presumably the truncated-normal mean -- confirm)
+        tnorm.surv(limits.info$estimate, param, limits.info$sd, limits.info$vlo, limits.info$vup, bits) 
+    }
 
-  if (flip) {
-    int = -int[2:1]
-    tailarea = tailarea[2:1]
-  }
+    interval = grid.search(param_grid, pivot, alpha/2, 1-alpha/2, gridpts, griddepth)  # presumably where pivot crosses alpha/2 and 1-alpha/2 -- confirm in grid.search
+    tailarea = c(pivot(interval[1]), 1- pivot(interval[2]))  # pivot at the lower end point, 1 - pivot at the upper one
+    # flip: negate the interval and swap its end points and the two tail areas
+    if (flip) {
+        interval = -interval[2:1]
+        tailarea = tailarea[2:1]
+     }
  
-  return(list(int=int,tailarea=tailarea))
+     # the element keeps the name 'int' even though it reads like 'integer'
+     return(list(int=interval,
+                 tailarea=tailarea))
 }
 
+TG.pvalue.base = function(limits.info, null_value=0, bits=NULL) {  # limits.info: list with estimate, sd, vlo, vup
+    lo = limits.info$vlo; hi = limits.info$vup; sdev = limits.info$sd
+    list(pv=tnorm.surv(limits.info$estimate, null_value, sdev, lo, hi, bits), vlo=lo, vup=hi, sd=sdev)
+}
 
 
 mydiag=function(x){
diff --git a/selectiveInference/R/funs.lar.R b/selectiveInference/R/funs.lar.R
@@ -379,15 +379,20 @@ larInf <- function(obj, sigma=NULL, alpha=0.1, k=NULL, type=c("active","all","ai
       vj = vreg[j,]
       mj = sqrt(sum(vj^2))
       vj = vj / mj              # Standardize (divide by norm of vj)
-      a = poly.pval(y,Gj,uj,vj,sigma,bits)
+
+      limits.info = TG.limits(y, -Gj, -uj, vj, Sigma=diag(rep(sigma^2, n)))
+      a = TG.pvalue.base(limits.info, bits=bits)
       pv[j] = a$pv
       sxj = sx[vars[j]]
       vlo[j] = a$vlo * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       vup[j] = a$vup * mj / sxj # Unstandardize (mult by norm of vj)
       vmat[j,] = vj * mj / sxj  # Unstandardize (mult by norm of vj / sxj)
 
-      a = poly.int(y,Gj,uj,vj,sigma,alpha,gridrange=gridrange,
-        flip=(sign[j]==-1),bits=bits)
+      a = TG.interval.base(limits.info,
+                           alpha=alpha,
+                           gridrange=gridrange,
+                           flip=(sign[j]==-1),
+                           bits=bits)
       ci[j,] = a$int * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       tailarea[j,] = a$tailarea
 
@@ -433,15 +438,20 @@ larInf <- function(obj, sigma=NULL, alpha=0.1, k=NULL, type=c("active","all","ai
       Gj = rbind(G,vj)
       uj = c(u,0)
 
-      a = poly.pval(y,Gj,uj,vj,sigma,bits)
+      limits.info = TG.limits(y, -Gj, -uj, vj, Sigma=diag(rep(sigma^2, n)))
+      a = TG.pvalue.base(limits.info, bits=bits)
+
       pv[j] = a$pv
       sxj = sx[vars[j]]
       vlo[j] = a$vlo * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       vup[j] = a$vup * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       vmat[j,] = vj * mj / sxj  # Unstandardize (mult by norm of vj / sxj)
 
-      a = poly.int(y,Gj,uj,vj,sigma,alpha,gridrange=gridrange,
-        flip=(sign[j]==-1),bits=bits)
+      a = TG.interval.base(limits.info,
+                           alpha=alpha,
+                           gridrange=gridrange,
+                           flip=(sign[j]==-1),
+                           bits=bits)
       ci[j,] = a$int * mj / sxj # Unstandardize (mult by norm of vj / sxj)
       tailarea[j,] = a$tailarea
     }
diff --git a/selectiveInference/man/TG.interval.Rd b/selectiveInference/man/TG.interval.Rd
diff --git a/selectiveInference/man/TG.limits.Rd b/selectiveInference/man/TG.limits.Rd
diff --git a/selectiveInference/man/TG.pvalue.Rd b/selectiveInference/man/TG.pvalue.Rd