@@ -180,7 +180,7 @@ def _calc_elbo(vars, model, n_mcsamples, random_seed):
 
     [logp], inarray = pm.join_nonshared_inputs([logpt], vars, shared)
 
-    uw = tt.dvector('uw')
+    uw = tt.vector('uw')
     uw.tag.test_value = np.concatenate([inarray.tag.test_value,
                                         inarray.tag.test_value])
 
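tt.dvector pins the packed parameter vector to float64, while tt.vector picks up theano.config.floatX, so this hunk lets the ADVI graph stay in float32 on float32 setups. Below is a minimal sketch, not part of the patch, that only assumes Theano is run with THEANO_FLAGS=floatX=float32:

# Sketch: dtype of the symbolic variable under floatX=float32.
# Run with THEANO_FLAGS=floatX=float32 (assumption, not part of the patch).
import theano
import theano.tensor as tt

uw_f64 = tt.dvector('uw')   # dvector is pinned to float64
uw_flex = tt.vector('uw')   # vector follows theano.config.floatX

print(uw_f64.dtype)         # always 'float64'
print(uw_flex.dtype)        # 'float32' when floatX=float32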
@@ -192,9 +192,10 @@ def _calc_elbo(vars, model, n_mcsamples, random_seed):
 def _elbo_t(logp, uw, inarray, n_mcsamples, random_seed):
     """Create Theano tensor of approximate ELBO by Monte Carlo sampling.
     """
-    l = (uw.size / 2).astype('int64')
-    u = uw[:l]
-    w = uw[l:]
+    l = (uw.size / 2)
+    l_int = l.astype('int64')
+    u = uw[:l_int]
+    w = uw[l_int:]
 
     # Callable tensor
     def logp_(input):
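The packed vector uw carries the variational means in its first half and the log standard deviations in its second half. Slicing a symbolic vector needs an integer bound, so the half-length is cast to int64 for indexing (l_int), while the uncast l is kept for the scalar arithmetic in the ELBO term further down. A short sketch of the split, with an illustrative input that is not from the patch:

# Sketch: splitting the packed mean-field parameters into u (means) and
# w (log standard deviations).
import numpy as np
import theano
import theano.tensor as tt

uw = tt.vector('uw')
l = uw.size / 2            # symbolic half-length, used later as a plain scalar
l_int = l.astype('int64')  # slicing requires an integer index
u = uw[:l_int]             # variational means
w = uw[l_int:]             # log standard deviations

split = theano.function([uw], [u, w])
means, log_sds = split(np.arange(6).astype(theano.config.floatX))
print(means)    # [0. 1. 2.]
print(log_sds)  # [3. 4. 5.]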
@@ -209,14 +210,14 @@ def logp_(input):
     if n_mcsamples == 1:
         n = r.normal(size=inarray.tag.test_value.shape)
         q = n * tt.exp(w) + u
-        elbo = logp_(q) + tt.sum(w) + 0.5 * l * (1 + np.log(2.0 * np.pi))
+        elbo = logp_(q) + tt.sum(w) + 0.5 * l * (1 + tt.log(2.0 * np.pi))
     else:
         n = r.normal(size=(n_mcsamples, u.tag.test_value.shape[0]))
         qs = n * tt.exp(w) + u
         logps, _ = theano.scan(fn=lambda q: logp_(q),
                                outputs_info=None,
                                sequences=[qs])
-        elbo = tt.mean(logps) + tt.sum(w) + 0.5 * l * (1 + np.log(2.0 * np.pi))
+        elbo = tt.mean(logps) + tt.sum(w) + 0.5 * l * (1 + tt.log(2.0 * np.pi))
 
     return elbo
 
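The term tt.sum(w) + 0.5 * l * (1 + log(2 * pi)) is the entropy of the mean-field Gaussian q = N(u, diag(exp(w))^2), i.e. H[q] = sum_i w_i + (d / 2) * (1 + log(2 * pi)), so elbo is the Monte Carlo estimate of E_q[log p] + H[q]. Replacing np.log with tt.log keeps that constant inside the Theano graph; np.log returns a NumPy float64 scalar, which would presumably upcast a float32 graph. A minimal sketch of the dtype difference, not part of the patch and assuming floatX=float32:

# Sketch: dtype of the log(2*pi) constant.
# Run with THEANO_FLAGS=floatX=float32 (assumption).
import numpy as np
import theano
import theano.tensor as tt

c_np = np.log(2.0 * np.pi)      # NumPy float64 scalar
c_tt = tt.log(2.0 * np.pi)      # Theano constant, created at floatX

print(type(c_np), c_np.dtype)   # numpy.float64, float64
print(c_tt.dtype)               # expected 'float32' when floatX=float32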
@@ -250,14 +251,15 @@ def optimizer(loss, param):
             param = list(param)
 
         for param_ in param:
-            i = theano.shared(np.array(0))
+            i = theano.shared(np.array(0, dtype=theano.config.floatX))
+            i_int = i.astype('int64')
             value = param_.get_value(borrow=True)
             accu = theano.shared(
                 np.zeros(value.shape + (n_win,), dtype=value.dtype))
             grad = tt.grad(loss, param_)
 
             # Append squared gradient vector to accu_new
-            accu_new = tt.set_subtensor(accu[:, i], grad ** 2)
+            accu_new = tt.set_subtensor(accu[:, i_int], grad ** 2)
             i_new = tt.switch((i + 1) < n_win, i + 1, 0)
 
             updates[accu] = accu_new
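In the windowed-Adagrad optimizer the wrap-around counter i is now stored as a floatX shared scalar, and an int64 cast (i_int) is taken only where it serves as an index, since set_subtensor needs an integer index. The sketch below mirrors that bookkeeping on a toy parameter and loss; the parameter, the loss and the n_win value are illustrative, not taken from the patch:

# Sketch: windowed-Adagrad bookkeeping on a toy parameter and loss.
# A circular buffer keeps the last n_win squared gradients; the write
# position is a counter that wraps back to 0 after n_win steps.
from collections import OrderedDict

import numpy as np
import theano
import theano.tensor as tt

n_win = 10
param_ = theano.shared(np.ones(3, dtype=theano.config.floatX), name='param')
loss = tt.sum(param_ ** 2)   # toy loss

i = theano.shared(np.array(0, dtype=theano.config.floatX))  # counter kept at floatX
i_int = i.astype('int64')                                   # integer view for indexing

value = param_.get_value(borrow=True)
accu = theano.shared(np.zeros(value.shape + (n_win,), dtype=value.dtype))
grad = tt.grad(loss, param_)

# Write the current squared gradient into column i of the window,
# then advance the counter, wrapping after n_win steps.
accu_new = tt.set_subtensor(accu[:, i_int], grad ** 2)
i_new = tt.switch((i + 1) < n_win, i + 1, 0)

updates = OrderedDict([(accu, accu_new), (i, i_new)])
step = theano.function([], grad, updates=updates)
step()
print(i.get_value())            # 1.0
print(accu.get_value()[:, 0])   # squared gradient from the first step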