
import tensorflow as tf
import tensorlayer as tl
-from tensorlayer.layers import set_keep
+from tensorlayer.layers import *
import numpy as np
import time, os, io
from PIL import Image

X_train, y_train, X_test, y_test = tl.files.load_cifar10_dataset(
    shape=(-1, 32, 32, 3), plotable=False)
-# scale = X_train.max()
-# X_train /= scale
-# X_test /= scale

-def model(x, y_, is_train, reuse):
+def model(x, y_, reuse):
    W_init = tf.truncated_normal_initializer(stddev=5e-2)
    W_init2 = tf.truncated_normal_initializer(stddev=0.04)
    b_init2 = tf.constant_initializer(value=0.1)
    with tf.variable_scope("model", reuse=reuse):
        tl.layers.set_name_reuse(reuse)
-        network = tl.layers.InputLayer(x, name='input')
-
-        network = tl.layers.Conv2dLayer(network, act=tf.identity,
-                shape=[5, 5, 3, 64], strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5x3 patch
-                W_init=W_init, b_init=None, name='cnn1')        # output: (batch_size, 24, 24, 64)
-        network = tl.layers.BatchNormLayer(network, is_train=is_train,
-                act=tf.nn.relu, name='batch1')
-        network = tl.layers.PoolLayer(network, ksize=[1, 3, 3, 1],
-                strides=[1, 2, 2, 1], padding='SAME',
-                pool=tf.nn.max_pool, name='pool1')              # output: (batch_size, 12, 12, 64)
-
-        network = tl.layers.Conv2dLayer(network, act=tf.identity,
-                shape=[5, 5, 64, 64], strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5 patch
-                W_init=W_init, b_init=None, name='cnn2')        # output: (batch_size, 12, 12, 64)
-        network = tl.layers.BatchNormLayer(network, is_train=is_train,
-                act=tf.nn.relu, name='batch2')
-        network = tl.layers.PoolLayer(network, ksize=[1, 3, 3, 1],
-                strides=[1, 2, 2, 1], padding='SAME',
-                pool=tf.nn.max_pool, name='pool2')              # output: (batch_size, 6, 6, 64)
-
-        network = tl.layers.FlattenLayer(network, name='flatten')   # output: (batch_size, 2304)
-        network = tl.layers.DenseLayer(network, n_units=384, act=tf.nn.relu,
+        net = InputLayer(x, name='input')
+        net = Conv2d(net, 64, (5, 5), (1, 1), padding='SAME',
+                W_init=W_init, name='cnn1')
+        # net = Conv2dLayer(net, act=tf.nn.relu, shape=[5, 5, 3, 64],
+        #         strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5x3 patch
+        #         W_init=W_init, name='cnn1')            # output: (batch_size, 24, 24, 64)
+        net = MaxPool2d(net, (3, 3), (2, 2), padding='SAME', name='pool1')
+        # net = PoolLayer(net, ksize=[1, 3, 3, 1], strides=[1, 2, 2, 1],
+        #         padding='SAME', pool=tf.nn.max_pool, name='pool1')  # output: (batch_size, 12, 12, 64)
+        net = LocalResponseNormLayer(net, depth_radius=4, bias=1.0,
+                alpha=0.001 / 9.0, beta=0.75, name='norm1')
+        # net.outputs = tf.nn.lrn(net.outputs, 4, bias=1.0, alpha=0.001 / 9.0,
+        #         beta=0.75, name='norm1')
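+        # LocalResponseNormLayer wraps tf.nn.lrn (the commented call above): each
+        # activation is normalised by the sum of squared activations of its
+        # depth_radius neighbouring channels.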
+
+        net = Conv2d(net, 64, (5, 5), (1, 1), padding='SAME',
+                W_init=W_init, name='cnn2')
+        # net = Conv2dLayer(net, act=tf.nn.relu, shape=[5, 5, 64, 64],
+        #         strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5 patch
+        #         W_init=W_init, name='cnn2')            # output: (batch_size, 12, 12, 64)
+        net = LocalResponseNormLayer(net, depth_radius=4, bias=1.0,
+                alpha=0.001 / 9.0, beta=0.75, name='norm2')
+        # net.outputs = tf.nn.lrn(net.outputs, 4, bias=1.0, alpha=0.001 / 9.0,
+        #         beta=0.75, name='norm2')
+        net = MaxPool2d(net, (3, 3), (2, 2), padding='SAME', name='pool2')
+        # net = PoolLayer(net, ksize=[1, 3, 3, 1], strides=[1, 2, 2, 1],
+        #         padding='SAME', pool=tf.nn.max_pool, name='pool2')  # output: (batch_size, 6, 6, 64)
+        net = FlattenLayer(net, name='flatten')           # output: (batch_size, 2304)
+        net = DenseLayer(net, n_units=384, act=tf.nn.relu,
                W_init=W_init2, b_init=b_init2, name='relu1')   # output: (batch_size, 384)
-        network = tl.layers.DenseLayer(network, n_units=192, act=tf.nn.relu,
+        net = DenseLayer(net, n_units=192, act=tf.nn.relu,
                W_init=W_init2, b_init=b_init2, name='relu2')    # output: (batch_size, 192)
-        network = tl.layers.DenseLayer(network, n_units=10, act=tf.identity,
+        net = DenseLayer(net, n_units=10, act=tf.identity,
                W_init=tf.truncated_normal_initializer(stddev=1 / 192.0),
-                b_init=tf.constant_initializer(value=0.0),
-                name='output')                                  # output: (batch_size, 10)
-        y = network.outputs
-        cost = tl.cost.cross_entropy(y, y_, name='cost')
-        L2 = tf.contrib.layers.l2_regularizer(0.004)(network.all_params[4]) + \
-             tf.contrib.layers.l2_regularizer(0.004)(network.all_params[6])
-        cost = cost + L2
+                name='output')                                  # output: (batch_size, 10)
+        y = net.outputs
+
+        ce = tl.cost.cross_entropy(y, y_, name='cost')
+        # L2 for the MLP, without this, the accuracy will be reduced by 15%.
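+        # Assuming the usual parameter order (conv weights/biases first), all_params[4]
+        # and all_params[6] are the weight matrices of the 'relu1' and 'relu2' dense layers.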
+        L2 = tf.contrib.layers.l2_regularizer(0.004)(net.all_params[4]) + \
+             tf.contrib.layers.l2_regularizer(0.004)(net.all_params[6])
+        cost = ce + L2
+
        correct_prediction = tf.equal(tf.argmax(y, 1), y_)
        acc = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

-        return network, cost, acc
+        return net, cost, acc


-def model2(x, y_, is_train, reuse):
+def model_batch_norm(x, y_, reuse, is_train):
+    """ Batch normalization should be placed before rectifier. """
    W_init = tf.truncated_normal_initializer(stddev=5e-2)
-    b_init = tf.constant_initializer(value=0.0)
    W_init2 = tf.truncated_normal_initializer(stddev=0.04)
    b_init2 = tf.constant_initializer(value=0.1)
    with tf.variable_scope("model", reuse=reuse):
        tl.layers.set_name_reuse(reuse)
-        network = tl.layers.InputLayer(x, name='input')
-        network = tl.layers.Conv2dLayer(network, act=tf.nn.relu,
-                shape=[5, 5, 3, 64], strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5x3 patch
-                W_init=W_init, b_init=b_init, name='cnn1')      # output: (batch_size, 24, 24, 64)
-        network = tl.layers.PoolLayer(network, ksize=[1, 3, 3, 1],
-                strides=[1, 2, 2, 1], padding='SAME',
-                pool=tf.nn.max_pool, name='pool1')              # output: (batch_size, 12, 12, 64)
-        # network.outputs = tf.nn.lrn(network.outputs, 4, bias=1.0, alpha=0.001 / 9.0,
-        #         beta=0.75, name='norm1')
-        network = tl.layers.LocalResponseNormLayer(network, depth_radius=4, bias=1.0,
-                alpha=0.001 / 9.0, beta=0.75, name='norm1')
-        network = tl.layers.Conv2dLayer(network, act=tf.nn.relu,
-                shape=[5, 5, 64, 64], strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5 patch
-                W_init=W_init, b_init=b_init, name='cnn2')      # output: (batch_size, 12, 12, 64)
-        # network.outputs = tf.nn.lrn(network.outputs, 4, bias=1.0, alpha=0.001 / 9.0,
-        #         beta=0.75, name='norm2')
-        network = tl.layers.LocalResponseNormLayer(network, depth_radius=4, bias=1.0,
-                alpha=0.001 / 9.0, beta=0.75, name='norm2')
-        network = tl.layers.PoolLayer(network, ksize=[1, 3, 3, 1],
-                strides=[1, 2, 2, 1], padding='SAME',
-                pool=tf.nn.max_pool, name='pool2')              # output: (batch_size, 6, 6, 64)
-        network = tl.layers.FlattenLayer(network, name='flatten')   # output: (batch_size, 2304)
-        network = tl.layers.DenseLayer(network, n_units=384, act=tf.nn.relu,
+        net = InputLayer(x, name='input')
+
+        net = Conv2d(net, 64, (5, 5), (1, 1), padding='SAME',
+                W_init=W_init, b_init=None, name='cnn1')
+        # net = Conv2dLayer(net, act=tf.identity, shape=[5, 5, 3, 64],
+        #         strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5x3 patch
+        #         W_init=W_init, b_init=None, name='cnn1')   # output: (batch_size, 24, 24, 64)
+        net = BatchNormLayer(net, is_train, act=tf.nn.relu, name='batch1')
+        net = MaxPool2d(net, (3, 3), (2, 2), padding='SAME', name='pool1')
+        # net = PoolLayer(net, ksize=[1, 3, 3, 1], strides=[1, 2, 2, 1],
+        #         padding='SAME', pool=tf.nn.max_pool, name='pool1')  # output: (batch_size, 12, 12, 64)
+
+        net = Conv2d(net, 64, (5, 5), (1, 1), padding='SAME',
+                W_init=W_init, b_init=None, name='cnn2')
+        # net = Conv2dLayer(net, act=tf.identity, shape=[5, 5, 64, 64],
+        #         strides=[1, 1, 1, 1], padding='SAME',  # 64 features for each 5x5 patch
+        #         W_init=W_init, b_init=None, name='cnn2')   # output: (batch_size, 12, 12, 64)
+        net = BatchNormLayer(net, is_train, act=tf.nn.relu, name='batch2')
+        net = MaxPool2d(net, (3, 3), (2, 2), padding='SAME', name='pool2')
+        # net = PoolLayer(net, ksize=[1, 3, 3, 1], strides=[1, 2, 2, 1],
+        #         padding='SAME', pool=tf.nn.max_pool, name='pool2')  # output: (batch_size, 6, 6, 64)
+
+        net = FlattenLayer(net, name='flatten')              # output: (batch_size, 2304)
+        net = DenseLayer(net, n_units=384, act=tf.nn.relu,
                W_init=W_init2, b_init=b_init2, name='relu1')   # output: (batch_size, 384)
-        network = tl.layers.DenseLayer(network, n_units=192, act=tf.nn.relu,
+        net = DenseLayer(net, n_units=192, act=tf.nn.relu,
                W_init=W_init2, b_init=b_init2, name='relu2')    # output: (batch_size, 192)
-        network = tl.layers.DenseLayer(network, n_units=10, act=tf.identity,
+        net = DenseLayer(net, n_units=10, act=tf.identity,
                W_init=tf.truncated_normal_initializer(stddev=1 / 192.0),
-                b_init=tf.constant_initializer(value=0.0),
-                name='output')                                  # output: (batch_size, 10)
-        y = network.outputs
+                name='output')                                  # output: (batch_size, 10)
+        y = net.outputs

        ce = tl.cost.cross_entropy(y, y_, name='cost')
        # L2 for the MLP, without this, the accuracy will be reduced by 15%.
-        L2 = tf.contrib.layers.l2_regularizer(0.004)(network.all_params[4]) + \
-             tf.contrib.layers.l2_regularizer(0.004)(network.all_params[6])
+        L2 = tf.contrib.layers.l2_regularizer(0.004)(net.all_params[4]) + \
+             tf.contrib.layers.l2_regularizer(0.004)(net.all_params[6])
        cost = ce + L2

-        # correct_prediction = tf.equal(tf.argmax(tf.nn.softmax(y), 1), y_)
        correct_prediction = tf.equal(tf.argmax(y, 1), y_)
        acc = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

-        return network, cost, acc
-
+        return net, cost, acc

def distort_fn(x, is_train=False):
    """
@@ -127,7 +130,6 @@ def distort_fn(x, is_train=False):
    artificially increase the data set size:
    .. Randomly flip the image from left to right.
    .. Randomly distort the image brightness.
-    .. Randomly zoom in.
    """
    # print('begin', x.shape, np.min(x), np.max(x))
    x = tl.prepro.crop(x, 24, 24, is_random=is_train)
@@ -140,22 +142,20 @@ def distort_fn(x, is_train=False):
        x = tl.prepro.brightness(x, gamma=0.1, gain=1, is_random=True)
        # print('after brightness', x.shape, np.min(x), np.max(x))
        # tmp = np.max(x)
-        # x += np.random.uniform(-0.1, 0.1)
+        # x += np.random.uniform(-20, 20)
        # x /= tmp
    # normalize the image
-    x = (x - np.mean(x)) / max(np.std(x), 1.0 / 24.0)   # avoid values divided by 0
+    x = (x - np.mean(x)) / max(np.std(x), 1e-5)          # avoid values divided by 0
    # print('after norm', x.shape, np.min(x), np.max(x), np.mean(x))
    return x

-# x = X_train[0]
-# x = distort_fn(x, True)
-# exit()
-
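+# distort_fn processes a single image; the training/evaluation loops below map it over a
+# whole minibatch with tl.prepro.threading_data(X_batch, fn=distort_fn, is_train=...).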
x = tf.placeholder(tf.float32, shape=[None, 24, 24, 3], name='x')
y_ = tf.placeholder(tf.int64, shape=[None, ], name='y_')

-network, cost, _ = model2(x, y_, True, False)
-_, cost_test, acc = model2(x, y_, False, True)
+# network, cost, _ = model(x, y_, False)
+# _, cost_test, acc = model(x, y_, True)
+network, cost, _ = model_batch_norm(x, y_, False, is_train=True)
+_, cost_test, acc = model_batch_norm(x, y_, True, is_train=False)
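+# The second call builds the evaluation graph with reuse=True, so it shares the weights
+# created by the training graph; is_train switches BatchNormLayer between per-batch
+# statistics (training) and its moving averages (testing).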

## train
n_epoch = 50000
@@ -184,14 +184,14 @@ def distort_fn(x, is_train=False):

    if epoch + 1 == 1 or (epoch + 1) % print_freq == 0:
        print("Epoch %d of %d took %fs" % (epoch + 1, n_epoch, time.time() - start_time))
-        train_loss, train_acc, n_batch = 0, 0, 0
-        for X_train_a, y_train_a in tl.iterate.minibatches(
-                X_train, y_train, batch_size, shuffle=True):
-            X_train_a = tl.prepro.threading_data(X_train_a, fn=distort_fn, is_train=False)  # central crop
-            err, ac = sess.run([cost_test, acc], feed_dict={x: X_train_a, y_: y_train_a})
-            train_loss += err; train_acc += ac; n_batch += 1
-        print("   train loss: %f" % (train_loss / n_batch))
-        print("   train acc: %f" % (train_acc / n_batch))
+        # train_loss, train_acc, n_batch = 0, 0, 0
+        # for X_train_a, y_train_a in tl.iterate.minibatches(
+        #         X_train, y_train, batch_size, shuffle=True):
+        #     X_train_a = tl.prepro.threading_data(X_train_a, fn=distort_fn, is_train=False)  # central crop
+        #     err, ac = sess.run([cost_test, acc], feed_dict={x: X_train_a, y_: y_train_a})
+        #     train_loss += err; train_acc += ac; n_batch += 1
+        # print("   train loss: %f" % (train_loss / n_batch))
+        # print("   train acc: %f" % (train_acc / n_batch))
        test_loss, test_acc, n_batch = 0, 0, 0
        for X_test_a, y_test_a in tl.iterate.minibatches(
                X_test, y_test, batch_size, shuffle=True):