"""
visit https://morvanzhou.github.io/tutorials/ for more!

Build two networks.
1. Without batch normalization
2. With batch normalization

Run tests on these two networks.
"""

# 23 Batch Normalization

import numpy as np
import tensorflow as tf
import matplotlib.pyplot as plt


ACTIVATION = tf.nn.relu   # activation function used in every hidden layer
N_LAYERS = 7              # number of hidden layers
N_HIDDEN_UNITS = 30       # units in each hidden layer


def fix_seed(seed=1):
    # reproducible
    np.random.seed(seed)
    tf.set_random_seed(seed)


def plot_his(inputs, inputs_norm):
    # plot histogram for the inputs of every layer

    for j, all_inputs in enumerate([inputs, inputs_norm]):
        for i, input in enumerate(all_inputs):
            plt.subplot(2, len(all_inputs), j*len(all_inputs)+(i+1))
            plt.cla()
            plt.hist(input.ravel(), bins=15, range=(-1, 1), color='#FF5733')
            plt.yticks(())
            if j == 1:
                plt.xticks((-1, 0, 1))
            else:
                plt.xticks(())
            ax = plt.gca()
            ax.spines['right'].set_color('none')
            ax.spines['top'].set_color('none')
        plt.title("%s normalizing" % ("Without" if j == 0 else "With"))
    plt.draw()
    plt.pause(0.01)


def built_net(xs, ys, norm):
    def add_layer(inputs, in_size, out_size, activation_function=None, norm=False):
        # weights and biases (bad initialization for this case)
        Weights = tf.Variable(tf.random_normal([in_size, out_size], mean=0., stddev=1.))
        biases = tf.Variable(tf.zeros([1, out_size]) + 0.1)

        # fully connected product
        Wx_plus_b = tf.matmul(inputs, Weights) + biases

        # normalize fully connected product
        if norm:
            # Batch Normalize
            fc_mean, fc_var = tf.nn.moments(
                Wx_plus_b,
                axes=[0],   # the dimensions to normalize over; [0] means across the batch
                            # for images, use [0, 1, 2] for [batch, height, width], leaving out the channel axis
            )
            scale = tf.Variable(tf.ones([out_size]))
            shift = tf.Variable(tf.zeros([out_size]))
            epsilon = 0.001
            # equivalent to:
            # Wx_plus_b = scale * (Wx_plus_b - fc_mean) / tf.sqrt(fc_var + epsilon) + shift
            Wx_plus_b = tf.nn.batch_normalization(Wx_plus_b, fc_mean, fc_var, shift, scale, epsilon)
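            # note: the mean/variance above come from the current batch only; this
            # simplified demo keeps no moving averages for use at test time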

        # activation
        if activation_function is None:
            outputs = Wx_plus_b
        else:
            outputs = activation_function(Wx_plus_b)

        return outputs

    fix_seed(1)
    # record inputs for every layer
    layers_inputs = [xs]

    # build hidden layers
    for l_n in range(N_LAYERS):
        layer_input = layers_inputs[l_n]
        in_size = layers_inputs[l_n].get_shape()[1].value

        output = add_layer(
            layer_input,        # input
            in_size,            # input size
            N_HIDDEN_UNITS,     # output size
            ACTIVATION,         # activation function
            norm,               # normalize before activation
        )
        layers_inputs.append(output)    # add output for next run

    # build output layer
    prediction = add_layer(layers_inputs[-1], N_HIDDEN_UNITS, 1, activation_function=None)

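    # squared-error loss, minimized with plain gradient descent (learning rate 0.001)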
    cost = tf.reduce_mean(tf.reduce_sum(tf.square(ys - prediction), reduction_indices=[1]))
    train_op = tf.train.GradientDescentOptimizer(0.001).minimize(cost)
    return [train_op, cost, layers_inputs]


# make up data
fix_seed(1)
x_data = np.linspace(-7, 10, 500)[:, np.newaxis]
noise = np.random.normal(0, 8, x_data.shape)
y_data = np.square(x_data) - 5 + noise
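# the target is y = x^2 - 5 plus Gaussian noise (std 8): a simple nonlinear regression task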

# plot input data
# plt.scatter(x_data, y_data)
# plt.show()

xs = tf.placeholder(tf.float32, [None, 1])  # [num_samples, num_features]
ys = tf.placeholder(tf.float32, [None, 1])

train_op, cost, layers_inputs = built_net(xs, ys, norm=False)                 # without BN
train_op_norm, cost_norm, layers_inputs_norm = built_net(xs, ys, norm=True)  # with BN

sess = tf.Session()
sess.run(tf.global_variables_initializer())

# record cost
cost_his = []
cost_his_norm = []
record_step = 5

plt.ion()
plt.figure(figsize=(7, 3))
for i in range(251):
    if i % 50 == 0:
        # plot histogram
        all_inputs, all_inputs_norm = sess.run([layers_inputs, layers_inputs_norm], feed_dict={xs: x_data, ys: y_data})
        plot_his(all_inputs, all_inputs_norm)

    sess.run(train_op, feed_dict={xs: x_data, ys: y_data})
    sess.run(train_op_norm, feed_dict={xs: x_data, ys: y_data})
    if i % record_step == 0:
        # record cost
        cost_his.append(sess.run(cost, feed_dict={xs: x_data, ys: y_data}))
        cost_his_norm.append(sess.run(cost_norm, feed_dict={xs: x_data, ys: y_data}))

plt.ioff()
plt.figure()
plt.plot(np.arange(len(cost_his))*record_step, np.array(cost_his), label='no BN')       # no norm
plt.plot(np.arange(len(cost_his))*record_step, np.array(cost_his_norm), label='BN')     # norm
plt.legend()
plt.show()
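# with this deliberately bad weight initialization, the cost of the un-normalized
# network typically plateaus while the batch-normalized network keeps improving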