Skip to content

Commit 9f4b057

Browse files
Morvan Zhou
authored and committed
update
1 parent e54b520 commit 9f4b057

File tree

4 files changed

+161
-2
lines changed

4 files changed

+161
-2
lines changed

tutorial-contents/401_CNN.py

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -10,6 +10,7 @@
1010
import tensorflow as tf
1111
from tensorflow.examples.tutorials.mnist import input_data
1212
import numpy as np
13+
import matplotlib.pyplot as plt
1314

1415
tf.set_random_seed(1)
1516
np.random.seed(1)
@@ -21,6 +22,13 @@
2122
test_x = mnist.test.images[:2000]
2223
test_y = mnist.test.labels[:2000]
2324

# plot one example from the training set to sanity-check the data pipeline
# (mnist, np, plt are created earlier in this file)
print(mnist.train.images.shape)     # (55000, 28 * 28) -- images stored as flat 784-vectors
print(mnist.train.labels.shape)     # (55000, 10) -- one-hot labels
plt.imshow(mnist.train.images[0].reshape((28, 28)), cmap='gray')
plt.title('%i' % np.argmax(mnist.train.labels[0]))  # decode one-hot label to the digit
plt.show()
2432
tf_x = tf.placeholder(tf.float32, [None, 28*28])/255. # normalize to range (0, 1)
2533
image = tf.reshape(tf_x, [-1, 28, 28, 1]) # (batch, height, width, channel)
2634
tf_y = tf.placeholder(tf.int32, [None, 10]) # input y
Lines changed: 73 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,73 @@
1+
"""
2+
Know more, visit my Python tutorial page: https://morvanzhou.github.io/tutorials/
3+
My Youtube Channel: https://www.youtube.com/user/MorvanZhou
4+
5+
Dependencies:
6+
tensorflow: 1.1.0
7+
matplotlib
8+
numpy
9+
"""
10+
import tensorflow as tf
11+
from tensorflow.examples.tutorials.mnist import input_data
12+
import numpy as np
13+
import matplotlib.pyplot as plt
14+
15+
tf.set_random_seed(1)
16+
np.random.seed(1)
17+
18+
# Hyper Parameters
19+
BATCH_SIZE = 64
20+
TIME_STEP = 28 # rnn time step / image height
21+
INPUT_SIZE = 28 # rnn input size / image width
22+
LR = 0.01 # learning rate
23+
24+
# data
25+
mnist = input_data.read_data_sets('./mnist', one_hot=True)
26+
test_x = mnist.test.images[:2000]
27+
test_y = mnist.test.labels[:2000]
28+
29+
# plot one example
30+
print(mnist.train.images.shape) # (55000, 28 * 28)
31+
print(mnist.train.labels.shape) # (55000, 10)
32+
plt.imshow(mnist.train.images[0].reshape((28, 28)), cmap='gray')
33+
plt.title('%i' % np.argmax(mnist.train.labels[0]))
34+
plt.show()
35+
36+
# tensorflow placeholders
37+
tf_x = tf.placeholder(tf.float32, [None, TIME_STEP * INPUT_SIZE])/255. # shape(batch, 784), normalize to range (0, 1)
38+
image = tf.reshape(tf_x, [-1, TIME_STEP, INPUT_SIZE]) # (batch, height, width, channel)
39+
tf_y = tf.placeholder(tf.int32, [None, 10]) # input y
40+
41+
# RNN
42+
rnn_cell = tf.contrib.rnn.BasicLSTMCell(num_units=64)
43+
outputs, (h_c, h_n) = tf.nn.dynamic_rnn(
44+
rnn_cell, # cell you have chosen
45+
image, # input
46+
initial_state=None, # the initial hidden state
47+
dtype=tf.float32, # must given if set initial_state = None
48+
time_major=False, # False: (batch, time step, input); True: (time step, batch, input)
49+
)
50+
output = tf.layers.dense(outputs[:, -1, :], 10) # output based on the last output step
51+
52+
loss = tf.losses.softmax_cross_entropy(onehot_labels=tf_y, logits=output) # compute cost
53+
train_op = tf.train.AdamOptimizer(LR).minimize(loss)
54+
55+
accuracy = tf.metrics.accuracy( # return (acc, update_op), and create 2 local variables
56+
labels=tf.argmax(tf_y, axis=1), predictions=tf.argmax(output, axis=1),)[1]
57+
58+
sess = tf.Session()
59+
init_op = tf.group(tf.global_variables_initializer(), tf.local_variables_initializer()) # the local var is for accuracy_op
60+
sess.run(init_op) # initialize var in graph
61+
62+
for step in range(1200): # training
63+
b_x, b_y = mnist.train.next_batch(BATCH_SIZE)
64+
_, loss_ = sess.run([train_op, loss], {tf_x: b_x, tf_y: b_y})
65+
if step % 50 == 0: # testing
66+
accuracy_ = sess.run(accuracy, {tf_x: test_x, tf_y: test_y})
67+
print('train loss: %.4f' % loss_, '| test accuracy: %.2f' % accuracy_)
68+
69+
# print 10 predictions from test data
70+
test_output = sess.run(output, {tf_x: test_x[:10]})
71+
pred_y = np.argmax(test_output, 1)
72+
print(pred_y, 'prediction number')
73+
print(np.argmax(test_y[:10], 1), 'real number')
Lines changed: 78 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,78 @@
1+
"""
2+
Know more, visit my Python tutorial page: https://morvanzhou.github.io/tutorials/
3+
My Youtube Channel: https://www.youtube.com/user/MorvanZhou
4+
5+
Dependencies:
6+
tensorflow: 1.1.0
7+
matplotlib
8+
numpy
9+
"""
10+
import tensorflow as tf
11+
import numpy as np
12+
import matplotlib.pyplot as plt
13+
14+
15+
# Hyper Parameters
16+
TIME_STEP = 10 # rnn time step
17+
INPUT_SIZE = 1 # rnn input size
18+
CELL_SIZE = 32 # rnn cell size
19+
LR = 0.02 # learning rate
20+
21+
# show data
22+
steps = np.linspace(0, np.pi*2, 100, dtype=np.float32)
23+
x_np = np.sin(steps) # float32 for converting torch FloatTensor
24+
y_np = np.cos(steps)
25+
plt.plot(steps, y_np, 'r-', label='target (cos)')
26+
plt.plot(steps, x_np, 'b-', label='input (sin)')
27+
plt.legend(loc='best')
28+
plt.show()
29+
30+
# tensorflow placeholders
31+
tf_x = tf.placeholder(tf.float32, [None, TIME_STEP, INPUT_SIZE]) # shape(batch, 5, 1)
32+
tf_y = tf.placeholder(tf.float32, [None, TIME_STEP, INPUT_SIZE]) # input y
33+
34+
# RNN
35+
rnn_cell = tf.contrib.rnn.BasicRNNCell(num_units=CELL_SIZE)
36+
init_s = rnn_cell.zero_state(batch_size=1, dtype=tf.float32) # very first hidden state
37+
outputs, final_s = tf.nn.dynamic_rnn(
38+
rnn_cell, # cell you have chosen
39+
tf_x, # input
40+
initial_state=init_s, # the initial hidden state
41+
time_major=False, # False: (batch, time step, input); True: (time step, batch, input)
42+
)
43+
outs2D = tf.reshape(outputs, [-1, CELL_SIZE]) # reshape 3D output to 2D for fully connected layer
44+
net_outs2D = tf.layers.dense(outs2D, INPUT_SIZE)
45+
outs = tf.reshape(net_outs2D, [-1, TIME_STEP, INPUT_SIZE]) # reshape back to 3D
46+
47+
loss = tf.losses.mean_squared_error(labels=tf_y, predictions=outs) # compute cost
48+
train_op = tf.train.AdamOptimizer(LR).minimize(loss)
49+
50+
sess = tf.Session()
51+
init_op = tf.group(tf.global_variables_initializer())
52+
sess.run(init_op) # initialize var in graph
53+
54+
plt.figure(1, figsize=(12, 5))
55+
plt.ion() # continuously plot
56+
plt.show()
57+
58+
for step in range(60):
59+
start, end = step * np.pi, (step+1)*np.pi # time steps
60+
# use sin predicts cos
61+
steps = np.linspace(start, end, TIME_STEP)
62+
x = np.sin(steps)[np.newaxis, :, np.newaxis] # shape (batch, time_step, input_size)
63+
y = np.cos(steps)[np.newaxis, :, np.newaxis]
64+
if 'final_s_' not in globals(): # first state, no any hidden state
65+
feed_dict = {tf_x: x, tf_y: y}
66+
else: # has hidden state, so pass it to rnn
67+
feed_dict = {tf_x: x, tf_y: y, init_s: final_s_}
68+
_, pred_, final_s_ = sess.run([train_op, outs, final_s], feed_dict) # train
69+
70+
# plotting
71+
plt.plot(steps, y.flatten(), 'r-')
72+
plt.plot(steps, pred_.flatten(), 'b-')
73+
plt.ylim((-1.2, 1.2))
74+
plt.draw()
75+
plt.pause(0.05)
76+
77+
plt.ioff()
78+
plt.show()

tutorial-contents/DQN.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -44,9 +44,9 @@
4444
l_target = tf.layers.dense(tf_s_, 10, tf.nn.relu)
4545
q_next = tf.layers.dense(l_target, N_ACTIONS)
4646

47-
q_target = tf.stop_gradient(tf_r + GAMMA * tf.reduce_max(q_next, axis=1)) # shape=(None, ), not need any gradient
47+
q_target = tf.stop_gradient(tf_r + GAMMA * tf.reduce_max(q_next, axis=1)) # shape=(None, ), not need gradient for q_next
4848
a_one_hot = tf.one_hot(tf_a, depth=N_ACTIONS, dtype=tf.float32)
49-
q_wrt_a = tf.reduce_sum(q * a_one_hot, axis=1) # shape=(None, ), q for current state
49+
q_wrt_a = tf.reduce_sum(q * a_one_hot, axis=1) # shape=(None, ), q for current state
5050

5151
loss = tf.reduce_mean(tf.squared_difference(q_target, q_wrt_a))
5252
train_op = tf.train.AdamOptimizer(LR).minimize(loss)

0 commit comments

Comments
 (0)