Added

hunkim · hunkim · commit b0265b549ef0 · 2017-02-24T21:05:37.000+08:00
diff --git a/klab-12-1-softmax_hello_char.py b/klab-12-1-softmax_hello_char.py
@@ -0,0 +1,63 @@
+import numpy as np
+from keras.models import Sequential
+from keras.layers import Dense, TimeDistributed, Activation, LSTM
+from keras.utils import np_utils
+
+import os
+
+# brew install graphviz
+# pip3 install graphviz
+# pip3 install pydot
+from keras.utils.visualize_util import plot
+
+# sample text
+sample = "hihello"
+
+char_set = list(set(sample))  # index -> char, e.g. ['i', 'l', 'e', 'o', 'h'] (set order is arbitrary)
+char_dic = {w: i for i, w in enumerate(char_set)}
+
+x_str = sample[:-1]
+y_str = sample[1:]
+
+data_dim = len(char_set)
+timesteps = len(y_str)
+nb_classes = len(char_set)
+
+print(x_str, y_str)
+
+x = [char_dic[c] for c in x_str]  # char to index
+y = [char_dic[c] for c in y_str]  # char to index
+
+# One-hot encoding
+x = np_utils.to_categorical(x, nb_classes=nb_classes)
+# reshape x to [samples, time steps, features]
+x = np.reshape(x, (-1, len(x), data_dim))
+print(x.shape)
+
+# One-hot encoding
+y = np_utils.to_categorical(y, nb_classes=nb_classes)
+# reshape y to [samples, time steps, classes]
+y = np.reshape(y, (-1, len(y), data_dim))
+print(y.shape)
+
+model = Sequential()
+model.add(Dense(nb_classes, input_shape=(
+    timesteps, data_dim)))
+model.add(Activation('softmax'))
+model.summary()
+# Store model graph in png
+plot(model, to_file=os.path.basename(__file__) + '.png', show_shapes=True)
+
+model.compile(loss='categorical_crossentropy',
+              optimizer='rmsprop', metrics=['accuracy'])
+model.fit(x, y, nb_epoch=100)
+
+predictions = model.predict(x, verbose=0)
+for i, prediction in enumerate(predictions):
+    x_index = np.argmax(x[i], axis=1)
+    x_str = [char_set[j] for j in x_index]
+    print(x_index, ''.join(x_str))
+
+    index = np.argmax(prediction, axis=1)
+    result = [char_set[j] for j in index]
+    print(index, ''.join(result))
diff --git a/klab-12-2-rnn_long_char.py b/klab-12-2-rnn_long_char.py
@@ -11,9 +11,9 @@
 from keras.utils.visualize_util import plot
 
 # sample sentence
-sentence = "If you want to build a ship, don't drum up people together to collect wood and don't assign them tasks and work, but rather teach them to long for the endless immensity of the sea."
+sentence = "if you want to build a ship, don't drum up people together to collect wood and don't assign them tasks and work, but rather teach them to long for the endless immensity of the sea."
 
-char_set = list(set(sentence))  # id -> char ['i', 'l', 'e', 'o', 'h']
+char_set = list(set(sentence))  # id -> char ['i', 'l', 'e', 'o', 'h', ...]
 char_dic = {w: i for i, w in enumerate(char_set)}
 
 data_dim = len(char_set)
diff --git a/klab-12-4-seq2seq.py b/klab-12-4-seq2seq.py
@@ -4,6 +4,7 @@
 from keras.layers import Activation, TimeDistributed, Dense, RepeatVector, LSTM
 from keras.utils import np_utils
 from keras.utils.visualize_util import plot
+from keras.callbacks import TensorBoard
 import os
 
 digit = "0123456789"
@@ -38,6 +39,8 @@
 
 
 print('Build model...')
+TensorBoard(log_dir='./logs', histogram_freq=1, write_graph=True, write_images=False)
+
 model = Sequential()
 # "Encode" the input sequence using an RNN, producing an output of HIDDEN_SIZE
 # note: in a situation where your input sequences have a variable length,
@@ -62,12 +65,15 @@
 # Store model graph in png
 plot(model, to_file=os.path.basename(__file__) + '.png', show_shapes=True)
 
-# Create test dataset for fun
+# Create test data set for fun
 testX = []
+testY = []
 for i in range(10):
     rand_pick = np.random.choice(10, 7)
     x = [char_dic[digit[c]] for c in rand_pick]
+    y = [alpha[c] for c in rand_pick]
     testX.append(x)
+    testY.append(y)
 
 # One-hot encoding
 testX = np_utils.to_categorical(testX, nb_classes=nb_classes)
@@ -84,4 +90,5 @@
     index = np.argmax(prediction, axis=1)
     result = [char_set[j] for j in index]
 
-    print(''.join(x_str), ' -> ', ''.join(result))
+    print(''.join(x_str), ' -> ', ''.join(result),
+          " true: ", ''.join(testY[i]))
diff --git a/lab-04-4-multi_variable_linear_regression_feed.py b/lab-04-4-multi_variable_linear_regression_feed.py
@@ -14,8 +14,7 @@
 hypothesis = tf.matmul(x, W) + b
 
 # Simplified cost function
-with tf.control_dependencies(y.shape.assert_same_rank(hypothesis)):
-    cost = tf.reduce_mean(tf.square(hypothesis - y))
+cost = tf.reduce_mean(tf.square(hypothesis - y))
 
 # Minimize
 optimizer = tf.train.GradientDescentOptimizer(learning_rate=0.01)
diff --git a/rnn_basics.ipynb b/rnn_basics.ipynb
@@ -0,0 +1,232 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "collapsed": true
+   },
+   "source": [
+    "* http://www.wildml.com/2016/08/rnns-in-tensorflow-a-practical-guide-and-undocumented-features/\n",
+    "* http://learningtensorflow.com/index.html"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import tensorflow as tf\n",
+    "import numpy as np\n",
+    "from tensorflow.contrib import rnn\n",
+    "import pprint\n",
+    "pp = pprint.PrettyPrinter(indent=4)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Static RNN"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "tf.reset_default_graph()\n",
+    "sess = tf.InteractiveSession()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "array([[[  0.,   1.,   2.],\n",
+      "        [  3.,   4.,   5.],\n",
+      "        [  6.,   7.,   8.],\n",
+      "        [  9.,  10.,  11.]],\n",
+      "\n",
+      "       [[ 12.,  13.,  14.],\n",
+      "        [ 15.,  16.,  17.],\n",
+      "        [ 18.,  19.,  20.],\n",
+      "        [ 21.,  22.,  23.]]], dtype=float32)\n"
+     ]
+    }
+   ],
+   "source": [
+    "# Create input data\n",
+    "x_data = np.arange(24, dtype=np.float32).reshape(2,4,3)\n",
+    "pp.pprint(x_data)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "5 LSTMStateTuple(c=5, h=5)\n",
+      "5 (LSTMStateTuple(c=5, h=5), LSTMStateTuple(c=5, h=5))\n"
+     ]
+    }
+   ],
+   "source": [
+    "cell = rnn.BasicLSTMCell(num_units=5, state_is_tuple=True)\n",
+    "print(cell.output_size, cell.state_size)\n",
+    "cell = rnn.MultiRNNCell([cell] * 2, state_is_tuple=True)\n",
+    "print(cell.output_size, cell.state_size)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "[   array([[  0.,   1.,   2.],\n",
+      "       [  3.,   4.,   5.],\n",
+      "       [  6.,   7.,   8.],\n",
+      "       [  9.,  10.,  11.]], dtype=float32),\n",
+      "    array([[ 12.,  13.,  14.],\n",
+      "       [ 15.,  16.,  17.],\n",
+      "       [ 18.,  19.,  20.],\n",
+      "       [ 21.,  22.,  23.]], dtype=float32)]\n"
+     ]
+    }
+   ],
+   "source": [
+    "x_data = tf.reshape(x_data, [-1, 3])\n",
+    "x_split = tf.split(value=x_data, num_or_size_splits=2)\n",
+    "pp.pprint(sess.run(x_split))"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [
+    {
+     "ename": "AttributeError",
+     "evalue": "module 'tensorflow.python.ops.nn' has no attribute 'rnn'",
+     "output_type": "error",
+     "traceback": [
+      "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m",
+      "\u001b[0;31mAttributeError\u001b[0m                            Traceback (most recent call last)",
+      "\u001b[0;32m<ipython-input-6-9b5a47592263>\u001b[0m in \u001b[0;36m<module>\u001b[0;34m()\u001b[0m\n\u001b[0;32m----> 1\u001b[0;31m \u001b[0moutputs\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0m_states\u001b[0m \u001b[0;34m=\u001b[0m \u001b[0mtf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mnn\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrnn\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mcell\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mx_split\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mdtype\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0mtf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mfloat32\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m      2\u001b[0m \u001b[0mprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0moutputs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      3\u001b[0m \u001b[0msess\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrun\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mtf\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mglobal_variables_initializer\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m      4\u001b[0m \u001b[0mpp\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mpprint\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0msess\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mrun\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0moutputs\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n",
+      "\u001b[0;31mAttributeError\u001b[0m: module 'tensorflow.python.ops.nn' has no attribute 'rnn'"
+     ]
+    }
+   ],
+   "source": [
+    "outputs,_states = tf.nn.rnn(cell, x_split, dtype=tf.float32)\n",
+    "print(outputs)\n",
+    "sess.run(tf.global_variables_initializer())\n",
+    "pp.pprint(sess.run(outputs))"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Dynamic RNN"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "tf.reset_default_graph()\n",
+    "sess = tf.InteractiveSession()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "tf.reset_default_graph()\n",
+    "\n",
+    "# Create input data\n",
+    "X = np.random.randn(2, 10, 8)\n",
+    "\n",
+    "# The second example is of length 6 \n",
+    "X[1,6:] = 0\n",
+    "X_lengths = [10, 6]\n",
+    "\n",
+    "cell = rnn.LSTMCell(num_units=64, state_is_tuple=True)\n",
+    "\n",
+    "outputs, last_states = tf.nn.dynamic_rnn(\n",
+    "    cell=cell,\n",
+    "    dtype=tf.float64,\n",
+    "    sequence_length=X_lengths,\n",
+    "    inputs=X)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": false
+   },
+   "outputs": [],
+   "source": [
+    "sess.run(tf.global_variables_initializer())\n",
+    "pp.pprint(sess.run(outputs))"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.0"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}