updated notes and implemented data generation for 10-digit recognition

master
Malar Kannan 2017-10-21 09:04:25 +05:30
parent 16c98b53d5
commit 6c62795d02
5 changed files with 104 additions and 3 deletions


@@ -0,0 +1,34 @@
{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {
    "collapsed": true
   },
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 2",
   "language": "python",
   "name": "python2"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 2
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython2",
   "version": "2.7.14"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 0
}


@@ -54,7 +54,7 @@ eg: stock market temporal data / speech data / image data
 Non-Parametric models: k-NN (K-nearest neighbor), Decision Trees, Random Forests (independent of parameters)
 -> very inaccurate because they don't know much about the data
-Parametric Models: based on fixed set of parameters
+Parametric Models: based on a fixed set of parameters, e.g. SVM
 -> more accurate because the model learns its parameters from the data
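A minimal sketch of the contrast the notes draw, using scikit-learn on its built-in digits dataset (the library, dataset, and model choices are my own illustration, not part of the commit):

# Sketch: non-parametric (k-NN) vs parametric (SVM) classifiers on a toy dataset.
from sklearn.datasets import load_digits
from sklearn.model_selection import train_test_split
from sklearn.neighbors import KNeighborsClassifier  # non-parametric: keeps the training data around
from sklearn.svm import SVC                         # parametric-style: learns a fixed set of parameters

X, y = load_digits(return_X_y=True)
X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=0)

knn = KNeighborsClassifier(n_neighbors=5).fit(X_train, y_train)
svm = SVC(kernel='linear').fit(X_train, y_train)

print('k-NN accuracy:', knn.score(X_test, y_test))
print('SVM accuracy:', svm.score(X_test, y_test))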


@@ -12,8 +12,7 @@ language, keyboard layout
 Predict the word
 ## Model
-Structured Output/HMM/ CNN?
+Structured Output/HMM/CNN?
+# mnist hand-written digit database -> build an application for recognizing full phone numbers (10 digits).

SecondSunday/Notes.md (new file, 22 lines)

@@ -0,0 +1,22 @@
# Activation Function (AKA Transfer Function)
In a neural network, the activation function adds non-linearity.
Types:
1. Sigmoid (Logistic) (used mostly for the output layer, since its output looks like a probability)
2. ReLU or Rectified Linear Unit (an important discovery for NNs - the most-used activation for hidden layers) (not suitable for the output layer if the output is supposed to be a probability); leaky ReLU adds a small slope on the negative part
3. tanh (Hyperbolic) (maps to -1 to 1) or ArcTan (inverse tangent - maps to -Pi/2 to Pi/2)
4. Linear (or Identity) (used for output layers; best for regression)
5. Softmax (classification with probabilities - a probability because the outputs add up to 1)
6. Square Root
7. Exponential
8. Sine
9. Ramp
10. Step (Binary)
11. Unit Sum
If the network computes something multiplicative, use log as the activation so that the multiplication becomes addition.
Constrained Optimization: optimize in such a way that the output is constrained to some value.
Steps => number of batch iterations
Epoch => one pass through the entire dataset (e.g. 1,000 samples with a batch size of 100 gives 10 steps per epoch)
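A minimal NumPy sketch of a few of the activations listed above (my own illustration, not part of the commit):

import numpy as np

def sigmoid(x):
    # squashes to (0, 1); common for probability-like outputs
    return 1.0 / (1.0 + np.exp(-x))

def relu(x):
    # zero for negatives, identity for positives; the default for hidden layers
    return np.maximum(0, x)

def leaky_relu(x, slope=0.01):
    # like ReLU, but with a small slope on the negative part
    return np.where(x > 0, x, slope * x)

def softmax(x):
    # exponentiate and normalize so the outputs add up to 1
    e = np.exp(x - x.max())  # subtract the max for numerical stability
    return e / e.sum()

z = np.array([2.0, -1.0, 0.5])
print(softmax(z).sum())  # 1.0 - behaves like a probability distribution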


@@ -0,0 +1,46 @@
%matplotlib inline
from tensorflow.examples.tutorials.mnist import input_data
import numpy as np
import matplotlib.pyplot as plt

mnist = input_data.read_data_sets('./SecondSunday/mnist_data', one_hot=True)

# Group the training images by digit label: number_imgs['3'] holds all images of 3s.
label_number = mnist.train.labels.argmax(axis=1)
number_imgs = {str(i): mnist.train.images[np.argwhere(label_number == i).squeeze()] for i in range(10)}

# Generate DATA_COUNT random phone numbers, each an array of 10 digits (0-9).
DATA_COUNT = 100
phone_number_digits = np.random.randint(10, size=(DATA_COUNT, 10))
phone_number_strings = phone_number_digits.astype(str)

def pick_img(num):
    # Pick a random 28x28 image of the digit `num` from the grouped MNIST images.
    rand_idx = np.random.randint(number_imgs[num].shape[0])
    return number_imgs[num][rand_idx].reshape(28, 28)

def create_phone_img(phon_no):
    # Stack ten digit images side by side into one 28x280 phone-number image.
    return np.hstack([pick_img(d) for d in phon_no])

def create_phone_images(phone_array):
    phone_number_images = [create_phone_img(phon_no) for phon_no in phone_array]
    # Flatten each 28x280 image into a 7840-dimensional vector.
    return np.array(phone_number_images).reshape(-1, 28 * 280)

phone_number_imgs = create_phone_images(phone_number_strings)

from keras.models import Sequential
from keras.layers import Dense, Activation, Reshape

# One softmax per digit position: 10 positions x 10 classes = 100 outputs,
# reshaped to (10, 10) so softmax and the loss apply per digit.
model = Sequential([
    Dense(32, input_shape=(28 * 280,)),
    Activation('relu'),
    Dense(100),
    Reshape((10, 10)),
    Activation('softmax'),
])
model.compile(optimizer='rmsprop',
              loss='categorical_crossentropy',
              metrics=['accuracy'])

# One-hot encode each digit position: shape (DATA_COUNT, 10, 10).
labels_onehot = np.eye(10)[phone_number_digits]
model.fit(phone_number_imgs, labels_onehot, epochs=5, batch_size=32)

# plt.imshow(phone_number_imgs[np.random.randint(phone_number_imgs.shape[0])].reshape(28, 280))
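A quick way to decode predictions back into phone-number strings, assuming the per-digit softmax model above (an illustrative addition, not part of the commit):

# Predict on a few generated images and decode each digit position with argmax.
preds = model.predict(phone_number_imgs[:5])                     # shape (5, 10, 10)
decoded = [''.join(str(d) for d in p.argmax(axis=1)) for p in preds]
print(decoded)                                                   # predicted 10-digit strings
print([''.join(s) for s in phone_number_strings[:5]])            # ground truth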