Commit 627b5b8
Sai Kiran Burle committed Dec 10, 2017
1 parent 6a77fb3
Showing 4 changed files with 305 additions and 0 deletions.
@@ -0,0 +1,2 @@
.idea/
.DS_Store
@@ -0,0 +1,105 @@
from keras.layers import Conv2D, Activation, MaxPooling2D, Flatten, Dense, Dropout
from keras.models import Sequential
from keras.preprocessing.image import ImageDataGenerator, load_img, img_to_array

TRAIN_PATH = '/Users/sai/dev/catsdogs/data2/train/'

# Constants
NUM_CHANNELS = 3
IMG_X = 150
IMG_Y = 150

BATCH_SIZE = 16
TOTAL_NUM_IMAGES = 25000

def get_train_data_augmenter():
    # Real-time image augmentation
    augmenter = ImageDataGenerator(
        # rotation_range=40,
        # width_shift_range=0.2,
        # height_shift_range=0.2,
        shear_range=0.2,
        zoom_range=0.2,
        horizontal_flip=True,
        fill_mode='nearest',
        rescale=1./255,
    )
    return augmenter


def run_sample_image_augmentation(augmenter):
    img = load_img(TRAIN_PATH + 'cat/cat.0.jpg')
    x = img_to_array(img)  # shape = (374, 500, 3) with the default channels_last ordering
    x = x.reshape((1,) + x.shape)  # add a batch dimension
    i = 0
    # Note: the save_to_dir directory must already exist
    for _ in augmenter.flow(x, batch_size=1, save_to_dir='preview_augmentation',
                            save_prefix='cat', save_format='jpeg'):
        i += 1
        if i > 20:
            break

def get_train_data_generator(augmenter):
    train_generator = augmenter.flow_from_directory(
        TRAIN_PATH,
        target_size=(IMG_X, IMG_Y),
        batch_size=BATCH_SIZE,
        class_mode='binary'
    )
    return train_generator

def get_model():
    model = Sequential()
    # Conv 1
    model.add(
        Conv2D(filters=32, kernel_size=(3, 3), input_shape=(IMG_X, IMG_Y, NUM_CHANNELS))
    )
    model.add(Activation('relu'))
    model.add(MaxPooling2D(pool_size=(2, 2)))

    # Conv 2
    model.add(
        Conv2D(filters=32, kernel_size=(3, 3))
    )
    model.add(Activation('relu'))
    model.add(MaxPooling2D(pool_size=(2, 2)))

    # Conv 3
    model.add(
        Conv2D(filters=64, kernel_size=(3, 3))
    )
    model.add(Activation('relu'))
    model.add(MaxPooling2D(pool_size=(2, 2)))

    # Fully connected
    model.add(Flatten())
    model.add(Dense(64))
    model.add(Activation('relu'))
    model.add(Dropout(0.5))

    # Single sigmoid unit for the binary cat/dog output
    model.add(Dense(1))
    model.add(Activation('sigmoid'))

    model.compile(optimizer='rmsprop', loss='binary_crossentropy', metrics=['accuracy'])

    return model

def train_model(model, data_gen):
    model.fit_generator(
        data_gen,
        steps_per_epoch=TOTAL_NUM_IMAGES // BATCH_SIZE,
        epochs=50
    )

if __name__ == "__main__":
    augmenter = get_train_data_augmenter()
    # run_sample_image_augmentation(augmenter)
    model = get_model()
    train_data_gen = get_train_data_generator(augmenter)
    train_model(model, train_data_gen)
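
The script trains the network but never persists it. As a follow-up, a minimal sketch of saving the model and classifying one image with the same preprocessing (not part of this commit; the output filename and the reuse of cat.0.jpg are illustrative):

from keras.models import load_model

model.save('catsdogs_cnn.h5')  # after train_model(...); stores weights and architecture

clf = load_model('catsdogs_cnn.h5')
img = load_img(TRAIN_PATH + 'cat/cat.0.jpg', target_size=(IMG_X, IMG_Y))
x = img_to_array(img) / 255.   # apply the same rescale=1./255 used during training
x = x.reshape((1,) + x.shape)  # add the batch dimension
prob = clf.predict(x)[0][0]    # sigmoid output: probability of the positive class
# flow_from_directory assigns class indices alphabetically, so cat=0, dog=1
print('dog' if prob > 0.5 else 'cat')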
@@ -0,0 +1,165 @@
import glob

import tensorflow as tf

DATASET_BATCH_SIZE = 50
IMAGE_X = 200
IMAGE_Y = 200
IMAGE_N_CHANNELS = 3
FLATTEN_IMAGE = False
NUM_CATEGORIES = 2

# A glob pattern (not a regex) matching the training images
PATH_REGEX = '/Users/sai/dev/catsdogs/data/train/*.jpg'

def _parse_images(filename, filename_2):
    """
    Read an image and derive its label from the filename.
    The dataset is built from (filenames, filenames), so filename_2 is the
    same string as filename; one copy is consumed by the image read and the
    other by the label parsing below.
    """
    img_str = tf.read_file(filename)
    img_decoded = tf.image.decode_jpeg(img_str)
    img_resized = tf.image.resize_images(img_decoded, [IMAGE_X, IMAGE_Y])
    # if FLATTEN_IMAGE:
    #     # This tensor will have one row of (IMAGE_X * IMAGE_Y * IMAGE_N_CHANNELS) columns
    #     img_resized = tf.reshape(img_resized, [-1])

    # Filenames look like /Users/sai/dev/catsdogs/data/train/cat.0.jpg; the
    # index 6 below picks out the 'cat'/'dog' component and is tied to the
    # directory depth of PATH_REGEX.
    filename_split = tf.string_split([filename_2], '.').values
    animal_str = tf.slice(filename_split, [0], [1])
    animal_str = tf.string_split(animal_str, '/').values
    animal_str = tf.slice(animal_str, [6], [1])
    is_cat = tf.equal(animal_str, tf.constant('cat'))
    is_dog = tf.equal(animal_str, tf.constant('dog'))
    is_cat = tf.cast(is_cat, tf.int64)
    is_dog = tf.cast(is_dog, tf.int64)
    # One-hot label: [is_cat, is_dog]
    label = tf.concat([is_cat, is_dog], 0)
    return img_resized, label

def get_iterator(filenames):
    dataset = tf.data.Dataset.from_tensor_slices((filenames, filenames))
    dataset = dataset.map(_parse_images)
    # Randomly shuffle the dataset with a buffer of 1000 elements
    dataset = dataset.shuffle(1000)
    # Repeat the dataset indefinitely
    dataset = dataset.repeat()
    dataset = dataset.batch(DATASET_BATCH_SIZE)
    iterator = dataset.make_initializable_iterator()
    return iterator


def get_file_paths():
    training_filenames = glob.glob(PATH_REGEX)
    return training_filenames

def initialize_weights(shape):
    w = tf.truncated_normal(shape, stddev=0.1)
    w = tf.Variable(w)
    return w


def initialize_biases(shape):
    b = tf.constant(0.1, shape=shape)
    b = tf.Variable(b)
    return b


def conv2d(x, W):
    """
    Convolution with stride 1 in each direction and 'SAME' (zero) padding,
    so the output has the same spatial size as the input.
    """
    return tf.nn.conv2d(x, W, strides=[1, 1, 1, 1], padding='SAME')


def max_pool_2x2(x):
    """
    Max pooling over non-overlapping 2x2 windows
    """
    return tf.nn.max_pool(x, ksize=[1, 2, 2, 1],
                          strides=[1, 2, 2, 1], padding='SAME')

def convolution_model(x, y_, keep_prob):
    # y_ is unused here but kept to match the call in train()

    # Conv layer 1
    W_conv1 = initialize_weights(shape=[5, 5, 3, 32])  # [patch_size, patch_size, num_channels, output_depth]
    b_conv1 = initialize_biases(shape=[32])  # one bias per output channel
    z_conv1 = tf.nn.relu(conv2d(x, W_conv1) + b_conv1)
    z_conv1 = max_pool_2x2(z_conv1)  # 200x200 -> 100x100

    # Conv layer 2
    W_conv2 = initialize_weights(shape=[3, 3, 32, 32])
    b_conv2 = initialize_biases(shape=[32])
    z_conv2 = tf.nn.relu(conv2d(z_conv1, W_conv2) + b_conv2)
    z_conv2 = max_pool_2x2(z_conv2)  # 100x100 -> 50x50

    # Fully connected layer on the flattened 50x50x32 feature map
    W_fc1 = initialize_weights(shape=[50 * 50 * 32, 512])
    b_fc1 = initialize_biases(shape=[512])
    z_conv2_flat = tf.reshape(z_conv2, [-1, 50 * 50 * 32])
    z_fc1 = tf.nn.relu(tf.matmul(z_conv2_flat, W_fc1) + b_fc1)

    z_dropout1 = tf.nn.dropout(z_fc1, keep_prob)

    W_out1 = initialize_weights(shape=[512, 64])
    b_out1 = initialize_biases(shape=[64])
    # ReLU here so this layer and the logits layer below don't collapse
    # into a single linear map (the commit had no nonlinearity between them)
    z_out1 = tf.nn.relu(tf.matmul(z_dropout1, W_out1) + b_out1)

    # Two-unit logits; the softmax is applied inside the loss
    W_out2 = initialize_weights(shape=[64, 2])
    b_out2 = initialize_biases(shape=[2])
    z_out2 = tf.matmul(z_out1, W_out2) + b_out2

    y = z_out2
    return y

def feed_forward_model(x, y_):
    # Linear baseline, unused by train(); expects flattened image input
    # (see the commented-out placeholder in train())
    w1 = tf.Variable(tf.zeros([IMAGE_X * IMAGE_Y * IMAGE_N_CHANNELS, 20]))
    b1 = tf.Variable(tf.zeros(20))
    z1 = tf.matmul(x, w1) + b1

    w2 = tf.Variable(tf.zeros([20, 2]))
    b2 = tf.Variable(tf.zeros(2))
    z2 = tf.matmul(z1, w2) + b2

    y = z2
    return y

def train():
    training_filenames = get_file_paths()
    filenames = tf.placeholder(tf.string, shape=[None])
    iterator = get_iterator(filenames)
    # Build the get_next op once; creating it inside the training loop would
    # add a new node to the graph on every iteration and steadily slow it down
    next_batch = iterator.get_next()

    # x = tf.placeholder(tf.float32, [None, IMAGE_X * IMAGE_Y * IMAGE_N_CHANNELS])
    x = tf.placeholder(tf.float32, [None, IMAGE_X, IMAGE_Y, IMAGE_N_CHANNELS])
    y_ = tf.placeholder(tf.float32, [None, NUM_CATEGORIES])
    keep_prob = tf.placeholder(tf.float32)

    y = convolution_model(x, y_, keep_prob)

    cross_entropy = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(labels=y_, logits=y))
    train_step = tf.train.AdamOptimizer(1e-4).minimize(cross_entropy)

    correct_prediction = tf.equal(tf.argmax(y, 1), tf.argmax(y_, 1))
    accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

    with tf.Session() as sess:
        sess.run(iterator.initializer, feed_dict={filenames: training_filenames})
        sess.run(tf.global_variables_initializer())
        for i in range(5000):
            # Convert the tensors to numpy arrays, which is what feed_dict accepts
            batch = sess.run(next_batch)
            if i % 50 == 0:
                train_accuracy = accuracy.eval(feed_dict={x: batch[0], y_: batch[1], keep_prob: 1.0})
                print("Batches Completed: {} Accuracy: {}".format(i, train_accuracy))
            train_step.run(feed_dict={x: batch[0], y_: batch[1], keep_prob: 0.5})


if __name__ == "__main__":
    train()
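
Round-tripping every batch through sess.run and feed_dict copies the data out of the graph and back in. With the same tf.data pipeline, the iterator's output tensors can instead be wired straight into the model. A sketch of that alternative (not what this commit does; it reuses the names defined above):

images, labels = iterator.get_next()
images.set_shape([None, IMAGE_X, IMAGE_Y, IMAGE_N_CHANNELS])  # pin the shape for the conv layers
labels = tf.cast(labels, tf.float32)  # match the dtype expected by the loss
keep_prob = tf.placeholder(tf.float32)

y = convolution_model(images, labels, keep_prob)
cross_entropy = tf.reduce_mean(
    tf.nn.softmax_cross_entropy_with_logits(labels=labels, logits=y))
train_step = tf.train.AdamOptimizer(1e-4).minimize(cross_entropy)

with tf.Session() as sess:
    sess.run(iterator.initializer, feed_dict={filenames: training_filenames})
    sess.run(tf.global_variables_initializer())
    for i in range(5000):
        # Each run advances the iterator and trains on the next batch in-graph
        sess.run(train_step, feed_dict={keep_prob: 0.5})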
@@ -0,0 +1,33 @@
from keras.applications.inception_v3 import InceptionV3, preprocess_input
from keras.layers import Dense, GlobalAveragePooling2D
from keras.models import Model
from keras.preprocessing.image import ImageDataGenerator

NUM_CLASSES = 2


def batch_generator():
    # The commit left this as a stub (`pass`); the implementation below is an
    # assumption, reusing the training directory from the other scripts here
    datagen = ImageDataGenerator(preprocessing_function=preprocess_input)
    return datagen.flow_from_directory(
        '/Users/sai/dev/catsdogs/data2/train/',
        target_size=(299, 299),   # InceptionV3's default input size
        batch_size=16,
        class_mode='categorical'  # one-hot labels for categorical_crossentropy
    )

# Base pre-trained model
base_model = InceptionV3(include_top=False, weights='imagenet')

# Global average pooling over the base model's feature maps
x = base_model.output
x = GlobalAveragePooling2D()(x)

# Fully connected layer
x = Dense(units=1024, activation='relu')(x)
# Softmax classification layer
predictions = Dense(NUM_CLASSES, activation='softmax')(x)

model = Model(inputs=base_model.input, outputs=predictions)

# Train only the top layers: freeze the pre-trained base before compiling,
# since compile() fixes which weights are trainable
for layer in base_model.layers:
    layer.trainable = False

# Compile the model
model.compile(optimizer='rmsprop', loss='categorical_crossentropy')

# Train the model (the commit called fit_generator() with no arguments; the
# step count mirrors the other Keras script and the epoch count is arbitrary)
model.fit_generator(batch_generator(), steps_per_epoch=25000 // 16, epochs=5)
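
Once the new top has converged, the usual second phase is to unfreeze the upper Inception blocks and continue training with a small learning rate. A sketch following the Keras applications documentation (the 249-layer boundary marks the top two inception blocks there; this step is not part of the commit):

from keras.optimizers import SGD

for layer in model.layers[:249]:
    layer.trainable = False
for layer in model.layers[249:]:
    layer.trainable = True

# Recompile so the new trainable flags take effect, with a low-LR optimizer
model.compile(optimizer=SGD(lr=0.0001, momentum=0.9), loss='categorical_crossentropy')
model.fit_generator(batch_generator(), steps_per_epoch=25000 // 16, epochs=5)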