Training the CNN
This section describes the code behind training our convolutional neural network for recognizing hot dogs vs. carrots vs. bananas. We assume that we've already validated and taken a look at the images we are working with. (Check out the Get Data section.)
Importing libraries and defining paths and constants¶
import os
import argparse
import simplejson
import matplotlib.pyplot as plt
import cv2
from PIL import Image
import numpy as np
import pandas as pd
import glob
import tensorflow as tf
import keras
from keras.models import Sequential
from keras.regularizers import l2
from keras.preprocessing.image import ImageDataGenerator, array_to_img, img_to_array, load_img
from keras.layers import Dense, Activation, Conv2D, Flatten, Dropout, MaxPooling2D
from keras.callbacks import ModelCheckpoint
from keras.applications.inception_v3 import InceptionV3, preprocess_input
keras.backend.clear_session()
Like before, we define the data file path and some important constants, including the batch size and the image size ($299 \times 299$ pixels).
#define paths and constants
cwd = os.getcwd()
data_path = os.path.join(cwd, 'data')
#data_path = "/Users/victorialiu/git/creatica/code/data/"
batch_size = 16
TARGET_SIZE = 299
Command Line Argument Parser¶
We want to be able to run our code from the command line (at least in the .py version of this notebook), so we use an argument parser to translate command-line arguments. We require a model name when running the script, and optionally a regularizer strength (defaulting to $0$). As we'll see later, having a model name makes it much easier to compare models.
## Parse command line arguments
def parse_args():
    parser = argparse.ArgumentParser()
    parser.add_argument('-m', '--model-name',
                        help='prefix for file to save trained model to ' +
                             '(e.g. dense_arch1, conv_regularize05, etc.)',
                        required=True)
    parser.add_argument('-r', '--regularizer-strength',
                        help='strength of l2 regularization to use',
                        type=float, default=0.00)
    return parser.parse_args()
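For example, running the command-line version of this notebook might look like the following sketch (the filename train.py and the argument values are just illustrative, not part of the repo):
# From the shell (hypothetical filename):
#   python train.py --model-name conv_reg001 --regularizer-strength 0.001
# Inside the script, parse_args() then gives us:
args = parse_args()
print(args.model_name)            # 'conv_reg001'
print(args.regularizer_strength)  # 0.001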
Image Pre-processing with InceptionV3 net¶
Next, we do data augmentation in order to "create" more data to train from. Data augmentation shifts the image in small ways so that the same image can be trained on from multiple perspectives (i.e. a rotated image of a hot dog is still a hot dog, and now we have more training data). We also normalize each image by dividing by the maximum pixel value of $255$. Finally, we write helper functions that we can easily call depending on whether we are working with training or testing data.
def image_data_augment(rescale=1/255, shear_range=False, zoom_range=False, horizontal_flip=False):
    #declare ImageDataGenerator class for augmenting images using shear, zoom, and flips
    #normalize with 1./255
    return (ImageDataGenerator(
        rescale=rescale,
        shear_range=shear_range,
        zoom_range=zoom_range,
        horizontal_flip=horizontal_flip))
def dataframe_categories(train_or_test):
    #define new data_path to make life easier
    data_subpath = os.path.join(data_path, train_or_test)
    #initiate lists for dataframe
    images_names = []
    categories = []
    for category in os.listdir(data_subpath):
        #no .DS_Store omg I hate .DS_Store
        if category != '.DS_Store':
            for image in os.listdir(
                os.path.join(data_subpath, category)
            ):
                #only use jpg
                if image[-4:] == '.jpg':
                    images_names.append(f'{category}/{image}')
                    categories.append(category)
    images_names = np.array(images_names)
    categories = np.array(categories)
    df = pd.DataFrame({
        'filename' : images_names,
        'class' : categories
    })
    return df
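As a quick sanity check, we can peek at the resulting dataframe (a sketch; the exact filenames and counts depend on your data folder):
train_df = dataframe_categories('train')
print(train_df.head())                   # 'filename' (e.g. 'hotdog/xyz.jpg') and 'class' columns
print(train_df['class'].value_counts())  # number of images per category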
def get_images(train_or_test):
    #augment images
    if train_or_test == 'train':
        datagen = image_data_augment(shear_range = 0.2, zoom_range = 0.2, horizontal_flip = True)
    else:
        datagen = image_data_augment()
    df = dataframe_categories(train_or_test)
    generator = datagen.flow_from_dataframe(
        df,
        directory = os.path.join(data_path, train_or_test),
        target_size=(TARGET_SIZE, TARGET_SIZE),
        batch_size=batch_size,
        class_mode='categorical',
        shuffle=False,
        validate_filenames=False
    )
    return generator
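To confirm that the generators produce what we expect, we can pull one batch from the training generator (a sketch, assuming the default batch size of $16$ defined above):
train_generator = get_images('train')
x_batch, y_batch = next(train_generator)
print(x_batch.shape)  # (16, 299, 299, 3): batch_size x height x width x RGB channels
print(y_batch.shape)  # (16, 3): one-hot labels for the three categories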
In the interest of saving training time (which could otherwise take all night and use up precious time) and making the model as accurate as possible, we use transfer learning, where we piggy-back on a pre-trained CNN that extracts the important features of our data through the bottleneck of the network. We use InceptionV3, so the image pre-processing pipeline always includes feeding the images through InceptionV3 first. This makes prediction a little slower, but the accuracy and the significantly decreased training time (on the order of minutes) are well worth it. Lastly, we write the function get_data(), which calls all the previous image pre-processing helper functions to streamline the process. Notably, we use one-hot vectors for our data labels.
def preprocess_inception():
    """
    inception for transfer learning
    """
    #transfer learning with InceptionV3, a pre-trained cnn
    model = InceptionV3(
        weights='imagenet',
        include_top=False,
        input_shape=(TARGET_SIZE, TARGET_SIZE, 3),
        classes = 3
    )
    for train_or_test in [
        'train',
        'test'
    ]:
        generator = get_images(train_or_test)
        #run every batch through InceptionV3 to extract bottleneck features
        bottleneck_features = model.predict(generator, verbose=1)
        #save the bottleneck features for later use
        np.savez(f'inception_features_{train_or_test}', features=bottleneck_features)
    return True
def get_data():
    #augment images and use inception net
    preprocess_inception()
    #load training data and define labels 0, 1, 2 for the three categories
    train_data = np.load('inception_features_train.npz')['features']
    #requires the number of samples in each category to be exactly the same
    train_data_type_count = int(len(train_data) / 3)
    train_labels = np.array(
        [0] * train_data_type_count +
        [1] * train_data_type_count +
        [2] * train_data_type_count
    )
    #load testing data and define labels 0, 1, 2 for the three categories
    test_data = np.load('inception_features_test.npz')['features']
    #requires the number of samples in each category to be exactly the same
    test_data_type_count = int(len(test_data) / 3)
    test_labels = np.array(
        [0] * test_data_type_count +
        [1] * test_data_type_count +
        [2] * test_data_type_count
    )
    # Convert labels to one-hot vectors (probability distributions w/
    # probability 1 assigned to the correct label)
    train_labels = keras.utils.to_categorical(train_labels)
    test_labels = keras.utils.to_categorical(test_labels)
    return (train_data, train_labels, test_data, test_labels)
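A quick sketch of what get_data() hands back (the exact counts come from our dataset; the $8 \times 8 \times 2048$ feature shape is InceptionV3's bottleneck output for $299 \times 299$ inputs):
(train_data, train_labels, test_data, test_labels) = get_data()
print(train_data.shape)    # e.g. (2508, 8, 8, 2048) bottleneck features
print(train_labels.shape)  # e.g. (2508, 3) one-hot labels
print(train_labels[0])     # e.g. [1. 0. 0.] for an image in the first category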
Convolutional Neural Network¶
Now, we get to the heart of our machine learning model! After being passed through InceptionV3, the feature-extracted version of each image is passed through our own convolutional network. This CNN was largely taken from J-Yash's open-source code, but we added a regularizer (reg_param), which notably can be set from the command line. There are five main convolutional blocks, followed by three fully connected layers. All of our filters are $3 \times 3$ matrices. In the first convolutional block, we train $16$ filters; in the second block, we train $32$ filters, max-pool, and regularize via dropout. In the third block, we train $64$ filters and apply dropout. In the fourth block, we train $128$ filters and apply dropout. In the fifth block, we train two layers of $256$ filters each, before max-pooling and applying dropout. We then flatten the data and feed it into the fully connected layers, which ultimately output three values, each one representing a different food category. We use a softmax activation for the final output, and ReLU for all other layers.
def build_conv_net(reg_param, train_data_shape):
    #train_data_shape = train_data.shape[1:] = (8, 8, 2048)
    model = Sequential()
    #convolutional layer with 16 3x3 trainable filters, using rectified linear units.
    #Padding to result in the same shape as the original picture.
    #use l2 regularization with strength reg_param (set from the command line)
    model.add(Conv2D(
        16, (3, 3),
        activation='relu',
        input_shape=train_data_shape,
        padding='same',
        kernel_regularizer=l2(reg_param)
    ))
    # # max pooling for noise reduction
    # model.add(MaxPooling2D(pool_size=(2, 2)))
    # second block
    model.add(Conv2D(
        32, (3, 3),
        activation='relu',
        padding='same',
        kernel_regularizer=l2(reg_param)
    ))
    # max pooling for noise reduction
    model.add(MaxPooling2D(pool_size=(2, 2)))
    # dropout for more regularization
    model.add(Dropout(0.25))
    # third block
    model.add(Conv2D(
        64, (3, 3),
        activation='relu',
        padding='same',
        kernel_regularizer=l2(reg_param)
    ))
    # model.add(Conv2D(
    #     64, (3, 3),
    #     activation='relu',
    #     padding='same',
    #     kernel_regularizer=l2(reg_param)
    # ))
    # # max pooling for noise reduction
    # model.add(MaxPooling2D(pool_size=(2, 2)))
    # dropout for more regularization
    model.add(Dropout(0.25))
    # fourth block
    model.add(Conv2D(
        128, (3, 3),
        activation='relu',
        padding='same',
        kernel_regularizer=l2(reg_param)
    ))
    # model.add(Conv2D(
    #     128, (3, 3),
    #     activation='relu',
    #     padding='same',
    #     kernel_regularizer=l2(reg_param)
    # ))
    # # max pooling for noise reduction
    # model.add(MaxPooling2D(pool_size=(2, 2)))
    # dropout for more regularization
    model.add(Dropout(0.25))
    #fifth block
    model.add(Conv2D(
        256, (3, 3),
        activation='relu',
        padding='same',
        kernel_regularizer=l2(reg_param)
    ))
    model.add(Conv2D(
        256, (3, 3),
        activation='relu',
        padding='same',
        kernel_regularizer=l2(reg_param)
    ))
    # model.add(Conv2D(
    #     256, (3, 3),
    #     activation='relu',
    #     padding='same',
    #     kernel_regularizer=l2(reg_param)
    # ))
    # max pooling for noise reduction
    model.add(MaxPooling2D(pool_size=(2, 2)))
    # dropout for more regularization
    model.add(Dropout(0.25))
    # fully connected layers
    model.add(Flatten())
    model.add(Dense(512, activation='relu'))
    model.add(Dropout(0.6))
    model.add(Dense(256, activation='relu'))
    model.add(Dropout(0.5))
    #3 categories, softmax output
    model.add(Dense(3, activation='softmax'))
    return model
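For reference, the network can be instantiated directly against InceptionV3's bottleneck shape (a sketch using an arbitrary regularizer strength):
model = build_conv_net(reg_param=0.001, train_data_shape=(8, 8, 2048))
model.summary()  # prints the layer stack and parameter counts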
Ready to go¶
The main() function is mainly for the command line, but it can also be run from Jupyter if the right lines are commented out. Notably, we use the Adam optimizer, we calculate loss based on categorical cross-entropy, and we record the MSE so we can plot it. We also have a checkpointer, which saves the model weights as we train over multiple epochs; when comparing models, the best one is the one with the lowest validation MSE, not the lowest training error. We use an 80/20 training vs. validation split, which is generally a good rule of thumb, and we choose $8$ epochs since the accuracy generally peaks within the first $5$ epochs. The trained model is saved as a .h5 and .json file under creatica/code/model, so that we can load it in another module. Finally, we output a graph of the loss and MSE metrics, compared between the training and validation sets. The image is saved to the creatica/code/img folder, but it also pops up when the script is run from the command line.
def main():
    # comment this out when running from command line!
    model_name = 'demo'
    regularizer_strength = .00001
    # # comment out when not running from cmdline
    # ## get cmdline args
    # args = parse_args()
    # model_name = args.model_name
    # # get regularization strength, if defined. Otherwise, it is 0
    # regularizer_strength = args.regularizer_strength
    # Remove src from cwd if necessary
    cwd = os.getcwd()
    if os.path.basename(cwd) == 'src': cwd = os.path.dirname(cwd)
    # Create img directory to save images if needed
    os.makedirs(os.path.join(cwd, 'img'), exist_ok=True)
    plot_fname = os.path.join(cwd, 'img', '%s_learn.png' % model_name)
    # Create model directory to save models if needed
    os.makedirs(os.path.join(cwd, 'model'), exist_ok=True)
    model_weights_fname = os.path.join(cwd, 'model', model_name + '.h5')
    model_json_fname = os.path.join(cwd, 'model', model_name + '.json')
    # Import the food image dataset (may take a few seconds)
    (train_data, train_labels, test_data, test_labels) = get_data()
    train_data_shape = train_data.shape[1:]
    # build model
    model = build_conv_net(regularizer_strength, train_data_shape)
    # Print a summary of the layers and weights in the model
    model.summary()
    # Have our model minimize the categorical cross-entropy loss with the adam
    # optimizer (fancier stochastic gradient descent that converges faster),
    # and track MSE as the metric to plot
    model.compile(
        loss='categorical_crossentropy',
        optimizer='adam',
        metrics=['MSE'])
    # set checkpointer to use in callback, saving the model weights each epoch
    # (note: user-specific path; point this at a scratch directory of your own)
    checkpointer = ModelCheckpoint(
        filepath='/Users/victorialiu/git/creatica/tmp',
        verbose=1,
        save_weights_only=True,
    )
    #time to fit
    history = model.fit(train_data, train_labels,
                        epochs=8,
                        batch_size=batch_size,
                        validation_split=0.2,
                        validation_data=(train_data, train_labels),
                        verbose=2,
                        callbacks=[checkpointer],
                        shuffle=True)
    #load the checkpointed weights
    model.load_weights('/Users/victorialiu/git/creatica/tmp')
    # Save model weights and json spec describing the model's architecture
    model.save(model_weights_fname)
    model_json = model.to_json()
    with open(model_json_fname, 'w') as f:
        f.write(simplejson.dumps(simplejson.loads(model_json), indent=4))
    # # Plot accuracy learning curve (use when metrics include 'accuracy')
    # ax1 = plt.subplot(2, 1, 1)
    # plt.plot(history.history['accuracy'])
    # plt.plot(history.history['val_accuracy'])
    # plt.title('%s accuracy' % model_name)
    # plt.ylabel('Accuracy')
    # plt.xlabel('Epoch')
    # plt.legend(['Train', 'Validation'], loc='lower right')
    # plt.savefig(plot_fname)
    # # Plot loss learning curve
    # plt.subplot(2, 1, 2, sharex=ax1)
    # plt.plot(history.history['loss'])
    # plt.plot(history.history['val_loss'])
    # plt.title('%s loss' % model_name)
    # plt.ylabel('Loss')
    # plt.xlabel('Epoch')
    # plt.legend(['Train', 'Validation'], loc='upper right')
    # Plot MSE learning curve
    ax1 = plt.subplot(2, 1, 1)
    plt.plot(history.history['MSE'])
    plt.plot(history.history['val_MSE'])
    plt.title('%s MSE' % model_name)
    plt.ylabel('MSE')
    plt.xlabel('Epoch')
    plt.legend(['Train', 'Validation'], loc='lower right')
    plt.savefig(plot_fname)
    # Plot loss learning curve
    plt.subplot(2, 1, 2, sharex=ax1)
    plt.plot(history.history['loss'])
    plt.plot(history.history['val_loss'])
    plt.title('%s loss' % model_name)
    plt.ylabel('Loss')
    plt.xlabel('Epoch')
    plt.legend(['Train', 'Validation'], loc='upper right')
    plt.tight_layout()
    plt.savefig(plot_fname)
    plt.show()
    return True
main()
Found 2508 non-validated image filenames belonging to 3 classes.
157/157 [==============================] - 100s 640ms/step
Found 150 non-validated image filenames belonging to 3 classes.
10/10 [==============================] - 5s 494ms/step
Model: "sequential"
_________________________________________________________________
Layer (type)                 Output Shape              Param #
=================================================================
conv2d_188 (Conv2D)          (None, 8, 8, 16)          294928
_________________________________________________________________
conv2d_189 (Conv2D)          (None, 8, 8, 32)          4640
_________________________________________________________________
max_pooling2d_8 (MaxPooling2 (None, 4, 4, 32)          0
_________________________________________________________________
dropout (Dropout)            (None, 4, 4, 32)          0
_________________________________________________________________
conv2d_190 (Conv2D)          (None, 4, 4, 64)          18496
_________________________________________________________________
dropout_1 (Dropout)          (None, 4, 4, 64)          0
_________________________________________________________________
conv2d_191 (Conv2D)          (None, 4, 4, 128)         73856
_________________________________________________________________
dropout_2 (Dropout)          (None, 4, 4, 128)         0
_________________________________________________________________
conv2d_192 (Conv2D)          (None, 4, 4, 256)         295168
_________________________________________________________________
conv2d_193 (Conv2D)          (None, 4, 4, 256)         590080
_________________________________________________________________
max_pooling2d_9 (MaxPooling2 (None, 2, 2, 256)         0
_________________________________________________________________
dropout_3 (Dropout)          (None, 2, 2, 256)         0
_________________________________________________________________
flatten (Flatten)            (None, 1024)              0
_________________________________________________________________
dense (Dense)                (None, 512)               524800
_________________________________________________________________
dropout_4 (Dropout)          (None, 512)               0
_________________________________________________________________
dense_1 (Dense)              (None, 256)               131328
_________________________________________________________________
dropout_5 (Dropout)          (None, 256)               0
_________________________________________________________________
dense_2 (Dense)              (None, 3)                 771
=================================================================
Total params: 1,934,067
Trainable params: 1,934,067
Non-trainable params: 0
_________________________________________________________________
Epoch 1/8
Epoch 00001: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 7s - loss: 0.6362 - MSE: 0.1225 - val_loss: 1.3662 - val_MSE: 0.3387
Epoch 2/8
Epoch 00002: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 7s - loss: 0.5295 - MSE: 0.1032 - val_loss: 1.4071 - val_MSE: 0.3562
Epoch 3/8
Epoch 00003: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 7s - loss: 0.5986 - MSE: 0.1080 - val_loss: 1.0744 - val_MSE: 0.2654
Epoch 4/8
Epoch 00004: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 7s - loss: 0.4734 - MSE: 0.0935 - val_loss: 1.1686 - val_MSE: 0.2983
Epoch 5/8
Epoch 00005: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 8s - loss: 0.4455 - MSE: 0.0902 - val_loss: 1.3958 - val_MSE: 0.3653
Epoch 6/8
Epoch 00006: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 7s - loss: 0.4440 - MSE: 0.0911 - val_loss: 1.2252 - val_MSE: 0.3160
Epoch 7/8
Epoch 00007: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 7s - loss: 0.4698 - MSE: 0.0933 - val_loss: 1.3832 - val_MSE: 0.3559
Epoch 8/8
Epoch 00008: saving model to /Users/victorialiu/git/creatica/tmp
126/126 - 7s - loss: 0.4304 - MSE: 0.0886 - val_loss: 1.3510 - val_MSE: 0.3537
True
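Since the full model is saved under creatica/code/model, another module can load it back in. A minimal sketch, assuming the 'demo' model name used above and adjusting the path to wherever creatica/code/model lives on your machine:
import os
from keras.models import load_model

#load the full model (architecture + weights) that model.save() wrote above
reloaded = load_model(os.path.join(os.getcwd(), 'model', 'demo.h5'))
reloaded.summary()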
Authors: Victoria Liu and Gloria Liu
Last modified: November 2020
Description: A script to train and save a neural net to recognize hot dogs vs. carrots vs. bananas.
Credits: Parts of the code were originally part of a Caltech extra credit assignment (CS 156a), where Aadyot Bhatnagar wrote the parse_args() and main() functions. The conv-net code is heavily modified from J-Yash's open-source code. All markdown is by Victoria / Gloria.