Loaded images as numpy file, started template for neural net
This commit is contained in:
parent b1a5006131
commit 03eba4b101

66	mini_proj/Load_Images.py	Normal file

@@ -0,0 +1,66 @@
'''
Created by Tony Silvestre to prepare images for use from a Kaggle Where's Waldo dataset
'''
import os
import numpy as np
from matplotlib import pyplot as plt
import math
import cv2

def gen_data(w_path, n_w_path):
    waldo_file_list = os.listdir(os.path.join(w_path))
    total_w = len(waldo_file_list)
    not_waldo_file_list = os.listdir(os.path.join(n_w_path))
    total_nw = len(not_waldo_file_list)
    imgs_raw = []  # Images
    imgs_lbl = []  # Image labels

    #imgs_raw = np.array([np.array(imread(wdir + "waldo/"+fname)) for fname in os.listdir(wdir + "waldo")])
    for i, image_name in enumerate(waldo_file_list):
        # NOTE: cv2.imread() returns a numpy array in BGR, not RGB,
        # and returns None if the file cannot be read as an image
        pic = cv2.imread(os.path.join(w_path, image_name))
        imgs_raw.append(pic)
        imgs_lbl.append(1)  # Label of 1 as Waldo is present in the image
        print('Completed: {0}/{1} Waldo images'.format(i+1, total_w))

    for i, image_name in enumerate(not_waldo_file_list):
        pic = cv2.imread(os.path.join(n_w_path, image_name))
        imgs_raw.append(pic)
        imgs_lbl.append(0)  # Label of 0 as Waldo is absent
        print('Completed: {0}/{1} non-Waldo images'.format(i+1, total_nw))

    # Calculate what 30% of each class is (floored to an integer count)
    third_of_w = math.floor(0.3*total_w)
    third_of_nw = math.floor(0.3*total_nw)

    # Split the data into training and test sets (70%/30%). Waldo images sit at
    # indices [0, total_w) and non-Waldo images at [total_w, len(imgs_raw)).
    train_data = np.append(imgs_raw[third_of_w:total_w], imgs_raw[(total_w + third_of_nw):], axis=0)
    train_lbl = np.append(imgs_lbl[third_of_w:total_w], imgs_lbl[(total_w + third_of_nw):], axis=0)
    # If axis is not given, both arrays are flattened before being appended
    test_data = np.append(imgs_raw[0:third_of_w], imgs_raw[total_w:(total_w + third_of_nw)], axis=0)
    test_lbl = np.append(imgs_lbl[0:third_of_w], imgs_lbl[total_w:(total_w + third_of_nw)], axis=0)
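    # Added sanity check (illustrative, not in the original pipeline): every
    # image should carry a label, and the two splits together should cover
    # the whole dataset exactly once.
    assert len(train_data) == len(train_lbl)
    assert len(test_data) == len(test_lbl)
    assert len(train_data) + len(test_data) == len(imgs_raw)
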
    try:
        # Save the data as numpy files
        np.save('Waldo_train_data.npy', train_data)
        np.save('Waldo_train_lbl.npy', train_lbl)
        np.save('Waldo_test_data.npy', test_data)
        np.save('Waldo_test_lbl.npy', test_lbl)
        print("All data saved")
    except Exception as e:
        print("ERROR: Data may not be completely saved: {}".format(e))

def main():
    # Paths to the Waldo images
    waldo_path = 'waldo_data/64/waldo'
    n_waldo_path = 'waldo_data/64/notwaldo'

    gen_data(waldo_path, n_waldo_path)

if __name__ == '__main__':
    main()
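
Once gen_data() has run, the saved arrays can be spot-checked from an interpreter. A minimal sketch, assuming the .npy files were written to the current working directory:

import numpy as np
data = np.load('Waldo_train_data.npy')
lbl = np.load('Waldo_train_lbl.npy')
print(data.shape, lbl.shape)  # expect (N, 64, 64, 3) and (N,) for the 64-pixel set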

BIN	mini_proj/Waldo_test_data.npy	Normal file
Binary file not shown.

BIN	mini_proj/Waldo_test_lbl.npy	Normal file
Binary file not shown.

BIN	mini_proj/Waldo_train_data.npy	Normal file
Binary file not shown.

BIN	mini_proj/Waldo_train_lbl.npy	Normal file
Binary file not shown.

128	mini_proj/waldo_model.py	Normal file

@@ -0,0 +1,128 @@
import numpy as np
import sys
import time as t
'''
from keras.models import Sequential
from keras.layers import Dense, Dropout, Activation, Flatten, Reshape, Merge, Permute
from keras.layers import Deconvolution2D, Convolution2D, MaxPooling2D, UpSampling2D, ZeroPadding2D
from keras.layers import Input
from keras.layers.normalization import BatchNormalization
from keras.utils import np_utils
'''
from keras import backend as K
from keras.callbacks import ModelCheckpoint  # needed for the checkpoint callback below
K.set_image_dim_ordering('th')
np.random.seed(7)

'''
Model definition
'''
def FCN():
    ## Sample structure sketched below (Keras 1.x functional API)
    # inputs = Input((1, w, h))

    # conv1 = Convolution2D(32, 3, 3, activation='relu', border_mode='same')(inputs)
    # conv1 = Convolution2D(32, 3, 3, activation='relu', border_mode='same')(conv1)
    # m_pool1 = MaxPooling2D(pool_size=(2, 2))(conv1)

    # conv2 = Convolution2D(64, 3, 3, activation='relu', border_mode='same')(m_pool1)
    # drop1 = Dropout(0.2)(conv2)
    # conv2 = Convolution2D(64, 3, 3, activation='relu', border_mode='same')(drop1)
    # m_pool2 = MaxPooling2D(pool_size=(2, 2))(conv2)

    # conv7 = Convolution2D(512, 3, 3, activation='relu', border_mode='same')(m_pool6)
    # conv7 = Convolution2D(1, 3, 3, activation='relu', border_mode='same')(conv7)

    # up8x = UpSampling2D(size=(2, 2))(conv16x)
    # merge8x = merge([up8x, m_pool3], mode='concat', concat_axis=1)
    # conv8x = Convolution2D(1, 1, 1, activation='relu', border_mode='same')(merge8x)

    # up4x = UpSampling2D(size=(2, 2))(conv8x)
    # merge4x = merge([up4x, m_pool2], mode='concat', concat_axis=1)
    # conv4x = Convolution2D(1, 1, 1, activation='relu', border_mode='same')(merge4x)

    # up4x = UpSampling2D(size=(4, 4))(conv4x)
    # model = Model(input=inputs, output=up4x)
    # # Optimizer uses recommended Adadelta values
    # model.compile(optimizer=Adadelta(lr=0.01), loss='categorical_crossentropy', metrics=['accuracy'])
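    # Added placeholder network (a stand-in sketch, NOT the intended FCN):
    # without it, `return model` below raises a NameError because the whole
    # template above is commented out. Assumes 64x64 RGB inputs stored
    # channels-first to match the 'th' dim ordering set at the top.
    from keras.models import Model
    from keras.layers import Input, Convolution2D, Flatten, Dense
    inputs = Input((3, 64, 64))
    conv = Convolution2D(8, 3, 3, activation='relu', border_mode='same')(inputs)
    out = Dense(1, activation='sigmoid')(Flatten()(conv))
    model = Model(input=inputs, output=out)
    model.compile(optimizer='adadelta', loss='binary_crossentropy', metrics=['accuracy'])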
    return model

## Open data
im_train = np.load('Waldo_train_data.npy')
lbl_train = np.load('Waldo_train_lbl.npy')
im_test = np.load('Waldo_test_data.npy')
lbl_test = np.load('Waldo_test_lbl.npy')
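
# Added reshaping step (an assumption tied to the placeholder input shape in
# FCN above): cv2 images are channels-last, (N, 64, 64, 3), while the 'th'
# ordering expects channels-first, (N, 3, 64, 64).
im_train = im_train.transpose(0, 3, 1, 2)
im_test = im_test.transpose(0, 3, 1, 2)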

## Define model
model = FCN()

## Define training parameters
epochs = 40  # an epoch is one forward pass and back-propagation of all training data
batch_size = 5
#lrate = 0.01
#decay = lrate/epochs
# epoch - one forward pass and one backward pass of all the training data
# batch size - number of training examples used in one forward/backward pass
#   (a higher batch size uses more memory)
# learning rate - controls the magnitude of weight changes while training the NN

## Train model
# Purely superficial output
sys.stdout.write("\nFitting model")
sys.stdout.flush()
for i in range(0, 3):
    t.sleep(0.8)
    sys.stdout.write('.')
    sys.stdout.flush()
print()

# Output the model structure
for i in range(0, len(model.layers)):
    print("Layer {}: {}".format(i, model.layers[i].output))
print('-'*30)

filepath = "checkpoint.hdf5"  # Defines the model checkpoint file
checkpoint = ModelCheckpoint(filepath, verbose=1, save_best_only=False)  # Defines the checkpoint process
callbacks_list = [checkpoint]  # Adds checkpointing to the list of actions performed during training
start = t.time()  # Records time before training
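# Added note (assumption: keras.models.load_model is available in this Keras
# version): if training is interrupted, the last checkpoint can be reloaded:
#   from keras.models import load_model
#   model = load_model('checkpoint.hdf5')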

# Fit the model using the parameters above
model.fit(im_train, lbl_train, nb_epoch=epochs, batch_size=batch_size,
          verbose=2, shuffle=True, callbacks=callbacks_list)
# If a ValueError is raised here, the network's output and the corresponding
# lbl_train data probably don't match
end = t.time()  # Records time after training

print('Training Duration: {}'.format(end-start))
print('-'*30)
print("*** Saving FCN model and weights ***")
'''
# *To save the model and weights separately:
# save the model as a json file
model_json = model.to_json()
with open("UNet_model.json", "w") as json_file:
    json_file.write(model_json)
# save the weights as an h5 file
model.save_weights("UNet_weights.h5")
print("\nModel weights and structure have been saved.\n")
'''
# Save the model as one file
model.save('Waldo.h5')
print("\nModel weights and structure have been saved.\n")

## Testing the model
# The test data was already loaded from the .npy files above, so no separate
# loading step is needed here
# Show data stats
print('*'*30)
print(im_test.shape)
print(lbl_test.shape)
print('*'*30)

start = t.time()
# Pass the test set through the model
pred_lbl = model.predict(im_test, verbose=1, batch_size=batch_size)
end = t.time()
print("Images generated in {} seconds".format(end - start))
np.save('Test/predicted_results.npy', pred_lbl)  # assumes a Test/ directory exists
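
The saved predictions can be turned into a quick accuracy figure afterwards. An illustrative sketch; thresholding at 0.5 assumes the sigmoid output of the placeholder model above:

import numpy as np
pred = np.load('Test/predicted_results.npy')
lbl = np.load('Waldo_test_lbl.npy')
acc = np.mean((pred.ravel() > 0.5) == lbl)
print('Test accuracy: {:.3f}'.format(acc))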