main.py

#!/usr/bin/env python3

import os
import io

import numpy as np


import itertools


import pickle

import time

import matplotlib.pyplot as plt

from datetime import datetime

import argparse
import csv

import tensorflow as tf
from tensorflow.keras.layers import *
from tensorflow.keras.models import *
from tensorflow.keras.utils import *
from tensorflow.keras.callbacks import *
from tensorflow.keras.activations import *

from tensorflow.keras import backend as K

from sklearn.metrics import confusion_matrix
from sklearn.metrics import classification_report
from sklearn.model_selection import StratifiedKFold
from sklearn.metrics import balanced_accuracy_score
from sklearn.model_selection import StratifiedShuffleSplit
from sklearn.model_selection import ShuffleSplit

from classifiers import FCN
from classifiers import FCNEmbedded
from classifiers import LSTM
from classifiers import LSTMEmbedded

seed = 7
epoch = 400
batch = 1024
verbose = True
patience = 20

np.random.seed(seed)


def load_data(input_file, path):
    """Load datasets

    Parameters
    ----------
    input_file : str
        name of the dataset file

    path : str
        path to the dataset folder

    
    Returns
    -------
    list
        list of subsets X_TRAIN, Y_TRAIN, X_VALIDATION, Y_VALIDATION, X_TEST, Y_TEST, 
        and dictActivities, listActivities
    
    """

    X_TRAIN = []
    Y_TRAIN = []

    X_VALIDATION = []
    Y_VALIDATION = []

    #load the dic of activities
    if "MILAN" in path:
        pickle_in = open("datasets/milan_activity_list.pickle","rb")

    if "ARUBA" in path:
        pickle_in = open("datasets/aruba_activity_list.pickle","rb")

    dictActivities = pickle.load(pickle_in)

    # get all keys to an array
    *listActivities, = dictActivities
    

    X_TEST = np.load("{}/{}_X_TEST.npy".format(path,input_file),allow_pickle=True)
    Y_TEST = np.load("{}/{}_Y_TEST.npy".format(path,input_file),allow_pickle=True)


    for k in range(3):
        X_TRAIN.append(np.load("{}/{}_X_TRAIN_{}.npy".format(path,input_file,k),allow_pickle=True))
        Y_TRAIN.append(np.load("{}/{}_Y_TRAIN_{}.npy".format(path,input_file,k),allow_pickle=True))


        X_VALIDATION.append(np.load("{}/{}_X_VALIDATION_{}.npy".format(path,input_file,k),allow_pickle=True))
        Y_VALIDATION.append(np.load("{}/{}_Y_VALIDATION_{}.npy".format(path,input_file,k),allow_pickle=True))

    return X_TRAIN, Y_TRAIN, X_VALIDATION, Y_VALIDATION, X_TEST, Y_TEST, listActivities


def evaluate_model(model, testX, testy, batch_size):
    
    # evaluate model
    _, accuracy = model.evaluate(testX, testy, batch_size=batch_size, verbose=0)
    
    return accuracy

# serialize model to JSON
def save_model(model,filename):
    model_json = model.to_json()
    with open(filename+".json", "w") as json_file:
        json_file.write(model_json)
    
    model.save_weights(filename+".h5")
    
    print("Saved model to disk")

# load json and create model
def load_model_2(filename):
    json_file = open(filename+".json", 'r')
    loaded_model_json = json_file.read()
    json_file.close()
    loaded_model = model_from_json(loaded_model_json)
    
    loaded_model.load_weights(filename+".h5")
    
    return loaded_model

def plot_to_image(figure):
  """Converts the matplotlib plot specified by 'figure' to a PNG image and
  returns it. The supplied figure is closed and inaccessible after this call."""
  # Save the plot to a PNG in memory.
  buf = io.BytesIO()
  plt.savefig(buf, format='png')
  # Closing the figure prevents it from being displayed directly inside
  # the notebook.
  plt.close(figure)
  buf.seek(0)
  # Convert PNG buffer to TF image
  image = tf.image.decode_png(buf.getvalue(), channels=4)
  # Add the batch dimension
  image = tf.expand_dims(image, 0)
  return image

def plot_confusion_matrix(cm, class_names):
  """
  Returns a matplotlib figure containing the plotted confusion matrix.

  Args:
    cm (array, shape = [n, n]): a confusion matrix of integer classes
    class_names (array, shape = [n]): String names of the integer classes
  """
  figure = plt.figure(figsize=(8, 8))
  plt.imshow(cm, interpolation='None', cmap=plt.cm.Blues)
  plt.title("Confusion matrix")
  plt.colorbar()
  tick_marks = np.arange(len(class_names))
  plt.xticks(tick_marks, class_names, rotation=45)
  plt.yticks(tick_marks, class_names)

  # Normalize the confusion matrix.
  cm = np.around(cm.astype('float') / cm.sum(axis=1)[:, np.newaxis], decimals=2)

  # Use white text if squares are dark; otherwise black.
  threshold = cm.max() / 1.05
  #threshold = 10
  for i, j in itertools.product(range(cm.shape[0]), range(cm.shape[1])):

    if cm[i, j] > threshold:
        color = "white"  
    else: 
        color = "black"

    plt.text(j, i, cm[i, j], horizontalalignment="center", color="black")

  plt.tight_layout()
  plt.ylabel('True label')
  plt.xlabel('Predicted label')
  return figure

def log_confusion_matrix(epoch, logs):
  # Use the model to predict the values from the validation dataset.
  test_pred_raw = model.predict(x_validation)
  test_pred = np.argmax(test_pred_raw, axis=1)

  # Calculate the confusion matrix.
  cm = confusion_matrix(data_Y_train[k_validation_index].astype('int32'), test_pred.astype('int32'))
  # Log the confusion matrix as an image summary.
  figure = plot_confusion_matrix(cm, class_names=listActivities)
  cm_image = plot_to_image(figure)

  # Log the confusion matrix as an image summary.
  with file_writer_cm.as_default():
    tf.summary.image("Confusion Matrix", cm_image, step=epoch)


if __name__ == '__main__':

    p = argparse.ArgumentParser(formatter_class=argparse.RawDescriptionHelpFormatter, description='')
    p.add_argument('--i', dest='input', action='store', default='', help='input', required = True)
    p.add_argument('--d', dest='path', action='store', default='', help='path', required = True)
    p.add_argument('--c', dest='option', action='store', default='', help='option')
    p.add_argument('--m', dest='models', action='store', default='[]', help='LSTM_Embedded,LSTM,FCN,FCN_Embedded', nargs='+', required = True)
    args = p.parse_args()

    input_file = str(args.input)
    path = str(args.path)
    option = str(args.option)
    MODELS = args.models

    print(MODELS)

    if "MILAN" in path:
        root_logdir = os.path.join("results", "logs_milan_sliding_windows_over_activity")
        vocabSize = 130
    
    if "ARUBA" in path:
        root_logdir = os.path.join("results", "logs_aruba_sliding_windows_over_activity")
        vocabSize = 309


    filename = "{}_{}".format(input_file,option)

    print(tf.__version__)

    strategy = tf.distribute.MirroredStrategy()

    X_TRAIN, Y_TRAIN, X_VALIDATION, Y_VALIDATION, X_TEST, Y_TEST, listActivities = load_data(input_file, path)


    cvscores = []
    bscores = []


    cvscores_FCN = []
    bscores_FCN = []
    path_FCN = ""


    cvscores_FCN_Embedded = []
    bscores_FCN_Embedded = []
    path_FCN_Embedded = ""


    cvscores_LSTM = []
    bscores_LSTM = []
    path_LSTM = ""


    cvscores_LSTM_Embedded = []
    bscores_LSTM_Embedded = []
    path_LSTM_Embedded = ""

    
    currenttime  = time.strftime("%Y_%m_%d_%H_%M_%S")


    for k in range(len(X_TRAIN)):


        y_train = to_categorical(Y_TRAIN[k])
        y_validation = to_categorical(Y_VALIDATION[k])
        y_test = to_categorical(Y_TEST)


        for m in MODELS:
            
            print("MODEL: {} EXPERIENCE: {}".format(m, k+1))

            ###########_FCN_##########
            if m == "FCN":

                cvscores = cvscores_FCN
                bscores = bscores_FCN

                x_train = X_TRAIN[k].reshape(X_TRAIN[k].shape[0],X_TRAIN[k].shape[1],1)
                
                x_validation = X_VALIDATION[k].reshape(X_VALIDATION[k].shape[0],X_VALIDATION[k].shape[1],1)
                
                x_test = X_TEST.reshape(X_TEST.shape[0],X_TEST.shape[1],1)

                with strategy.scope():
                    model = FCN.model(x_train,y_train)

            
            ###########_FCN_WITH_EMBEDDING_##########
            if m == "FCN_Embedded":

                cvscores = cvscores_FCN_Embedded
                bscores = bscores_FCN_Embedded

                x_train =  X_TRAIN[k]
                
                x_validation = X_VALIDATION[k]

                x_test = X_TEST

                with strategy.scope():
                    model = FCNEmbedded.modelFCNEmbedded(x_train,y_train,vocabSize)


            ###########_LSTM_##########
            if m == "LSTM":

                cvscores = cvscores_LSTM
                bscores = bscores_LSTM

                x_train = X_TRAIN[k].reshape(X_TRAIN[k].shape[0],X_TRAIN[k].shape[1],1)
                
                x_validation = X_VALIDATION[k].reshape(X_VALIDATION[k].shape[0],X_VALIDATION[k].shape[1],1)
                
                x_test = X_TEST.reshape(X_TEST.shape[0],X_TEST.shape[1],1)

                with strategy.scope():
                    model = LSTM.model(x_train,y_train)


            ###########_LSTM_WITH_EMBEDDING_##########
            if m == "LSTM_Embedded":

                cvscores = cvscores_LSTM_Embedded
                bscores = bscores_LSTM_Embedded

                x_train =  X_TRAIN[k]
                
                x_validation = X_VALIDATION[k]

                x_test = X_TEST

                with strategy.scope():
                    model = LSTMEmbedded.model(x_train,y_train,vocabSize)

            
            ###########_TRAIN_##########

            model_name = model.name

            path = os.path.join("results", model_name, "run_"+ filename + "_" + str(currenttime))

            ###########_FCN_##########
            if m == "FCN":
                path_FCN = path

            ###########_FCN_WITH_EMBEDDING_##########
            if m == "FCN_Embedded":
                path_FCN_Embedded = path

            ###########_LSTM_##########
            if m == "LSTM":
                path_LSTM = path

            ###########_LSTM_WITH_EMBEDDING_##########
            if m == "LSTM_Embedded":
                path_LSTM_Embedded = path


            # create a folder with the model name
            # if the folder doesn't exist
            if not os.path.exists(path):
                os.makedirs(path)
            

            # all paths
            run_id = model_name + "_" + filename + "_" + str(currenttime) + str(k)
            log_dir = os.path.join(root_logdir, run_id)

            csv_name = model_name + "_" + filename + "_"+ str(k) + ".csv"
            csv_path = os.path.join(path, csv_name)

            picture_name = model_name + "_" + filename + "_" + str(k) + ".png"
            picture_path = os.path.join(path, picture_name)

            report_name = model_name + "_repport_" + filename + "_" + str(k) + ".txt"
            report_path = os.path.join(path, report_name)

            confusion_name = model_name + "_confusion_matrix_" + filename + "_" + str(k) + ".txt"
            confusion_path = os.path.join(path, confusion_name)

            model_name_saved = model_name + "_" + filename + "_" + str(k)
            model_path = os.path.join(path, model_name_saved)

            best_model_name_saved = model_name + "_" + filename + "_BEST_" + str(k) +".h5"
            best_model_path = os.path.join(path, best_model_name_saved)

            
            #ceate a picture of the model
            plot_model(model, show_shapes=True, to_file=picture_path)

            #compile the model
            model.compile(loss='categorical_crossentropy', optimizer='adam', metrics=['accuracy'])
                
            #print summary
            print(model.summary())

            # create a folder with the log
            # if the folder doesn't exist
            if not os.path.exists(log_dir):
                os.makedirs(log_dir)

            # create a callback for the tensorboard
            tensorboard_cb = tf.keras.callbacks.TensorBoard(log_dir)
            #file_writer_cm = tf.summary.create_file_writer(log_dir + '/cm')


            #callbacks
            csv_logger = CSVLogger(csv_path)

            # simple early stopping
            es = EarlyStopping(monitor='val_loss', mode='min', verbose=1, patience=patience)
            mc = ModelCheckpoint(best_model_path, monitor='val_accuracy', mode='max', verbose=1, save_best_only=True)
            # Define the per-epoch callback.
            #cm_callback = tf.keras.callbacks.LambdaCallback(on_epoch_end=log_confusion_matrix)

            #cbs = [csv_logger,tensorboard_cb,mc,es,cm_callback]
            cbs = [csv_logger,tensorboard_cb,mc,es]


            # fit network
            model.fit(x_train, y_train, epochs=epoch, batch_size=batch, verbose=verbose, callbacks=cbs, validation_data=(x_validation, y_validation))
            

            ##########_EVALUATION_##########
            # load the best model on this k fold

            saved_model = tf.keras.models.load_model(best_model_path)
            
            # evaluate
            score = evaluate_model(saved_model, x_test, y_test, batch)

            # store score
            cvscores.append(score)
            
            print('Accuracy: %.3f' % (score * 100.0))

            ##########_GENERATE_##########

            # Make prediction using the model
            Y_hat = saved_model.predict(x_test)
            Y_pred = np.argmax(Y_hat, axis=1)
            Y_pred = Y_pred.reshape(Y_pred.shape[0], 1)
            Y_pred = Y_pred.astype('int32')
            Y_test = Y_TEST.astype('int32')


            report = classification_report(Y_test, Y_pred, target_names=listActivities)
            print(report)

            text_file = open(report_path, "w")
            n = text_file.write(report)
            text_file.close()


            cm=confusion_matrix(Y_test, Y_pred)
            print(cm)

            text_file = open(confusion_path, "w")
            n = text_file.write("{}".format(cm))
            text_file.close()

            bscore = balanced_accuracy_score(Y_test, Y_pred)
            bscores.append(bscore)
            print('Balanced Accuracy: %.3f' % (bscore * 100.0))

            
            ###########_FCN_##########
            if m == "FCN":
                
                cvscores_FCN = cvscores
                bscores_FCN = bscores

            ###########_FCN_WITH_EMBEDDING_##########
            if m == "FCN_Embedded":

                cvscores_FCN_Embedded = cvscores
                bscores_FCN_Embedded = bscores

            ###########_LSTM_##########
            if m == "LSTM":
                
                cvscores_LSTM = cvscores
                bscores_LSTM = bscores

            ###########_LSTM_WITH_EMBEDDING_##########
            if m == "LSTM_Embedded":

                cvscores_LSTM_Embedded = cvscores
                bscores_LSTM_Embedded = bscores
        

    for m in MODELS:
        ###########_FCN_##########
        if m == "FCN":

            cvscores = cvscores_FCN
            bscores = bscores_FCN
            path = path_FCN

        
        ###########_FCN_WITH_EMBEDDING_##########
        if m == "FCN_Embedded":

            cvscores = cvscores_FCN_Embedded
            bscores = bscores_FCN_Embedded
            path = path_FCN_Embedded


        ###########_LSTM_##########
        if m == "LSTM":

            cvscores = cvscores_LSTM
            bscores = bscores_LSTM
            path = path_LSTM


        ###########_LSTM_WITH_EMBEDDING_##########
        if m == "LSTM_Embedded":

            cvscores = cvscores_LSTM_Embedded
            bscores = bscores_LSTM_Embedded
            path = path_LSTM_Embedded


        print('Model: {}'.format(m))
        print('Accuracy: {:.2f}% (+/- {:.2f}%)'.format(np.mean(cvscores)*100, np.std(cvscores)))
        print('Balanced Accuracy: {:.2f}% (+/- {:.2f}%)'.format(np.mean(bscores)*100, np.std(bscores)))


        # save metrics
        csvfile = 'cv_scores_' + m + '_' + filename + '_' + str(currenttime) + '.csv'


        with open(os.path.join(path, csvfile), "w") as output:
            writer = csv.writer(output, lineterminator='\n')

            writer.writerow(["accuracy score :"])
            for val in cvscores:
                writer.writerow([val*100])
            writer.writerow([""])
            writer.writerow([np.mean(cvscores)*100])
            writer.writerow([np.std(cvscores)])

            writer.writerow([""])
            writer.writerow(["balanced accuracy score :"])

            for val2 in bscores:
                writer.writerow([val2*100])
            writer.writerow([""])
            writer.writerow([np.mean(bscores)*100])
            writer.writerow([np.std(bscores)])