resume_training.py
# This file resumes training of the question answering network from the most
# recent checkpoint saved by the main training run
import numpy as np
import tensorflow as tf
from network.config import CONFIG
from network.build_model import get_batch, get_feed_dict
# custom imports
from preprocessing.dataset import Dataset
from evaluation_metrics import get_f1_from_tokens, get_exact_match_from_tokens

print("Resuming training")
D = Dataset(CONFIG.EMBEDDING_FILE)
index2embedding = D.index2embedding
padded_data, (max_length_question, max_length_context) = D.load_questions(CONFIG.QUESTION_FILE)
print("Loaded data")
tf.reset_default_graph()
latest_checkpoint_path = tf.train.latest_checkpoint('./model/')
print("restoring from " + latest_checkpoint_path)
imported_graph = tf.train.import_meta_graph(latest_checkpoint_path + '.meta')
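# import_meta_graph() recreates the saved graph structure and returns a
# tf.train.Saver bound to it; restore() inside the session below then loads
# the trained variable values from the checkpoint.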
# No tf.global_variables_initializer() run here: the restore assigns every
# variable, and running an init op after restoring would overwrite the
# trained weights with fresh values.
batch_size = CONFIG.BATCH_SIZE

with tf.Session() as sess:
    imported_graph.restore(sess, latest_checkpoint_path)
    graph = tf.get_default_graph()
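    # Look up the placeholders and ops by the names they were given when the
    # graph was first built (presumably in network.build_model).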
    question_batch_placeholder = graph.get_tensor_by_name("question_batch_ph:0")
    context_batch_placeholder = graph.get_tensor_by_name("context_batch_ph:0")
    answer_start = graph.get_tensor_by_name("answer_start_true_ph:0")
    answer_end = graph.get_tensor_by_name("answer_end_true_ph:0")
    loss = graph.get_tensor_by_name("loss_to_optimize:0")
    train_op = graph.get_operation_by_name("train_op")
    embedding = graph.get_tensor_by_name("embedding_ph:0")
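    # Note: answer_start / answer_end resolve to the ground-truth span
    # placeholders ("..._true_ph") of the restored graph; they are fed with
    # the label batches during both training and validation below.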

    loss_writer = tf.summary.FileWriter('./log_tensorboard/plot_loss', sess.graph)
    val_writer = tf.summary.FileWriter('./log_tensorboard/plot_val', sess.graph)
    # Summaries need to be displayed on tensorboard.
    # Whenever the loss needs to be recorded, the mean loss is fed to this placeholder
    tf_loss_ph = tf.placeholder(tf.float32, shape=None, name='Loss_summary')
    tf_validation_ph = tf.placeholder(tf.float32, shape=None, name='f1_score')
    # Scalar summary objects for the loss and f1 score so they can be displayed on tensorboard
    tf_loss_summary = tf.summary.scalar('Loss_summary', tf_loss_ph)
    tf_validation_summary = tf.summary.scalar('f1_score', tf_validation_ph)
    print("SESSION INITIALIZED")
    dataset_size = len(padded_data)
    padded_data = np.array(padded_data)
    np.random.shuffle(padded_data)
    # print("PADDED DATA SHAPE: ", padded_data.shape)
    padded_data_train = padded_data[0:int(0.95 * padded_data.shape[0])]
    padded_data_validation = padded_data[int(0.95 * padded_data.shape[0]):]
    print("Validating on", padded_data_validation.shape[0], "elements")

    for epoch in range(CONFIG.MAX_EPOCHS):
        print("Epoch # : ", epoch + 1)
        # Shuffle only the training split between epochs, so the validation
        # set stays fixed
        np.random.shuffle(padded_data_train)
        losses = []
        for iteration in range(0, len(padded_data_train) - CONFIG.BATCH_SIZE, CONFIG.BATCH_SIZE):
            batch = padded_data_train[iteration:iteration + CONFIG.BATCH_SIZE]
            question_batch, context_batch, answer_start_batch, answer_end_batch = \
                get_batch(batch, CONFIG.BATCH_SIZE, max_length_question, max_length_context)
            _, loss_val = sess.run(
                [train_op, loss],
                feed_dict=get_feed_dict(question_batch, context_batch,
                                        answer_start_batch, answer_end_batch,
                                        CONFIG.DROPOUT_KEEP_PROB, index2embedding))
            loss_val_mean = np.mean(loss_val)
            if iteration % (CONFIG.BATCH_SIZE - 1) == 0:
                print("Loss in epoch: ", loss_val_mean, "(", iteration, "/", len(padded_data_train), ")")
            losses.append(loss_val_mean.item())
        mean_epoch_loss = np.mean(np.array(losses))
        print("loss: ", mean_epoch_loss)
        summary_str = sess.run(tf_loss_summary, feed_dict={tf_loss_ph: mean_epoch_loss})
        loss_writer.add_summary(summary_str, epoch)
        loss_writer.flush()
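
        # Evaluate on the held-out split each epoch: token-level F1 and exact
        # match (EM) over the answer spans, plus the validation loss.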
        f1score = []
        emscore = []
        validation_losses = []
        # validation starting
        for counter in range(0, len(padded_data_validation) - CONFIG.BATCH_SIZE, CONFIG.BATCH_SIZE):
            batch = padded_data_validation[counter:(counter + CONFIG.BATCH_SIZE)]
            question_batch_validation, context_batch_validation, answer_start_batch_actual, answer_end_batch_actual = \
                get_batch(batch, CONFIG.BATCH_SIZE, max_length_question, max_length_context)
            # keep_prob = 1.0 disables dropout at evaluation time
            estimated_start_index, estimated_end_index, loss_validation = sess.run(
                [answer_start, answer_end, loss],
                feed_dict=get_feed_dict(question_batch_validation, context_batch_validation,
                                        answer_start_batch_actual, answer_end_batch_actual,
                                        1.0, index2embedding))
            # print("pred:", loss_validation, estimated_start_index, "->", estimated_end_index)
            # print("real:", loss_validation, answer_start_batch_actual, "->", answer_end_batch_actual)
            validation_losses.append(loss_validation)
            f1 = 0
            em = 0
            for i in range(len(estimated_end_index)):
                f1 += get_f1_from_tokens(answer_start_batch_actual[i], answer_end_batch_actual[i],
                                         estimated_start_index[i], estimated_end_index[i],
                                         context_batch_validation[i], D)
                em += get_exact_match_from_tokens(answer_start_batch_actual[i], answer_end_batch_actual[i],
                                                  estimated_start_index[i], estimated_end_index[i],
                                                  context_batch_validation[i], D)
            print("f1 score: ", f1 / len(estimated_end_index))
            print("EM score: ", em / len(estimated_end_index))
            # append per-batch means so the epoch average is not inflated by
            # the batch size
            f1score.append(f1 / len(estimated_end_index))
            emscore.append(em / len(estimated_end_index))
        # print(f1score)
        f1_mean = np.mean(f1score)
        em_mean = np.mean(emscore)
        validation_loss = np.mean(validation_losses)
        print("Validation loss: ", validation_loss)
        print("Validation f1 score %: ", f1_mean * 100)
        print("Validation em score %: ", em_mean * 100)
        summary_str = sess.run(tf_validation_summary, feed_dict={tf_validation_ph: f1_mean})
        val_writer.add_summary(summary_str, epoch)
        val_writer.flush()
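
        # Sketch: a Saver built once from the restored graph could re-save the
        # model here after each epoch, so a later run resumes from this point
        # (the './model/model' prefix is an assumption, not from the original):
        #   saver = tf.train.Saver()   # create before the epoch loop
        #   saver.save(sess, './model/model', global_step=epoch)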