cnn_hpc_final.py
#!/usr/bin/env python3
# -*- coding: utf-8 -*-
"""
Created on Mon Nov 29 11:03:46 2021
@author: simon
"""
import numpy as np
from importlib import reload
import sys
import torch
import torch.nn as nn
import pickle
import helper_functions
reload(helper_functions)
from helper_functions import (accuracy_rate, load_data, capacity, get_good_idx,
                              get_slice, get_k_fold_cv_idx, get_x_sequences_cnn,
                              train, get_all_accuracy_rates, allocate_x_batch_cnn,
                              quantile_score, get_competition_preds)
import argparse
import os
parser = argparse.ArgumentParser()
parser.add_argument('--num_hidden', help='Integer number of hidden layers', type=int)
parser.add_argument('--kernel_size', help='Integer size of the convolution kernel', type=int)
parser.add_argument('--pred_seq_len', help='Integer number of time steps used for each prediction', type=int)
parser.add_argument('--loss', help='Training loss metric, either MSE or L1', type=str)
parser.add_argument('--weight_decay', help='Weight decay coefficient (float)', type=float)
parser.add_argument('--dropout', help='Dropout probability (float)', type=float)
parser.add_argument('--case', help='Data case identifier (int), passed to load_data', type=int)
# args = parser.parse_args("--num_hidden=2 --kernel_size=7 --pred_seq_len=25 --loss=MSE --weight_decay=0.01 --dropout=0.1 --case=1".split())
args = parser.parse_args()
num_hidden = args.num_hidden
pred_seq_len = args.pred_seq_len
kernel_size = args.kernel_size
loss = args.loss
weight_decay = args.weight_decay
drop_p = args.dropout
case = args.case
#assert torch.cuda.is_available()
outfolder = 'final_net'
outfile = f'cnn_{"_".join(sys.argv[1:]).replace("=","_")}.pkl'.lower()
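# The output file name encodes the raw command-line arguments, so each
# hyperparameter combination gets its own pickle: e.g. the arguments
# '--num_hidden=2 --kernel_size=7' produce 'cnn_--num_hidden_2_--kernel_size_7.pkl'.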
if outfile in os.listdir(outfolder):
    print(f'File {outfile} already exists. Exiting.')
    sys.exit()
nn_type = 'cnn'
allocate_x_batch = allocate_x_batch_cnn
get_x_sequences = get_x_sequences_cnn
np.random.seed(2021)
x, x_time, y, y_time, time_dif, idx_offset = load_data(case)
# Index offset between start and end of training data for one single prediction
# i.e. number of quarters of an hour we wish to train on for each sample
good_idx = get_good_idx(x, y, idx_offset, pred_seq_len)[:-20000]
input_size = x.shape[1]
num_channels = input_size
out_size = 1
stride = 1
padding = kernel_size//2
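# Conv1d output length per layer: floor((L_in + 2*padding - kernel_size)/stride) + 1.
# With stride=1 and padding=kernel_size//2 this keeps the sequence length at
# pred_seq_len for odd kernel sizes (and pred_seq_len + 1 for even ones).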
conv_out_seq = round((pred_seq_len + 2*padding - kernel_size) / stride + 1)
# define network
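# The network stacks depthwise 1D convolutions: with groups=input_size and
# num_channels == input_size, each input feature is filtered by its own kernel
# and the channels are never mixed. A single fully connected layer then maps
# the flattened feature maps to one output value.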
class Net(nn.Module):
    def __init__(self):
        super(Net, self).__init__()
        self.conv_in = nn.Conv1d(in_channels=input_size,
                                 out_channels=num_channels,
                                 kernel_size=kernel_size,
                                 stride=stride,
                                 padding=padding,
                                 groups=input_size)
        self.hidden_list = nn.ModuleList()
        for i in range(num_hidden):
            self.hidden_list.append(nn.Conv1d(in_channels=num_channels,
                                              out_channels=num_channels,
                                              kernel_size=kernel_size,
                                              stride=stride,
                                              padding=padding,
                                              groups=input_size))
        self.l_out = nn.Linear(in_features=conv_out_seq * num_channels,
                               out_features=out_size,
                               bias=True)
        self.act = nn.ReLU()
        self.dropout = nn.Dropout(p=drop_p)

    def forward(self, x):
        x = self.conv_in(x)
        for hidden_layer in self.hidden_list:
            x = hidden_layer(x)
            x = self.dropout(x)
            x = self.act(x)
        x = x.reshape(-1, conv_out_seq * num_channels)
        x = self.dropout(x)
        x = self.act(x)
        x = self.l_out(x)
        return x
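# Expected shapes: the forward pass takes batches of shape
# (batch, input_size, pred_seq_len) and returns (batch, 1) predictions.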
# set training hyperparameters and batch/epoch sizes
batch_size = 1000
num_epochs = 80
k_fold_size = 1
if loss.lower() == 'mse':
    loss = nn.MSELoss()
elif loss.lower() == 'l1':
    loss = nn.L1Loss()
else:
    raise ValueError('unrecognized loss function')
optim_params = {'lr': 3e-3, 'weight_decay': weight_decay}
train_loss, valid_loss, net = train(nn_type, x, y, Net, optim_params, num_epochs, batch_size, good_idx, k_fold_size, idx_offset, pred_seq_len, loss, case)
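# The first validation-loss entry is converted from a squared error to its
# square root (an RMSE-style value), presumably for easier interpretation
# when the MSE loss is used.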
valid_loss[0] = np.sqrt(valid_loss[0])
#np.savez(os.path.join(outfolder, outfile), train_loss=train_loss, valid_loss=valid_loss)
with open(os.path.join(outfolder, outfile), 'wb') as outp:
    pickle.dump(net.to(torch.device('cpu')), outp, pickle.HIGHEST_PROTOCOL)
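# For reference, the saved network can later be restored with something like:
#   with open(os.path.join(outfolder, outfile), 'rb') as inp:
#       net = pickle.load(inp)
# (unpickling requires the Net class definition to be available, e.g. by
# running or importing this script first).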