This is the latest code for the paper.
commit 1b67041
Showing 4 changed files with 694 additions and 0 deletions.
First changed file (a UCF11 video preprocessing script; the filename was not captured):

@@ -0,0 +1,122 @@
import os
import numpy as np
import pickle
import cv2

# Keras utilities for padding and one-hot label encoding
from keras.preprocessing.sequence import pad_sequences
from keras.utils.np_utils import to_categorical


GLOBAL_MAX_LEN = 1492  # maximum number of frames over all UCF11 clips


def get_clips(class_name):
    # collect the paths of every clip in one UCF11 class directory
    files = os.listdir(data_path + class_name)
    files.sort()
    clip_list = []
    for this_file in files:
        if '.DS_Store' not in this_file and 'Annotation' not in this_file:
            clips = os.listdir(data_path + class_name + '/' + this_file)
            clips.sort()
            for this_clip in clips:
                if '.DS_Store' not in this_clip and 'Annotation' not in this_clip:
                    clip_list.append(data_path + class_name + '/' + this_file + '/' + this_clip)
    return clip_list


def load_data(inds, mode='train'):
    # load pickled clips into a zero-padded int8 tensor
    # (kept from the training pipeline; not called by the loop below)
    N = len(inds)
    X = np.zeros((N, GLOBAL_MAX_LEN, 120*160*3), dtype='int8')
    data_set = train_set if mode == 'train' else test_set
    for i in range(N):
        read_in = open(data_set[0][inds[i]], 'rb')  # pickles must be opened in binary mode
        this_clip = pickle.load(read_in)[0]  # of shape (nb_frames, 120, 160, 3)
        read_in.close()
        # flatten the dimensions 1, 2 and 3
        this_clip = this_clip.reshape(this_clip.shape[0], -1)  # of shape (nb_frames, 120*160*3)
        this_clip = (this_clip - 128.).astype('int8')  # roughly centre the pixel values
        X[i] = pad_sequences([this_clip], maxlen=GLOBAL_MAX_LEN, truncating='post', dtype='int8')[0]
    Y = data_set[1][inds]
    return [X, Y]


# Load the data --------------------------------------------------------------------------------------------------------
np.random.seed(11111986)

# Settings:

CV_setting = 0  # [0, 1, 2, 3, 4]
model_type = 1  # 0 for GRU, 1 for LSTM
use_TT = 0      # 0 for non-TT, 1 for TT

# Had to remove due to anonymity
data_path = './UCF11_updated_mpg/'
write_out_path = ''

classes = ['basketball', 'biking', 'diving', 'golf_swing', 'horse_riding', 'soccer_juggling',
           'swing', 'tennis_swing', 'trampoline_jumping', 'volleyball_spiking', 'walking']

clips = [None]*11
labels = [None]*11
sizes = np.zeros(11, dtype=int)  # integer counts, so np.repeat accepts them
for k in range(11):
    this_clip = get_clips(classes[k])
    clips[k] = this_clip
    sizes[k] = len(this_clip)
    labels[k] = np.repeat([k], sizes[k])

# flatten both lists
clips = np.array([item for sublist in clips for item in sublist])
labels = np.array([item for sublist in labels for item in sublist])
labels = to_categorical(labels)

shuffle_inds = np.random.choice(range(len(clips)), len(clips), False)
totalclips = clips[shuffle_inds]
totallabels = labels[shuffle_inds]

if not os.path.exists('processed_data'):
    os.makedirs('processed_data')  # np.save below expects this directory to exist

# iterate through the clips in batches of 40, storing each resized clip and its length:
for xj in range(40):
    clips = totalclips[xj*40:xj*40+40]
    labels = totallabels[xj*40:xj*40+40]
    data = []
    length_of_frames = []
    for l in range(len(clips)):
        print(clips[l])
        cap = cv2.VideoCapture(clips[l])
        ret = True
        tempdata = []
        count = 0
        while ret:
            ret, frame = cap.read()
            if ret:
                count = count + 1
                # cv2.imshow('frame', frame); cv2.waitKey(1)  # optional preview
                frame = cv2.resize(frame, (160, 120))
                tempdata.append(frame)
        cap.release()
        length_of_frames.append(count)

        # pad every clip to the global maximum length (left disabled):
        # for i in range(count, GLOBAL_MAX_LEN):
        #     tempdata.append(tempdata[count-1])

        tempdata = np.asarray(tempdata, dtype=np.float32) / 255.  # scale pixels to [0, 1]
        data.append(tempdata)
    length_of_frames = np.asarray(length_of_frames)
    data = np.asarray(data)  # clips differ in length, so this is a dtype=object array
    np.save('processed_data/data' + str(xj) + '.npy', data)
    np.save('processed_data/label' + str(xj) + '.npy', labels)
    np.save('processed_data/length' + str(xj) + '.npy', length_of_frames)
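Because the clips in a batch have different frame counts, np.asarray(data) yields a one-dimensional dtype=object array holding one (nb_frames, 120, 160, 3) float32 tensor per clip. The following is a minimal sanity check of one saved batch (a sketch, not part of the commit); note that recent NumPy releases require allow_pickle=True when loading object arrays:

import numpy as np

batch = np.load('processed_data/data0.npy', allow_pickle=True)  # (40,) object array of clips
labels = np.load('processed_data/label0.npy')                   # (40, 11) one-hot labels
lengths = np.load('processed_data/length0.npy')                 # frame count of each clip

print(batch.shape, batch.dtype)  # (40,) object
print(batch[0].shape)            # (nb_frames, 120, 160, 3)
print(labels.shape, lengths[:5])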
Second changed file (the TensorFlow training script; the filename was not captured):

@@ -0,0 +1,200 @@
from __future__ import print_function

import tensorflow as tf
import numpy as np
import pdb
import math
import time
from sklearn.model_selection import KFold

from matrixcell import MatrixRNNCell, CNNRNNCell, Chol_de

from readdata import read_data


def get_a_cell():
    return MatrixRNNCell(alpha=a, batch_size=batch_size, matrix_size=matrix_size, eps=eps)


# Hyperparameters ------------------------------------------------------------
batch_size = 40
height = 120
width = 160
in_channel = 3
out_channel = 7
tot_time_points = 50  # frames kept per clip after temporal sampling
class_num = 11        # UCF11 action classes
matrix_size = out_channel + 1
epoch_num = 1000
depth = 5             # number of stacked matrix RNN cells on top of the CNN-RNN cell

CNN_kernel_shape = [[7, 7, 5], [7, 7, out_channel]]
CNN_num_layer = len(CNN_kernel_shape)

# each CNN layer pools the spatial grid by a factor of 4: 120*160 // 4**2 = 1200
reduced_spatial_dim = height * width // (4 ** CNN_num_layer)
beta = 0.3

eps = 1e-10
n = matrix_size
a = [0.01, 0.25, 0.5, 0.9, 0.99]  # alpha values passed to every cell
a_num = len(a)

sample_rate = 3  # keep every 3rd frame

lr = 0.9
decay_steps = 1000
decay_rate = 0.99

matrix_length = tot_time_points
global_steps = tf.Variable(0, trainable=False)
learning_rate = tf.train.exponential_decay(lr, global_step=global_steps,
                                           decay_steps=decay_steps, decay_rate=decay_rate)
add_global = global_steps.assign_add(1)


# Build the graph ------------------------------------------------------------
X = tf.placeholder(np.float32, shape=(batch_size, matrix_length, height, width, in_channel))
y = tf.placeholder(np.float32, shape=(batch_size, class_num))

keep_prob = tf.placeholder(tf.float32)

# final fully connected classifier on the n(n+1)/2 Cholesky coefficients
W2_1 = tf.Variable(tf.random_normal([n*(n+1)//2, class_num],
                                    stddev=np.sqrt(2. / (class_num * n * (n+1) // 2))))
b2_1 = tf.Variable(tf.random_normal([1, class_num], stddev=np.sqrt(2. / class_num)))

initMt = tf.placeholder(np.float32, [batch_size, a_num*n*n])

tf.keras.backend.set_learning_phase(True)

# one CNN-RNN cell in front, followed by `depth` stacked matrix RNN cells
CNNRNNcell = [CNNRNNCell(alpha=a, num_layer=CNN_num_layer, kernel_shape=CNN_kernel_shape,
                         batch_size=batch_size, matrix_size=matrix_size,
                         in_channel=in_channel, out_channel=out_channel,
                         reduced_spatial_dim=reduced_spatial_dim, beta=beta,
                         keep_prob=keep_prob, eps=eps)]

for i in range(depth):
    CNNRNNcell.append(get_a_cell())

cells = tf.nn.rnn_cell.MultiRNNCell(CNNRNNcell)

initial_state = tuple([initMt for _ in range(depth + 1)])

outputs, state = tf.nn.dynamic_rnn(cells, X, initial_state=initial_state, dtype=np.float32)

# keep only the state matrix of the last time step
outputs = tf.slice(outputs, [0, matrix_length - 1, 0], [-1, 1, -1])
outputs = tf.reshape(outputs, [batch_size, n, n])

output_series = Chol_de(outputs, n, batch_size)

output_series = tf.keras.layers.BatchNormalization()(output_series)

output_series = tf.nn.dropout(output_series, keep_prob)

predict_label = tf.add(tf.matmul(output_series, W2_1), b2_1)

loss = tf.reduce_mean(tf.nn.softmax_cross_entropy_with_logits(
    logits=predict_label,
    labels=y
))

correct_prediction = tf.equal(tf.argmax(predict_label, 1), tf.argmax(y, 1))
accuracy = tf.reduce_mean(tf.cast(correct_prediction, tf.float32))

with tf.control_dependencies([add_global]):
    opt = tf.train.AdadeltaOptimizer(learning_rate)
    train_step = opt.minimize(loss)


# Training with 10-fold cross-validation over the 40 preprocessed batches ----
batch_num = 40

init_state = np.reshape(np.tile(np.eye(n) * 1e-5, [batch_size, a_num, 1, 1]),
                        [batch_size, a_num*n*n])

batch_num_idx = range(batch_num)
k_fold = KFold(n_splits=10)
final_acc_fold = np.zeros((10, 1))

data = []
label = []

for idx in range(batch_num):
    print(idx)
    data_batch_in, label_batch_in = read_data(idx, 'the_path_of_your_UCF11', matrix_length, sample_rate)
    data.append(data_batch_in)
    label.append(label_batch_in)

with tf.Session() as sess:
    final_acc = 0.
    co = 0
    for tr_indices, ts_indices in k_fold.split(batch_num_idx):
        sess.run(tf.global_variables_initializer())
        # total number of trainable parameters
        print(np.sum([np.prod(v.get_shape().as_list()) for v in tf.trainable_variables()]))
        for epoch in range(epoch_num):
            start_time = time.time()
            train_acc = 0.
            train_loss = 0.
            for batch_idx in tr_indices:
                data_batch_in = data[batch_idx]
                label_batch_in = label[batch_idx]
                _, loss_, acc_ = sess.run([train_step, loss, accuracy],
                                          feed_dict={
                                              X: data_batch_in,
                                              y: label_batch_in,
                                              initMt: init_state,
                                              keep_prob: 0.75,
                                          })

                if math.isnan(loss_):
                    pdb.set_trace()  # drop into the debugger if the loss diverges
                else:
                    train_acc = train_acc + acc_
                    train_loss = train_loss + loss_
            train_acc = train_acc / len(tr_indices)
            train_loss = train_loss / len(tr_indices)
            print('Train Accuracy is : ', train_acc, ' in Epoch : ', epoch)
            print('Train Loss is : ', train_loss)
            print('Time per epoch : ', time.time() - start_time)

            # monitor the held-out batches of this fold after every epoch
            test_acc = 0
            for batch_idx in ts_indices:
                data_batch_in = data[batch_idx]
                label_batch_in = label[batch_idx]
                loss_, acc_ = sess.run([loss, accuracy],
                                       feed_dict={
                                           X: data_batch_in,
                                           y: label_batch_in,
                                           initMt: init_state,
                                           keep_prob: 1.,
                                       })
                test_acc = test_acc + acc_
            test_acc = test_acc / len(ts_indices)
            print('Test Accuracy is : ', test_acc)
            print(' ')

        # final test accuracy of this fold
        final_acc_fold[co] = 0.
        for batch_idx in ts_indices:
            data_batch_in = data[batch_idx]
            label_batch_in = label[batch_idx]
            loss_, acc_ = sess.run([loss, accuracy],
                                   feed_dict={
                                       X: data_batch_in,
                                       y: label_batch_in,
                                       initMt: init_state,
                                       keep_prob: 1.,
                                   })
            final_acc_fold[co] = final_acc_fold[co] + 1.0 * acc_ / len(ts_indices)
            print(loss_, acc_)
        print('After kth fold', final_acc_fold[co])
        final_acc = final_acc + final_acc_fold[co] * 1.0 / 10
        co += 1

print(final_acc)
np.save('final_result.npy', final_acc_fold)
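The other two changed files, presumably matrixcell.py and readdata.py, did not load in this capture, so only their call sites are visible. Below is a minimal sketch of the read_data interface this script assumes, inferred solely from the call above and from the arrays the preprocessing script saves; the authors' actual implementation may differ, and in particular the zero-padding of clips shorter than matrix_length * sample_rate frames is an assumption:

import numpy as np

def read_data(idx, path, matrix_length, sample_rate):
    # Hypothetical loader matching the call site above: returns one batch of
    # (40, matrix_length, 120, 160, 3) float32 frames and (40, 11) one-hot
    # labels, i.e. the shapes expected by the placeholders X and y.
    clips = np.load(path + '/data' + str(idx) + '.npy', allow_pickle=True)
    labels = np.load(path + '/label' + str(idx) + '.npy')
    batch = np.zeros((len(clips), matrix_length) + clips[0].shape[1:], dtype=np.float32)
    for i, clip in enumerate(clips):
        clip = clip[::sample_rate][:matrix_length]  # keep every sample_rate-th frame
        batch[i, :len(clip)] = clip                 # zero-pad short clips (assumption)
    return batch, labels

Likewise, the call sites imply that MatrixRNNCell and CNNRNNCell are RNNCell subclasses whose flattened per-layer state has size a_num * n * n (matching the initMt placeholder), and that Chol_de maps the final n x n state matrix to its n(n+1)/2 Cholesky coefficients (matching the input dimension of W2_1); their internals are not reproduced here.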