# train_lstm.py

# -*- coding: utf-8 -*-
"""Train_LSTM.ipynb
**
 * This file is part of Hybrid CNN-LSTM for COVID-19 Severity Score Prediction paper.
 *
 * Written by Ankan Ghosh Dastider and Farhan Sadik.
 *
 * Copyright (c) by the authors under Apache-2.0 License. Some rights reserved, see LICENSE.
 */

"""

# Build the frame table: for every video folder, list its frames in sorted
# order and keep NUM_FRAMES of them at evenly spaced positions.
video_types = ['Video 01', 'Video 05', 'Video 06', 'Video 07', 'Video 08', 'Video 09', 'Video 10', 'Video 14',
               'Video 15', 'Video 16', 'Video 17', 'Video 20', 'Video 21', 'Video 27', 'Video 29']

NUM_VIDEOS = len(video_types)
NUM_FRAMES = 302  # frames kept per video

data_dir_lstm = ''  # Link Training Directory videowise
train_dir_lstm = os.path.join(data_dir_lstm)

train_data_lstm = []
for folder_id, video_name in enumerate(video_types):
    video_dir = os.path.join(train_dir_lstm, video_name)
    # One row per frame: relative path, folder index, folder name.
    rows = [['{}/{}'.format(video_name, frame_name), folder_id, video_name]
            for frame_name in sorted(os.listdir(video_dir))]

    # Integer positions spread from the first to the last frame; a folder with
    # fewer than NUM_FRAMES frames therefore repeats some positions.
    picks = np.linspace(start=0, stop=len(rows) - 1, num=NUM_FRAMES, dtype=int)
    train_data_lstm.extend(rows[pos] for pos in picks)

train_on_lstm = pd.DataFrame(train_data_lstm, columns=['File', 'FolderID', 'Video Type'])
train_on_lstm.head(NUM_VIDEOS*NUM_FRAMES)

# List every frame of every video folder (no sub-sampling).
# NOTE(review): this rebuilds train_data_lstm / train_on_lstm from scratch and
# so replaces the NUM_FRAMES-per-video table built in the section above. The
# loading loop further down assigns rows to videos in chunks of NUM_FRAMES, so
# if a folder does not hold exactly NUM_FRAMES frames the chunks will not line
# up with video boundaries. Confirm which of the two tables is intended.
video_types = ['Video 01', 'Video 05', 'Video 06', 'Video 07', 'Video 08', 'Video 09', 'Video 10', 'Video 14',
               'Video 15', 'Video 16', 'Video 17', 'Video 20', 'Video 21', 'Video 27', 'Video 29']

data_dir_lstm = ''  # Link Training Directory videowise
train_dir_lstm = os.path.join(data_dir_lstm)

train_data_lstm = []
for folder_id, video_name in enumerate(video_types):
    video_dir = os.path.join(train_dir_lstm, video_name)
    # One row per frame: relative path, folder index, folder name.
    train_data_lstm.extend(
        ['{}/{}'.format(video_name, frame_name), folder_id, video_name]
        for frame_name in sorted(os.listdir(video_dir))
    )

train_on_lstm = pd.DataFrame(train_data_lstm, columns=['File', 'FolderID', 'Video Type'])
train_on_lstm.head()

# Training hyper-parameters for the LSTM stage.
EPOCHS_LSTM = 120
BATCH_SIZE_LSTM = 25

# Frames are resized to IMAGE_SIZE x IMAGE_SIZE before feature extraction.
IMAGE_SIZE = 128

# Seed passed to the train/validation split.
SEED = 42

def read_image_lstm(filepath):
    """Read one frame from disk with OpenCV's default (colour) flag.

    `filepath` is taken relative to the module-level `data_dir_lstm`. The
    value produced by `cv2.imread` is returned unchanged; the loading loop in
    this file checks it against None before using it.
    """
    full_path = os.path.join(data_dir_lstm, filepath)
    return cv2.imread(full_path)

# Resize image to target size
def resize_image(newimage, image_size):
    """Return `newimage` resized to `image_size` using INTER_AREA interpolation.

    `image_size` is forwarded to `cv2.resize` as its size argument. The resize
    runs on a copy of `newimage`.
    """
    working_copy = newimage.copy()
    return cv2.resize(working_copy, image_size, interpolation=cv2.INTER_AREA)

from tensorflow.keras.models import load_model
import re
from keras import backend as K

# Fill the image and label tensors, one slot per (video, frame).
# Rows of train_on_lstm are consumed in order and assigned to videos in
# consecutive chunks of NUM_FRAMES.
X_Train_Total = np.zeros((NUM_VIDEOS, NUM_FRAMES, IMAGE_SIZE, IMAGE_SIZE, 3))
Y_Train_Total = np.zeros((NUM_VIDEOS, NUM_FRAMES, 1))

# The severity score is the single digit following "Score" in the file path.
# Compiled once, as a raw string so that \d is not an invalid escape sequence.
score_pattern = re.compile(r'Score(\d)')

for i, file in tqdm(enumerate(train_on_lstm['File'].values)):
    # k = video slot, j = frame slot inside that video.
    k, j = divmod(i, NUM_FRAMES)
    if k == NUM_VIDEOS:
        # Every slot is filled; any remaining rows are ignored.
        break

    newimage = read_image_lstm(file)
    if newimage is None:
        # NOTE(review): an unreadable frame keeps its all-zero image and a
        # label of 0 -- confirm that silently skipping is acceptable.
        continue

    match = score_pattern.search(file)
    if match is None:
        # Fail with a clear message instead of an AttributeError on None.
        raise ValueError('No "Score<digit>" label found in file name: {}'.format(file))

    X_Train_Total[k, j] = resize_image(newimage, (IMAGE_SIZE, IMAGE_SIZE))
    Y_Train_Total[k, j] = int(match.group(1))

# One-hot encode the per-frame scores into 4 classes.
Y_Train_Total = to_categorical(Y_Train_Total, num_classes=4)

# Normalize the data
X_Train_Total = X_Train_Total / 255.
print('X_Train_Total Shape: {}'.format(X_Train_Total.shape))
print('Y_Train_Total Shape: {}'.format(Y_Train_Total.shape))

# Shuffle both arrays in place along their first axis. The generator is
# re-seeded with the same value before each shuffle so that the images and
# the labels receive the same ordering.
for array_to_shuffle in (X_Train_Total, Y_Train_Total):
    np.random.seed(42)
    np.random.shuffle(array_to_shuffle)

print('X_Train_Total Shape: {}'.format(X_Train_Total.shape))
print('Y_Train_Total Shape: {}'.format(Y_Train_Total.shape))

# Replace every frame by the activations of an intermediate layer of the
# pre-trained CNN; these per-frame feature vectors are the LSTM's input.
model = load_model('')  # Link the CNN weights
model.summary()

# Buffer for the extracted features: 64 values per frame.
output = np.zeros((NUM_VIDEOS, NUM_FRAMES, 64))

# Build the backend function once (it does not depend on the video): it maps
# the CNN's input to the output of the layer named 'dropout_35'.
# NOTE(review): confirm that this layer yields 64 features per frame and that
# the function runs in inference mode, so the dropout layer is inactive.
specific_layer_output = K.function([model.layers[0].input], [model.get_layer('dropout_35').output])

for i in range(NUM_VIDEOS):
    # All frames of video i go through the CNN as a single batch.
    output[i] = specific_layer_output([X_Train_Total[i]])[0]

print('Output from CNN Shape: {}'.format(output.shape))

# From here on the training inputs are the CNN features, not raw images.
# Y_Train_Total is left unchanged.
X_Train_Total = output

print('X_Train_Total Shape: {}'.format(X_Train_Total.shape))
print('Y_Train_Total Shape: {}'.format(Y_Train_Total.shape))

# Split the train and validation sets: 20% of the entries along the first
# (video) axis are held out, with a fixed seed for reproducibility.
lstm_split = train_test_split(
    X_Train_Total,
    Y_Train_Total,
    test_size=0.2,
    random_state=SEED,
)
X_Train_LSTM, X_Val_LSTM, Y_Train_LSTM, Y_Val_LSTM = lstm_split

from keras.layers import Reshape, LSTM, Lambda, TimeDistributed, Conv1D, MaxPool1D, Dense, Dropout, Flatten, Conv2D, MaxPool2D, BatchNormalization, AveragePooling2D, GlobalAveragePooling2D


def build_lstm():
    """Build and compile the LSTM model that scores every frame of a sequence.

    The network takes a sequence of NUM_FRAMES feature vectors of length 64
    and passes it through three stacked LSTM layers (1000, 1000 and 4 units),
    with dropout of 0.5 after each of the first two. All LSTM layers return
    the full sequence, so the final softmax Dense layer emits a 4-way
    prediction per frame.

    Returns:
        The compiled Keras model (categorical cross-entropy loss, Adam
        optimizer, accuracy metric). Its summary is printed as a side effect.
    """
    # Named `inputs` rather than `input` so the builtin is not shadowed.
    inputs = Input(shape=(NUM_FRAMES, 64))

    x = LSTM(1000, return_sequences=True)(inputs)
    x = Dropout(0.5)(x)

    x = LSTM(1000, return_sequences=True)(x)
    x = Dropout(0.5)(x)

    x = LSTM(4, return_sequences=True)(x)

    # Per-frame class probabilities over the 4 scores.
    outputs = Dense(4, activation='softmax', name='root')(x)

    lstm_model = Model(inputs, outputs)

    # `learning_rate` replaces the deprecated `lr` keyword, and the
    # default-valued, deprecated `decay=0.0` is omitted; recent Keras releases
    # reject both old keywords.
    # NOTE(review): epsilon=0.1 is far larger than the usual Adam default --
    # confirm that it is deliberate.
    optimizer = Adam(learning_rate=0.002, beta_1=0.9, beta_2=0.999, epsilon=0.1)
    lstm_model.compile(loss='categorical_crossentropy', optimizer=optimizer, metrics=['accuracy'])
    lstm_model.summary()

    return lstm_model

model_lstm = build_lstm()

# Halve the learning rate when validation accuracy has not improved for 5
# epochs, but never go below 1e-3.
annealer = ReduceLROnPlateau(
    monitor='val_accuracy',
    factor=0.5,
    patience=5,
    verbose=1,
    min_lr=1e-3,
)

# Keep only the best model seen so far on disk; the monitored quantity is left
# at the Keras default.
checkpoint = ModelCheckpoint('model_lstm.h5', verbose=1, save_best_only=True)

# The inputs are CNN feature sequences, so no image augmentation is applied at
# this stage; the model is fitted directly on the in-memory arrays.
fit_options = dict(
    batch_size=BATCH_SIZE_LSTM,
    epochs=EPOCHS_LSTM,
    verbose=2,
    callbacks=[annealer, checkpoint],
    validation_data=(X_Val_LSTM, Y_Val_LSTM),
)
hist = model_lstm.fit(X_Train_LSTM, Y_Train_LSTM, **fit_options)

# Loss and accuracy on the validation set, using the weights currently held by
# model_lstm (the checkpoint file is not reloaded here).
validation_metrics = model_lstm.evaluate(X_Val_LSTM, Y_Val_LSTM)
final_loss_lstm, final_accuracy_lstm = validation_metrics
print('Final Loss LSTM: {}, Final Accuracy LSTM: {}'.format(final_loss_lstm, final_accuracy_lstm))

# Frame-level confusion matrix on the validation set.
score_types = ['Score 0', 'Score 1', 'Score 2', 'Score 3']

# Collapse the class axis with argmax, then flatten (video, frame) into one
# axis so that every validation frame counts as one sample.
Y_pred_lstm = model_lstm.predict(X_Val_LSTM)
Y_pred_lstm = np.argmax(Y_pred_lstm, axis=-1).ravel()

Y_true_lstm = np.argmax(Y_Val_LSTM, axis=-1).ravel()

# Pass the full label set explicitly: without it the matrix shrinks whenever a
# score is absent from the validation frames, and the rows/columns would no
# longer line up with the four tick labels.
cm = confusion_matrix(Y_true_lstm, Y_pred_lstm, labels=list(range(len(score_types))))

plt.figure(figsize=(12, 12))
# fmt='d' prints the integer counts as-is; the default format would show
# counts of 100 or more in scientific notation.
ax = sns.heatmap(cm, cmap=plt.cm.Greens, annot=True, fmt='d', square=True,
                 xticklabels=score_types, yticklabels=score_types)
ax.set_ylabel('Actual', fontsize=40)
ax.set_xlabel('Predicted', fontsize=40)

'''
# accuracy plot 
plt.plot(hist.history['accuracy'])
plt.plot(hist.history['val_accuracy'])
plt.title('model accuracy')
plt.ylabel('accuracy')
plt.xlabel('epoch')
plt.legend(['train', 'test'], loc='upper left')
plt.show()

# loss plot
plt.plot(hist.history['loss'])
plt.plot(hist.history['val_loss'])
plt.title('model loss')
plt.ylabel('loss')
plt.xlabel('epoch')
plt.legend(['train', 'test'], loc='upper left')
plt.show()
'''