two_labels.py

# -*- coding: utf-8 -*-
"""
Created on Sat Jan  4 11:19:08 2020

@author: Shreya
"""

from keras.models import Sequential
from keras.layers import Dense, LSTM, Embedding,Dropout
from keras.preprocessing import sequence
from keras.utils import to_categorical
import scipy.io as sio
import numpy as np
import os
import keras
from numpy import array
np.random.seed(1337)  # for reproducibility
from keras.models import Model
from keras.layers import Input
import keras.backend as K
import h5py

def ordering_loss(l,l_dash,ul,alpha):
    return K.maximum(ul-K.sum((alpha*l),((1-alpha)*l_dash)),0)

def triplet_loss(y_true, y_pred):
    """
    Implementation of the triplet loss function
    Arguments:
    y_true -- true labels, required when you define a loss in Keras, you don't need it in this function.
    y_pred -- python list containing three objects:
            anchor -- the encodings for the anchor data
            positive -- the encodings for the positive data (similar to anchor)
            negative -- the encodings for the negative data (different from anchor)
    Returns:
    loss -- real number, value of the loss
    """
    print('y_pred.shape = ',y_pred)
    
    total_length = y_pred.shape.as_list()[-1]-1
    print('total_length=',  total_length)
#     total_lenght =12
    
    anchor = y_pred[:,0:int(total_length*1/3)-1]
#    print(int(total_length*1/3-1))
    positive = y_pred[:,int(total_length*1/3):int(total_length*2/3)-1]
    negative = y_pred[:,int(total_length*2/3):int(total_length*3/3)-1]
    alpha = y_pred[:,total_length]
#    print(alpha)
    # distance between the anchor and the positive
    pos_dist = K.sum(K.square(anchor-positive),axis=1)

    # distance between the anchor and the negative
    neg_dist = K.sum(K.square(anchor-negative),axis=1)

    # compute loss
    basic_loss = pos_dist-neg_dist+alpha
    loss = K.maximum(basic_loss,0.0)
 
    return loss

def build_model():
    input_dim = 4096
    inputs_label = Input(shape=(input_dim,))
    inputs_unlabel = Input(shape=(input_dim,))
    inputs_label_dash = Input(shape=(input_dim,))
        
    x_inputs_label = Dense(512)(inputs_label)#(attention_mul)
    x_inputs_unlabel = Dense(512)(inputs_unlabel)
    x_inputs_label_dash = Dense(512)(inputs_label_dash)
    
    motion_1 = keras.layers.Subtract()([x_inputs_label, x_inputs_unlabel])
    motion_2 = keras.layers.Subtract()([x_inputs_label, x_inputs_unlabel])
    x = keras.layers.concatenate([x_inputs_unlabel,motion_1,motion_2], axis=-1)
#    # ATTENTION PART STARTS HERE
#    attention_probs = Dense(input_dim, activation='softmax', name='attention_vec')(inputs)
#    attention_mul = keras.layers.Multiply()([inputs, attention_probs])
#    # ATTENTION PART FINISHES HERE
#
#    attention_mul = Dense(64)(attention_mul)
    x = Dense(512)(x_inputs_label)#(attention_mul)
    x = Dense(512)(x)
    x = Dense(512)(x_inputs_label_dash)
    x = Dropout(0.4)(x)
    x = Dense(1024)(x)    
    x_embedding = Dense(4096,activation='sigmoid',name = 'x_embedding')(x)
    
    output_label = Dense(3, activation='sigmoid',name = 'Output_label')(x)
    output_label_dash = Dense(3, activation='sigmoid',name = 'Output_label_dash')(x)
    output_predicted_label = Dense(3, activation='sigmoid',name = 'output_predicted_label')(x)
    output_margin = Dense(1, activation='sigmoid')(x)
    merged_vector = keras.layers.concatenate([output_label, output_predicted_label, output_label_dash,output_margin], axis=-1, name='merged_layer')
    
    model = Model(input=[inputs_label,inputs_unlabel,inputs_label_dash], output=[x_embedding, output_label,output_label_dash,merged_vector])
    model.summary()

    losses ={'Output_label':'mean_squared_error',
              'Output_label_dash': 'mean_squared_error' , 
              'x_embedding': 'cosine_proximity',
              'merged_layer':triplet_loss }
    sgd = keras.optimizers.SGD(lr=0.01, decay=1e-6, momentum=0.9, nesterov=True)
    
   
    model.compile(
    optimizer=sgd,
    loss=losses,
    metrics=['acc'])
    
    return model

# =============================================================================
# data loading
# =============================================================================
file_list = os.listdir('./Dataset/data_triplets/')
count = 0
for file in file_list:
    print(file)
    filepath = './Dataset/data_triplets/'+ file
    
    with h5py.File(filepath, 'r') as hf:
        start_frames_l = hf['start_frames_l'][:]
        end_frames_l = hf['end_frames_l'][:]
        unlabelled_frames = hf['unlabelled_frames'][:]
        start_gaze_label = hf['start_gaze_label'][:]
        end_gaze_label = hf['end_gaze_label'][:]
    hf.close()    
    if count == 0:
        all_start_frames_l = start_frames_l
        all_end_frames_l = end_frames_l
        all_unlabelled_frames = unlabelled_frames
        all_start_gaze_label = start_gaze_label
        all_end_gaze_label = end_gaze_label        
        count = count + 1
        del start_frames_l,end_frames_l,unlabelled_frames,start_gaze_label,end_gaze_label
    else:
        all_start_frames_l = np.vstack((all_start_frames_l,start_frames_l))
        all_end_frames_l = np.vstack((all_end_frames_l,end_frames_l))
        all_unlabelled_frames = np.vstack((all_unlabelled_frames,unlabelled_frames))
        all_start_gaze_label = np.vstack((all_start_gaze_label,start_gaze_label))
        all_end_gaze_label = np.vstack((all_end_gaze_label,end_gaze_label))        
        count = count + 1
        del start_frames_l,end_frames_l,unlabelled_frames,start_gaze_label,end_gaze_label
#normalize data
Y_start_gaze_label=np.zeros([len(all_start_gaze_label),3])
Y_start_gaze_label[:,0] = (all_start_gaze_label[:,0]- np.ones(len(all_start_gaze_label[:,0]))*
                  min(all_start_gaze_label[:,0]))/(np.ones(len(all_start_gaze_label[:,0]))*
                     max(all_start_gaze_label[:,0])-np.ones(len(all_start_gaze_label[:,0]))*
                     min(all_start_gaze_label[:,0]))
Y_start_gaze_label[:,1] = (all_start_gaze_label[:,1]- np.ones(len(all_start_gaze_label[:,1]))*
                  min(all_start_gaze_label[:,1]))/(np.ones(len(all_start_gaze_label[:,1]))*
                     max(all_start_gaze_label[:,1])-np.ones(len(all_start_gaze_label[:,1]))*
                     min(all_start_gaze_label[:,1]))
Y_start_gaze_label[:,2] = (all_start_gaze_label[:,2]- np.ones(len(all_start_gaze_label[:,2]))*
                  min(all_start_gaze_label[:,2]))/(np.ones(len(all_start_gaze_label[:,2]))*
                     max(all_start_gaze_label[:,2])-np.ones(len(all_start_gaze_label[:,2]))*
                     min(all_start_gaze_label[:,2]))

Y_end_gaze_label=np.zeros([len(all_end_gaze_label),3])
Y_end_gaze_label[:,0] = (all_end_gaze_label[:,0]- np.ones(len(all_end_gaze_label[:,0]))*
                  min(all_end_gaze_label[:,0]))/(np.ones(len(all_end_gaze_label[:,0]))*
                     max(all_end_gaze_label[:,0])-np.ones(len(all_end_gaze_label[:,0]))*
                     min(all_end_gaze_label[:,0]))
Y_end_gaze_label[:,1] = (all_end_gaze_label[:,1]- np.ones(len(all_end_gaze_label[:,1]))*
                  min(all_end_gaze_label[:,1]))/(np.ones(len(all_end_gaze_label[:,1]))*
                     max(all_end_gaze_label[:,1])-np.ones(len(all_end_gaze_label[:,1]))*
                     min(all_end_gaze_label[:,1]))
Y_end_gaze_label[:,2] = (all_end_gaze_label[:,2]- np.ones(len(all_end_gaze_label[:,2]))*
                  min(all_end_gaze_label[:,2]))/(np.ones(len(all_end_gaze_label[:,2]))*
                     max(all_end_gaze_label[:,2])-np.ones(len(all_end_gaze_label[:,2]))*
                     min(all_end_gaze_label[:,2]))

del all_end_gaze_label,all_start_gaze_label
# =============================================================================
#   model training      
# =============================================================================
model = build_model()
checkpoint = keras.callbacks.ModelCheckpoint('./models/best_weights.h5', monitor='loss', 
                                             save_best_only=True,
                                              verbose=1,mode='min')

history = model.fit(
    [all_start_frames_l,all_end_frames_l,all_unlabelled_frames],
    [all_unlabelled_frames,Y_start_gaze_label,Y_end_gaze_label,all_unlabelled_frames],
    epochs=50,
    batch_size=32,callbacks=[checkpoint])

model.load_weights('./models/best_weights.h5')
model.save('./models/video_eyegaze_sgd0.01_normalizedlabel.h5')

# =============================================================================
# Plot curve
# =============================================================================

from matplotlib import pyplot as plt
#acc = history.history['acc']
#val_acc = history.history['val_acc']
loss = history.history['loss']
#val_loss = history.history['val_loss']

epochs = range(1, len(loss) + 1)

plt.plot(epochs, loss, 'b', label='loss')
#plt.plot(epochs, val_acc, 'b', label='Validation acc')
plt.title('loss')
plt.legend()

#    plt.plot(epochs, loss, 'bo', label='Training loss')
#    plt.plot(epochs, val_loss, 'b', label='Validation loss')
#    plt.title('Training and validation loss')
#plt.legend()

plt.show()
plt.savefig('./models/video_eyegaze_sgd0.01_normalizedlabel.png')