@comment{ICIP 2024 conference paper. The title is stored in Title Case with the acronym brace-protected so that bibliography styles can recase it; the citation key is kept as exported so existing citations still resolve.}
@inproceedings{64e0a17ab2dc46f090f0ccd2abdb7539,
  author    = {He, Hongyuan and Wang, Daming and Hasan, {Md Rakibul} and Gedeon, Tom and Hossain, {Md Zakir}},
  title     = {{TCA-Net}: Triplet Concatenated-Attentional Network for Multimodal Engagement Estimation},
  booktitle = {2024 IEEE International Conference on Image Processing, ICIP 2024 - Proceedings},
  series    = {Proceedings - International Conference on Image Processing, ICIP},
  pages     = {2062--2068},
  publisher = {IEEE Computer Society},
  address   = {United States},
  year      = {2024},
  doi       = {10.1109/ICIP51287.2024.10647692},
  language  = {English},
  keywords  = {attention network, deep learning, Engagement estimation, human interaction, multimodal fusion},
  abstract  = {Human social interactions involve intricate social signals that artificial intelligence and machine learning models aim to decipher, particularly in the context of artificial mediators that can enhance human interactions across domains like education and healthcare. Engagement, a key aspect of these interactions, relies heavily on multimodal information like facial expressions, voice and posture. Recently, many deep learning methods have been deployed in engagement estimation. Still, they often focus on unimodality or bimodality, leading to the results lacking robustness and adaptability due to factors like noise and varying individual responses. To address this challenge, we introduce a novel modality fusion framework named Triplet Concatenated-Attentional Net (TCA-Net). This framework takes three distinct types of data modality (video, audio and Kinect) as inputs and delivers a prediction score as output. Within this network, a specially designed concatenated-attention fusion mechanism serves the purpose of modality fusion and preserves the intra-modal features. Experimental results validate the efficiency of our TCA-Net in enhancing the accuracy and reliability of engagement estimation across diverse scenarios, with a test set Concordance Correlation Coefficient (CCC) of 0.75. We release our code at https://github.com/Daming-W/Multimodal_Engagement_Estimation.},
  note      = {Publisher Copyright: {\textcopyright} 2024 IEEE. 31st IEEE International Conference on Image Processing, ICIP 2024; Conference date: 27-10-2024 through 30-10-2024},
}