
% Journal article entry. Authors are separated with " and " (BibTeX's only
% name separator) and given in "Last, First" form; case-sensitive tokens in
% the title are brace-protected; "%" in the abstract is escaped as "\%".
@article{jai.2024.048911,
  author   = {Shiri, Farhad Mortezapour and Ahmadi, Ehsan and Rezaee, Mohammadreza and Perumal, Thinagaran},
  title    = {Detection of Student Engagement in E-Learning Environments Using {EfficientnetV2-L} Together with {RNN}-Based Models},
  journal  = {Journal on Artificial Intelligence},
  volume   = {6},
  number   = {1},
  pages    = {85--103},
  year     = {2024},
  issn     = {2579-003X},
  doi      = {10.32604/jai.2024.048911},
  url      = {http://www.techscience.com/jai/v6n1/56239},
  abstract = {Automatic detection of student engagement levels from videos, which is a spatio-temporal classification problem is crucial for enhancing the quality of online education. This paper addresses this challenge by proposing four novel hybrid end-to-end deep learning models designed for the automatic detection of student engagement levels in e-learning videos. The evaluation of these models utilizes the DAiSEE dataset, a public repository capturing student affective states in e-learning scenarios. The initial model integrates EfficientNetV2-L with Gated Recurrent Unit (GRU) and attains an accuracy of 61.45\%. Subsequently, the second model combines EfficientNetV2-L with bidirectional GRU (Bi-GRU), yielding an accuracy of 61.56\%. The third and fourth models leverage a fusion of EfficientNetV2-L with Long Short-Term Memory (LSTM) and bidirectional LSTM (Bi-LSTM), achieving accuracies of 62.11\% and 61.67\%, respectively. Our findings demonstrate the viability of these models in effectively discerning student engagement levels, with the EfficientNetV2-L+LSTM model emerging as the most proficient, reaching an accuracy of 62.11\%. This study underscores the potential of hybrid spatio-temporal networks in automating the detection of student engagement, thereby contributing to advancements in online education quality.},
}



