@Article{cmes.2026.079697,
AUTHOR = {Mustaqeem Khan, Ufaq Khan, Mamoun Awad, Nazar Zaki, Guiyoung Son, Soonil Kwon},
TITLE = {Real-Time Emotion Recognition System Using Adaptive Distillation Technique},
JOURNAL = {Computer Modeling in Engineering \& Sciences},
VOLUME = {147},
YEAR = {2026},
NUMBER = {1},
PAGES = {0--0},
URL = {http://www.techscience.com/CMES/v147n1/67146},
ISSN = {1526-1506},
ABSTRACT = {Knowledge distillation has shown impressive results in different fields, including detection, recognition, and generation. These models are excellent at tasks such as speech recognition, but they need to be shrunk down using adaptive knowledge distillation (<i>AKD</i>). The use of <i>AKD</i> can improve human-computer interactions and streamline data collection in the field of Speech Emotion Recognition (<i>SER</i>). This study presents a high-level approach that employs a novel adaptive knowledge distillation (<i>AKD</i>) with spatio-temporal transformers to acquire advanced semantic features from the input signal. This method uses an instance-by-instance correlation between the teacher and a student to determine the teacher’s importance. Additionally, this work proposes a knowledge-transfer strategy to integrate soft targets between teachers and students, aiming to provide deeper insight for the final prediction. Our light-weight model <i>AKD</i> is an efficient solution for edge devices and learns the synergistic information for respective tasks, as discussed in the results and analysis section. Our proposed model <i>AKD</i> outperforms the <i>SOTA</i> models of SER systems on the benchmark datasets, IEMOCAP, EmoDB, and RAVDESS, with an absolute gain of 4%–6% in overall recognition rate.},
DOI = {10.32604/cmes.2026.079697}
}