@comment{
  Page text that preceded the entry in the original export, kept verbatim:

  Dataset Groups Activity Stream CREMA-D
  The CREMA-D dataset is an audio-visual dataset for emotion recognition task, each video in which consists of both facial and acoustic emotional expressions.
  BibTeX:

  Notes on the entry below:
  - The citation key is unchanged so existing citations keep resolving.
  - The title carries an extra pair of braces because the whole title is an
    acronym that sentence-casing styles would otherwise lowercase.
  - month uses the bare predefined macro so styles can expand and localise it.
  - keywords is a plain comma-separated list; the case variants from the
    source record are retained.
  - Authors are given as initials because the source record has no full
    given names.
  - The placeholder institution value "No Organization" from the source
    record was dropped because it carries no information.
}

@dataset{H_Cao_and_D_G_Cooper_and_M_K_Keutmann_and_R_C_Gur_and_A_Nenkova_and_R_Verma_2024,
  author    = {Cao, H. and Cooper, D. G. and Keutmann, M. K. and Gur, R. C. and Nenkova, A. and Verma, R.},
  title     = {{CREMA-D}},
  publisher = {TIB},
  year      = {2024},
  month     = dec,
  doi       = {10.57702/f3iwin68},
  url       = {https://service.tib.eu/ldmservice/dataset/crema-d},
  abstract  = {The CREMA-D dataset is an audio-visual dataset for emotion recognition task, each video in which consists of both facial and acoustic emotional expressions.},
  keywords  = {Audiovisual Speech, CREMA-D, Emotion Recognition, Emotional Speech, Multimodal, Multimodal Emotions, Speech, Speech Prosody, Speech Recognition, audio, audio-visual, emotion recognition, keyword spotting, language identification, speech, video},
}