<?xml version="1.0" encoding="UTF-8"?>
<doi_batch version="4.3.0" xmlns="http://www.crossref.org/doi_resources_schema/4.3.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.crossref.org/doi_resources_schema/4.3.0 http://www.crossref.org/schema/deposit/doi_resources4.3.0.xsd">
<head>
<doi_batch_id>96f0bc5d-82a5-46ec-a033-425a1cc8ae07</doi_batch_id>
<depositor>
<name>beie</name>
<email_address>director@blueeyesintelligence.org</email_address>
</depositor>
</head>
<body>
<doi_citations>
<doi>10.35940/ijitee.J9968.13100924</doi>
<citation_list><citation key="ref0"><doi>10.1007/s10772-018-9491-z</doi><unstructured_citation>Swain, M.; Routray, A.; Kabisatpathy, P. Databases, features and classifiers for speech emotion recognition: A review. Int. J. Speech Technol. 2018, 21, 93-120.</unstructured_citation></citation><citation key="ref1"><doi>10.3390/e24091250</doi><unstructured_citation>Zong, Y.; Lian, H.; Chang, H.; Lu, C.; Tang, C. Adapting Multiple Distributions for Bridging Emotions from Different Speech Corpora. Entropy 2022, 24, 1250.</unstructured_citation></citation><citation key="ref2"><doi>10.1109/TAFFC.2020.2981446</doi><unstructured_citation>Li, S.; Deng, W. Deep facial expression recognition: A survey. IEEE Trans. Affect. Comput. 2020, 13, 1195-1215.</unstructured_citation></citation><citation key="ref3"><doi>10.3390/e25091246</doi><unstructured_citation>Yang, H.; Xie, L.; Pan, H.; Li, C.; Wang, Z.; Zhong, J. Multimodal Attention Dynamic Fusion Network for Facial Micro-Expression Recognition. Entropy 2023, 25, 1246.</unstructured_citation></citation><citation key="ref4"><doi>10.1145/3477495.3532064</doi><unstructured_citation>Zeng, J.; Liu, T.; Zhou, J. Tag-assisted Multimodal Sentiment Analysis under Uncertain Missing Modalities. In Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval, Madrid, Spain, 11-15 July 2022; pp. 1545-1554.</unstructured_citation></citation><citation key="ref5"><doi>10.1016/j.neucom.2022.06.072</doi><unstructured_citation>Shou, Y.; Meng, T.; Ai, W.; Yang, S.; Li, K. Conversational emotion recognition studies based on graph convolutional neural networks and a dependent syntactic analysis. Neurocomputing 2022, 501, 629-639.</unstructured_citation></citation><citation key="ref6"><doi>10.1109/CVPR52729.2023.00641</doi><unstructured_citation>Li, Y.; Wang, Y.; Cui, Z. Decoupled Multimodal Distilling for Emotion Recognition. In Proceedings of the IEEE/CVF Conference on Computer Vision and Pattern Recognition, Vancouver, BC, Canada, 17-24 June 2023; pp. 6631-6640.</unstructured_citation></citation><citation key="ref7"><journal_title>In Proceedings of the 10th annual Computing and Communication Workshop and Conference (CCWC) (pp</journal_title><author>Shirke</author><cYear>2020</cYear><doi>10.1109/ccwc47524.2020.9031124</doi><article_title>Brain-iot-based emotion recognition system</article_title><unstructured_citation>Shirke, B., Wong, J., Libut, J. C., George, K., &amp; Oh, S. J. (2020). Brain-iot-based emotion recognition system. In Proceedings of the 10th annual Computing and Communication Workshop and Conference (CCWC) (pp. 0991-0995). IEEE.</unstructured_citation></citation><citation key="ref8"><doi>10.1007/s10579-008-9076-6</doi><unstructured_citation>Busso, C.; Bulut, M.; Lee, C.C.; Kazemzadeh, A.; Mower, E.; Kim, S.; Chang, J.N.; Lee, S.; Narayanan, S.S. IEMOCAP: Interactive emotional dyadic motion capture database. Lang. Resour. Eval. 2008, 42, 335-359.</unstructured_citation></citation><citation key="ref9"><doi>10.18653/v1/P19-1050</doi><unstructured_citation>Poria, S.; Hazarika, D.; Majumder, N.; Naik, G.; Cambria, E.; Mihalcea, R. MELD: A Multimodal Multi-Party Dataset for Emotion Recognition in Conversations. In Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics, Florence, Italy, 28 July-2 August 2019; pp. 527-536.</unstructured_citation></citation><citation key="ref10"><doi>10.1109/TCYB.2018.2797176</doi><unstructured_citation>Wei-Long Zheng , Wei Liu, Yifei Lu, Bao-Liang Lu, and Andrzej Cichocki.&quot;EmotionMeter: A Multimodal Framework for Recognizing Human Emotions&quot; Volume: 49, Issue: 3, March 2019, Pages: 1110 - 1122, February 2018, DOI:10.1109/TCYB.2018.2797176.</unstructured_citation></citation><citation key="ref11"><doi>10.1109/ACCESS.2019.2955637</doi><unstructured_citation>SHAHLA NEMATI ,REZA ROHANI , MOHAMMAD EHSAN BASIRI , MOLOUD ABDAR , NEIL Y. YEN , AND VLADIMIR MAKARENKOV. &quot;A Hybrid Latent Space Data Fusion Method for Multimodal Emotion Recognition, IEEE Access Volume: 7, Pages: 172948 - 172964, ISSN:2169-3536, November 2019, DOI:10.1109/ACCESS.2019.2955637.</unstructured_citation></citation><citation key="ref12"><doi>10.1109/ACCESS.2019.2962085</doi><unstructured_citation>HAIPING HUANG, ZHENCHAO HU, WENMING WANG, AND MIN WU&quot;Multimodal Emotion Recognition Based on Ensemble Convolutional Neural Network&quot;, IEEE Access Volume: 8, Pages:3265 - 3271, December 2019, DOI:10.1109/ACCESS.2019.2962085.</unstructured_citation></citation><citation key="ref13"><doi>10.1109/ACCESS.2020.3021994</doi><unstructured_citation>HONGLI ZHANG &quot;Expression-EEG Based Collaborative Multimodal Emotion Recognition Using Deep AutoEncoder&quot;, IEEE Access Volume: 8, Pages: 164130 - 164143, ISSN: 2169-3536, September 2020, DOI:10.1109/ACCESS.2020.3021994.</unstructured_citation></citation><citation key="ref14"><doi>10.1109/ACCESS.2020.3026823</doi><unstructured_citation>SHAMANE SIRIWARDHANA , THARINDU KALUARACHCHI , MARK BILLINGHURST , AND SURANGA NANAYAKKARA. &quot;Multimodal Emotion Recognition With Transformer-Based Self Supervised Feature Fusion&quot;, IEEE Access Volume: 8, Pages: 176274 - 176285, ISSN: 2169-3536, September 2020, DOI:10.1109/ACCESS.2020.3026823,</unstructured_citation></citation><citation key="ref15"><doi>10.1109/ICASSP43922.2022.9746910</doi><unstructured_citation>Jinming Zhao, Ruichen Li, Qin Jin, Xinchao Wang, Haizhou Li, &quot;MEMOBERT: PRE-TRAINING MODEL WITH PROMPT-BASED LEARNING FOR MULTIMODAL EMOTION RECOGNITION&quot;, 27oct 2021.</unstructured_citation></citation><citation key="ref16"><doi>10.21437/Odyssey.2022-57</doi><unstructured_citation>Sarala Padi, Seyed Omid Sadjadi, Dinesh Manocha, and Ram D. Sriram. &quot;Multimodal Emotion Recognition using Transfer Learning from SpeakerRecognition and BERT-based models&quot;, 16 Feb 2022.</unstructured_citation></citation><citation key="ref17"><doi>10.1007/s11042-023-16443-1</doi><unstructured_citation>Puneet Kumar, Sarthak Malik, and Balasubramanian Raman, &quot;Interpretable Multimodal Emotion Recognition using Hybrid Fusion of Speech and Image Data&quot;, Springer Nature 2023.</unstructured_citation></citation><citation key="ref18"><doi>10.1109/ACCESS.2020.3023871</doi><unstructured_citation>YUCEL CIMTAY, ERHAN EKMEKCIOGLU, AND SEYMA CAGLAR-OZHAN, &quot;Cross-Subject Multimodal Emotion Recognition Based on Hybrid Fusion&quot;, September 14, 2020, DOI: 10.1109/ACCESS.2020.3023871</unstructured_citation></citation><citation key="ref19"><unstructured_citation>Fengmao Lv, Xiang Chen, Yanyong Huang, Lixin Duan, Guosheng Lin. &quot;Progressive Modality Reinforcement for Human Multimodal EmotionRecognition from Unaligned Multimodal Sequences&quot;</unstructured_citation></citation><citation key="ref20"><unstructured_citation>Jiahui Pan, Weijie Fang, Zhihang Zhang, Bingzhi Chen, Zheng Zhang, Shuihua Wang, &quot;Multimodal Emotion Recognition based on Facial Expressions Speech, and EEG&quot;, DOI 10.1109/OJEMB.2023.3240280</unstructured_citation></citation><citation key="ref21"><unstructured_citation>SANGHYUN LEE, DAVID K. HAN, AND HANSEOK KO, &quot;Multimodal Emotion Recognition Fusion Analysis Adapting BERT With Heterogeneous Feature Unification&quot;, June 2021, Digital Object Identifier 10.1109/ACCESS.2021.3092735.</unstructured_citation></citation><citation key="ref22"><doi>10.1109/TMM.2021.3063612</doi><unstructured_citation>Dung Nguyen, Duc Thanh Nguyen , Rui Zeng, Thanh Thi Nguyen , Son N. Tran, Thin Nguyen, Sridha Sridharan, &quot;Deep Auto-Encoders With Sequential Learning for Multimodal Dimensional Emotion Recognition&quot; IEEE, VOL. 24, 2020, pages:1313-1324.</unstructured_citation></citation><citation key="ref23"><doi>10.1109/JBHI.2021.3092412</doi><unstructured_citation>Yi Yang, Qiang Gao, Yu Song, Xiaolin Song, Zemin Mao, and Junjie Liu, &quot;Investigating of Deaf Emotion Cognition Pattern By EEG and Facial Expression Combination&quot;, IEEE, VOL. 26, FEBRUARY 2022, pg.589-599</unstructured_citation></citation><citation key="ref24"><doi>10.1109/TAFFC.2022.3216993</doi><unstructured_citation>Lucas Goncalves, Carlos Busso, &quot;Robust Audiovisual Emotion Recognition: Aligning Modalities, Capturing Temporal Information, and Handling Missing Features&quot;, IEEE, VOL. 13, OCTOBER-DECEMBER 2022, pg. 2156- 2169</unstructured_citation></citation><citation key="ref25"><doi>10.1109/TCSVT.2021.3072412</doi><unstructured_citation>Ke Zhang, Yuanqing Li, Jingyu Wang, Erik Cambria, Xuelong Li, &quot;Real-Time Video Emotion Recognition Based on Reinforcement Learning and Domain Knowledge&quot;, IEEE Vol 32, MARCH 2022, pg. 1034- 1047</unstructured_citation></citation><citation key="ref26"><doi>10.1109/LSP.2022.3151551</doi><unstructured_citation>Norbert Braunsch weiler , Rama Doddipatla ,Simon Keizer, and Svetlana Stoyanchev, &quot;Factors in Emotion Recognition With Deep Learning Models Using Speech and Text on Multiple Corpora&quot;,IEEE , VOL. 29, 2022, pg. 722-726</unstructured_citation></citation><citation key="ref27"><doi>10.1109/TCSVT.2022.3163445</doi><unstructured_citation>Guan-Nan Dong, Chi-Man Pun, and Zheng Zhang, &quot;Temporal Relation Inference Network for Multimodal Speech Emotion Recognition&quot; IEEE, VOL. 32, SEPTEMBER 2022, pg.6472- 6485</unstructured_citation></citation><citation key="ref28"><doi>10.1109/TAFFC.2024.3357656</doi><unstructured_citation>Jiménez-Guarneros, Magdiel, and Gibran Fuentes-Pineda. &quot;CFDA-CSF: A Multi-modal Domain Adaptation Method for Cross-subject Emotion Recognition.&quot; IEEE Transactions on Affective Computing (2024).</unstructured_citation></citation><citation key="ref29"><doi>10.1109/TMM.2024.3385180</doi><unstructured_citation>Sun, Teng, et al. &quot;Muti-modal Emotion Recognition via Hierarchical Knowledge Distillation.&quot; IEEE Transactions on Multimedia (2024).</unstructured_citation></citation><citation key="ref30"><doi>10.17694/bajece.1372107</doi><unstructured_citation>Alsaadawı, Hussein Farooq Tayeb, and Resul Daş. &quot;Multimodal Emotion Recognition Using Bi-LG-GCN for MELD Dataset.&quot; Balkan Journal of Electrical and Computer Engineering 12.1 (2024): 36-46.</unstructured_citation></citation><citation key="ref31"><doi>10.1007/s11042-023-16443-1</doi><unstructured_citation>Kumar, Puneet, Sarthak Malik, and Balasubramanian Raman. &quot;Interpretable multimodal emotion recognition using a hybrid fusion of speech and image data.&quot; Multimedia Tools and Applications 83.10 (2024): 28373-28394.</unstructured_citation></citation><citation key="ref32"><doi>10.1016/j.bspc.2024.106224</doi><unstructured_citation>Umair, Muhammad, et al. &quot;Emotion Fusion-Sense (Emo Fu-Sense)-A novel multimodal emotion classification technique.&quot; Biomedical Signal Processing and Control 94 (2024): 106224.</unstructured_citation></citation><citation key="ref33"><doi>10.3390/app14104199</doi><unstructured_citation>Makhmudov, Fazliddin, Alpamis Kultimuratov, and Young-Im Cho. &quot;Enhancing Multimodal Emotion Recognition through Attention Mechanisms in BERT and CNN Architectures.&quot; Applied Sciences 14.10 (2024): 4199.</unstructured_citation></citation><citation key="ref34"><doi>10.1109/TCDS.2024.3357618</doi><unstructured_citation>Wang, Ruiqi, et al. &quot;Husformer: A multi-modal transformer for multi-modal human state recognition.&quot; IEEE Transactions on Cognitive and Developmental Systems (2024).</unstructured_citation></citation><citation key="ref35"><doi>10.3390/s24113484</doi><unstructured_citation>Pereira, Rafael, et al. &quot;Systematic Review of Emotion Detection with Computer Vision and Deep Learning.&quot; Sensors 24.11 (2024): 3484.</unstructured_citation></citation><citation key="ref36"><doi>10.1016/j.knosys.2023.111126</doi><unstructured_citation>Li, Xingye, et al. &quot;Magdra: a multi-modal attention graph network with dynamic routing-by-agreement for multi-label emotion recognition.&quot; Knowledge-Based Systems 283 (2024): 111126.</unstructured_citation></citation><citation key="ref37"><doi>10.1109/ACCESS.2023.3263670</doi><unstructured_citation>Wang, Shuai, et al. &quot;Multimodal emotion recognition from EEG signals and facial expressions.&quot; IEEE Access 11 (2023): 33061-33068.</unstructured_citation></citation><citation key="ref38"><doi>10.1109/TAFFC.2023.3234777</doi><unstructured_citation>Lei, Yuanyuan, and Houwei Cao. &quot;Audio-visual emotion recognition with preference learning based on intended and multi-modal perceived labels.&quot; IEEE Transactions on Affective Computing (2023).</unstructured_citation></citation><citation key="ref39"><doi>10.1016/j.ins.2022.11.076</doi><unstructured_citation>Liu, Shuai, et al. &quot;Multi-modal fusion network with complementarity and importance for emotion recognition.&quot; Information Sciences 619 (2023): 679-694.</unstructured_citation></citation><citation key="ref40"><doi>10.1109/TCSVT.2023.3247822</doi><unstructured_citation>Hou, Mixiao, et al. &quot;Semantic alignment network for multi-modal emotion recognition.&quot; IEEE Transactions on Circuits and Systems for Video Technology (2023).</unstructured_citation></citation><citation key="ref41"><doi>10.1109/ACCESS.2023.3310428</doi><unstructured_citation>Shahzad, H. M., et al. &quot;Multi-Modal CNN Features Fusion for Emotion Recognition: A Modified Xception Model.&quot; IEEE Access (2023).</unstructured_citation></citation><citation key="ref42"><doi>10.1109/TMM.2023.3238314</doi><unstructured_citation>Zhang, Duzhen, et al. &quot;Structure Aware Multi-Graph Network for Multi-Modal Emotion Recognition in Conversations.&quot; IEEE Transactions on Multimedia (2023).</unstructured_citation></citation><citation key="ref43"><doi>10.1145/3593583</doi><unstructured_citation>Zhang, Yazhou, et al. &quot;M3GAT: A Multi-modal, Multi-task Interactive Graph Attention Network for Conversational Sentiment Analysis and Emotion Recognition.&quot; ACM Transactions on Information Systems 42.1 (2023): 1-32</unstructured_citation></citation><citation key="ref44"><doi>10.1109/TASLP.2022.3224287</doi><unstructured_citation>Singh, Gopendra Vikram, et al. &quot;Emoint-trans: A multimodal transformer for identifying emotions and intents in social conversations.&quot; IEEE/ACM Transactions on Audio, Speech, and Language Processing 31 (2022): 290-300.</unstructured_citation></citation><citation key="ref45"><doi>10.1016/j.knosys.2022.109978</doi><unstructured_citation>Zou, ShiHao, et al. &quot;Improving multimodal fusion with Main Modal Transformer for emotion recognition in conversation.&quot; Knowledge-Based Systems 258 (2022): 109978.</unstructured_citation></citation><citation key="ref46"><doi>10.1109/TAFFC.2022.3141237</doi><unstructured_citation>Lian, Zheng, Bin Liu, and Jianhua Tao. &quot;Smin: Semi-supervised multi-modal interaction network for conversational emotion recognition.&quot; IEEE Transactions on Affective Computing (2022).</unstructured_citation></citation><citation key="ref47"><doi>10.1109/ACCESS.2022.3183587</doi><unstructured_citation>Yoon, Yeo Chan. &quot;Can we exploit all datasets? Multimodal emotion recognition using cross-modal translation.&quot; IEEE Access 10 (2022): 64516-64524.</unstructured_citation></citation><citation key="ref48"><doi>10.1016/j.compbiomed.2022.105907</doi><unstructured_citation>Wang, Qian, et al. &quot;Multi-modal emotion recognition using EEG and speech signals.&quot; Computers in Biology and Medicine 149 (2022): 105907.</unstructured_citation></citation><citation key="ref49"><doi>10.1109/TMM.2022.3144885</doi><unstructured_citation>Zheng, Jiahao, et al. &quot;Multi-channel weight-sharing autoencoder based on cascade multi-head attention for multimodal emotion recognition.&quot; IEEE Transactions on Multimedia (2022).</unstructured_citation></citation><citation key="ref50"><doi>10.1109/LSP.2022.3210836</doi><unstructured_citation>Yang, Dingkang, et al. &quot;Contextual and cross-modal interaction for multi-modal speech emotion recognition.&quot; IEEE Signal Processing Letters 29 (2022): 2093-2097.</unstructured_citation></citation><citation key="ref51"><doi>10.1109/TCDS.2021.3071170</doi><unstructured_citation>Liu, Wei, et al. &quot;Comparing recognition performance and robustness of multimodal deep learning models for multimodal emotion recognition.&quot; IEEE Transactions on Cognitive and Developmental Systems 14.2 (2021): 715-729.</unstructured_citation></citation><citation key="ref52"><doi>10.1109/LSP.2021.3055755</doi><unstructured_citation>Guanghui, Chen, and Zeng Xiaoping. &quot;Multi-modal emotion recognition by fusing correlation features of speech-visual.&quot; IEEE Signal Processing Letters 28 (2021): 533-537.</unstructured_citation></citation><citation key="ref53"><doi>10.35940/ijeat.F8587.088619</doi><unstructured_citation>Kanani, P., &amp; Padole, Dr. M. (2019). Deep Learning to Detect Skin Cancer using Google Colab. In International Journal of Engineering and Advanced Technology (Vol. 8, Issue 6, pp. 2176-2183). https://doi.org/10.35940/ijeat.f8587.088619</unstructured_citation></citation><citation key="ref54"><doi>10.35940/ijitee.E2486.039520</doi><unstructured_citation>Sultana, N., Rahman, Md. T., Parven, N., Rashiduzzaman, M., &amp; Jabiullah, Md. I. (2020). Computer Vision based Plant Leaf Disease Recognition using Deep Learning. In International Journal of Innovative Technology and Exploring Engineering (Vol. 9, Issue 5, pp. 622-626). https://doi.org/10.35940/ijitee.e2486.039520</unstructured_citation></citation><citation key="ref55"><doi>10.35940/ijsce.C3265.099319</doi><unstructured_citation>Radhamani, V., &amp; Dalin, G. (2019). Significance of Artificial Intelligence and Machine Learning Techniques in Smart Cloud Computing: A Review. In International Journal of Soft Computing and Engineering (Vol. 9, Issue 3, pp. 1-7). https://doi.org/10.35940/ijsce.c3265.099319</unstructured_citation></citation></citation_list>
</doi_citations>
</body>
</doi_batch>
