{"id":"https://openalex.org/W4410536426","doi":"https://doi.org/10.1109/tcsvt.2025.3571534","title":"MDKAT: Multimodal Decoupling With Knowledge Aggregation and Transfer for Video Emotion Recognition","display_name":"MDKAT: Multimodal Decoupling With Knowledge Aggregation and Transfer for Video Emotion Recognition","publication_year":2025,"publication_date":"2025-05-20","ids":{"openalex":"https://openalex.org/W4410536426","doi":"https://doi.org/10.1109/tcsvt.2025.3571534"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2025.3571534","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3571534","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100696824","display_name":"Jian Wang","orcid":"https://orcid.org/0000-0002-4316-932X"},"institutions":[{"id":"https://openalex.org/I82760581","display_name":"Taizhou University","ror":"https://ror.org/04fzhyx73","country_code":"CN","type":"education","lineage":["https://openalex.org/I82760581"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jian Wang","raw_affiliation_strings":["Institute of Intelligent Information Processing, Taizhou University, Taizhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Information Processing, Taizhou University, Taizhou, China","institution_ids":["https://openalex.org/I82760581"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100367825","display_name":"Chenglong Wang","orcid":"https://orcid.org/0000-0003-2391-0923"},"institutions":[{"id":"https://openalex.org/I82760581","display_name":"Taizhou University","ror":"https://ror.org/04fzhyx73","country_code":"CN","type":"education","lineage":["https://openalex.org/I82760581"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenglong Wang","raw_affiliation_strings":["Institute of Intelligent Information Processing, Taizhou University, Taizhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Information Processing, Taizhou University, Taizhou, China","institution_ids":["https://openalex.org/I82760581"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072247998","display_name":"Lin Guo","orcid":"https://orcid.org/0000-0003-2244-0034"},"institutions":[{"id":"https://openalex.org/I82760581","display_name":"Taizhou University","ror":"https://ror.org/04fzhyx73","country_code":"CN","type":"education","lineage":["https://openalex.org/I82760581"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lin Guo","raw_affiliation_strings":["Institute of Intelligent Information Processing, Taizhou University, Taizhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Information Processing, Taizhou University, Taizhou, China","institution_ids":["https://openalex.org/I82760581"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057674073","display_name":"Shuchang Zhao","orcid":"https://orcid.org/0009-0004-8777-2974"},"institutions":[{"id":"https://openalex.org/I82760581","display_name":"Taizhou University","ror":"https://ror.org/04fzhyx73","country_code":"CN","type":"education","lineage":["https://openalex.org/I82760581"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuchang Zhao","raw_affiliation_strings":["Institute of Intelligent Information Processing, Taizhou University, Taizhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Information Processing, Taizhou University, Taizhou, China","institution_ids":["https://openalex.org/I82760581"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100462164","display_name":"Dandan Wang","orcid":"https://orcid.org/0000-0002-5490-3921"},"institutions":[{"id":"https://openalex.org/I82760581","display_name":"Taizhou University","ror":"https://ror.org/04fzhyx73","country_code":"CN","type":"education","lineage":["https://openalex.org/I82760581"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dandan Wang","raw_affiliation_strings":["Institute of Intelligent Information Processing, Taizhou University, Taizhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Information Processing, Taizhou University, Taizhou, China","institution_ids":["https://openalex.org/I82760581"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101891025","display_name":"Shiqing Zhang","orcid":"https://orcid.org/0000-0001-8184-5088"},"institutions":[{"id":"https://openalex.org/I82760581","display_name":"Taizhou University","ror":"https://ror.org/04fzhyx73","country_code":"CN","type":"education","lineage":["https://openalex.org/I82760581"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiqing Zhang","raw_affiliation_strings":["Institute of Intelligent Information Processing, Taizhou University, Taizhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Information Processing, Taizhou University, Taizhou, China","institution_ids":["https://openalex.org/I82760581"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021523224","display_name":"Xiaoming Zhao","orcid":"https://orcid.org/0000-0002-4708-4171"},"institutions":[{"id":"https://openalex.org/I82760581","display_name":"Taizhou University","ror":"https://ror.org/04fzhyx73","country_code":"CN","type":"education","lineage":["https://openalex.org/I82760581"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoming Zhao","raw_affiliation_strings":["Institute of Intelligent Information Processing, Taizhou University, Taizhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Information Processing, Taizhou University, Taizhou, China","institution_ids":["https://openalex.org/I82760581"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050817770","display_name":"Jun Yu","orcid":"https://orcid.org/0000-0003-1922-7283"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Yu","raw_affiliation_strings":["School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]},{"raw_affiliation_string":"Department of Computer Science and Technology, Harbin Institute of Technology, Shenzhen, China","institution_ids":["https://openalex.org/I204983213"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100631216","display_name":"Yaowei Wang","orcid":"https://orcid.org/0000-0003-2197-9038"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaowei Wang","raw_affiliation_strings":["Peng Cheng Laboratory, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005421447","display_name":"Yi Yang","orcid":"https://orcid.org/0000-0002-0512-880X"},"institutions":[{"id":"https://openalex.org/I168879160","display_name":"Zhejiang University of Science and Technology","ror":"https://ror.org/05mx0wr29","country_code":"CN","type":"education","lineage":["https://openalex.org/I168879160"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yi Yang","raw_affiliation_strings":["College of Computer Science and Technology, Zhejiang University, Hangzhou, Zhejiang, China"],"affiliations":[{"raw_affiliation_string":"College of Computer Science and Technology, Zhejiang University, Hangzhou, Zhejiang, China","institution_ids":["https://openalex.org/I168879160"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039832462","display_name":"Siwei Ma","orcid":"https://orcid.org/0000-0002-2731-5403"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Siwei Ma","raw_affiliation_strings":["National Engineering Research Center of Visual Technology, School of Computer Science, Peking University, Beijing, China","School of Computer Science, National Engineering Research Center of Visual Technology, Peking University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"National Engineering Research Center of Visual Technology, School of Computer Science, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"School of Computer Science, National Engineering Research Center of Visual Technology, Peking University, Beijing, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100393506","display_name":"Qi Tian","orcid":"https://orcid.org/0000-0002-7252-5047"},"institutions":[{"id":"https://openalex.org/I2250955327","display_name":"Huawei Technologies (China)","ror":"https://ror.org/00cmhce21","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250955327"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qi Tian","raw_affiliation_strings":["Huawei Cloud and AI, Shenzhen, China","Huawei Cloud &#x0026; AI, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Huawei Cloud and AI, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]},{"raw_affiliation_string":"Huawei Cloud &#x0026; AI, Shenzhen, China","institution_ids":["https://openalex.org/I2250955327"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":12,"corresponding_author_ids":["https://openalex.org/A5100696824"],"corresponding_institution_ids":["https://openalex.org/I82760581"],"apc_list":null,"apc_paid":null,"fwci":46.4094,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.99880066,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"35","issue":"10","first_page":"9809","last_page":"9822"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9503999948501587,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9503999948501587,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7021239399909973},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5493504405021667},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.5230487585067749},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.41387754678726196},{"id":"https://openalex.org/keywords/knowledge-transfer","display_name":"Knowledge transfer","score":0.4116722643375397},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.40284398198127747},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3449632525444031},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3227831721305847},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.10030055046081543},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07428455352783203}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7021239399909973},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5493504405021667},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.5230487585067749},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.41387754678726196},{"id":"https://openalex.org/C2776960227","wikidata":"https://www.wikidata.org/wiki/Q2586354","display_name":"Knowledge transfer","level":2,"score":0.4116722643375397},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.40284398198127747},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3449632525444031},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3227831721305847},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.10030055046081543},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07428455352783203},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2025.3571534","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2025.3571534","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2576352071","display_name":null,"funder_award_id":"LQ24F020014","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2745919159","display_name":null,"funder_award_id":"LZ20F020002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4329375876","display_name":null,"funder_award_id":"62276180","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5851559761","display_name":null,"funder_award_id":"61976149","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G721482673","display_name":null,"funder_award_id":"62406217","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W2095176743","https://openalex.org/W2395639500","https://openalex.org/W2556418146","https://openalex.org/W2703895418","https://openalex.org/W2766272105","https://openalex.org/W2809734421","https://openalex.org/W2883409523","https://openalex.org/W2962931510","https://openalex.org/W2964051877","https://openalex.org/W2964216663","https://openalex.org/W3037572520","https://openalex.org/W3093051361","https://openalex.org/W3169801598","https://openalex.org/W3173549566","https://openalex.org/W3205519684","https://openalex.org/W3207376445","https://openalex.org/W3208632377","https://openalex.org/W4220829848","https://openalex.org/W4221162874","https://openalex.org/W4226442948","https://openalex.org/W4281701185","https://openalex.org/W4283034150","https://openalex.org/W4304092664","https://openalex.org/W4312758889","https://openalex.org/W4320004356","https://openalex.org/W4321482228","https://openalex.org/W4372341189","https://openalex.org/W4375928984","https://openalex.org/W4376607994","https://openalex.org/W4379356527","https://openalex.org/W4380875665","https://openalex.org/W4386075879","https://openalex.org/W4386699383","https://openalex.org/W4386826611","https://openalex.org/W4387010698","https://openalex.org/W4387249887","https://openalex.org/W4387968266","https://openalex.org/W4389195633","https://openalex.org/W4390872585","https://openalex.org/W4390876428","https://openalex.org/W4391302483","https://openalex.org/W4392903856","https://openalex.org/W4392908038","https://openalex.org/W4392909853","https://openalex.org/W4393156571","https://openalex.org/W4393161236","https://openalex.org/W4395070006","https://openalex.org/W4402979780","https://openalex.org/W4405686157"],"related_works":["https://openalex.org/W4313561376","https://openalex.org/W3103825105","https://openalex.org/W3027880158","https://openalex.org/W3207533102","https://openalex.org/W1617565119","https://openalex.org/W160381218","https://openalex.org/W2512958550","https://openalex.org/W2004102934","https://openalex.org/W4366455350","https://openalex.org/W2329266651"],"abstract_inverted_index":{"Multimodal":[0,49],"Emotion":[1],"Recognition":[2],"(MER)":[3],"leverages":[4],"multiple":[5],"input":[6],"signals":[7],"to":[8,32,94],"identify":[9],"the":[10,33,131,145,153,169],"expressed":[11],"emotions":[12],"in":[13,38,63],"user-generated":[14],"data.":[15],"Currently,":[16],"effectively":[17],"addressing":[18],"both":[19],"modality":[20],"heterogeneity":[21],"and":[22,55,79,137,156],"homogeneity":[23],"on":[24,101,152,173],"MER":[25,102,174],"tasks":[26],"is":[27,67],"a":[28,105,124,138],"challenging":[29],"issue":[30],"due":[31],"diversity":[34],"of":[35,69,98,134,147,171],"multimodal":[36,60,99],"inputs":[37],"videos.":[39,65],"To":[40],"address":[41],"this":[42,44],"issue,":[43],"work":[45],"proposes":[46],"an":[47,115],"efficient":[48],"Decoupling":[50],"Method":[51],"with":[52],"Knowledge":[53,125,139],"Aggregation":[54,126],"Transfer":[56,140],"(MDKAT)":[57],"for":[58,82,111,121,129,143],"robust":[59],"feature":[61,74,77,122],"learning":[62,100],"emotional":[64],"MDKAT":[66,161,172],"consisted":[68],"three":[70,86],"key":[71],"steps:":[72],"modality-independent":[73,113,135],"extraction,":[75,78],"modality-specific":[76],"multi-loss":[80],"integration":[81],"decoupling.":[83],"In":[84],"these":[85],"steps,":[87],"four":[88],"crucial":[89],"modules":[90],"are":[91],"individually":[92],"designed":[93],"improve":[95],"different":[96,148],"aspects":[97],"tasks,":[103],"including":[104],"Cross-modal":[106],"Feature":[107],"Fusion":[108],"(CFF)":[109],"module":[110,120,128,142],"enhancing":[112],"features,":[114,136],"Adaptive":[116],"Masked":[117],"Self-Attention":[118],"(AMSA)":[119],"refinement,":[123],"(KA)":[127],"ensuring":[130],"semantic":[132],"similarity":[133],"(KT)":[141],"balancing":[144],"strengths":[146],"modalities.":[149],"Experimental":[150],"results":[151],"typical":[154],"CMU-MOSI":[155],"CMU-MOSEI":[157],"datasets":[158],"show":[159],"that":[160],"obtains":[162],"superior":[163],"performance":[164],"over":[165],"state-of-the-art":[166],"methods,":[167],"demonstrating":[168],"effectiveness":[170],"tasks.":[175]},"counts_by_year":[{"year":2026,"cited_by_count":8},{"year":2025,"cited_by_count":15}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
