{"id":"https://openalex.org/W7160513442","doi":"https://doi.org/10.48550/arxiv.2605.04877","title":"To Fuse or to Drop? Dual-Path Learning for Resolving Modality Conflicts in Multimodal Emotion Recognition","display_name":"To Fuse or to Drop? Dual-Path Learning for Resolving Modality Conflicts in Multimodal Emotion Recognition","publication_year":2026,"publication_date":"2026-05-06","ids":{"openalex":"https://openalex.org/W7160513442","doi":"https://doi.org/10.48550/arxiv.2605.04877"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.04877","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04877","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.04877","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058525575","display_name":"Yangchen Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yu, Yangchen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135601176","display_name":"Qian Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Qian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135563009","display_name":"Jia Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135550334","display_name":"Zhenzhen Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Zhenzhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135601421","display_name":"Jinpeng Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Jinpeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135552974","display_name":"Lizi Liao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liao, Lizi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135637202","display_name":"Erik Cambria","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cambria, Erik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135573202","display_name":"Richang Hong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hong, Richang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5058525575"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.002300000051036477,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.0010000000474974513,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.6007000207901001},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.588699996471405},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5873000025749207},{"id":"https://openalex.org/keywords/discernment","display_name":"Discernment","score":0.5580999851226807},{"id":"https://openalex.org/keywords/legibility","display_name":"Legibility","score":0.5293999910354614},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5073000192642212},{"id":"https://openalex.org/keywords/fusion-mechanism","display_name":"Fusion mechanism","score":0.5026000142097473},{"id":"https://openalex.org/keywords/fuse","display_name":"Fuse (electrical)","score":0.4560999870300293}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6834999918937683},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6008999943733215},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.6007000207901001},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.588699996471405},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5873000025749207},{"id":"https://openalex.org/C2780211513","wikidata":"https://www.wikidata.org/wiki/Q1132167","display_name":"Discernment","level":2,"score":0.5580999851226807},{"id":"https://openalex.org/C2779332521","wikidata":"https://www.wikidata.org/wiki/Q1820694","display_name":"Legibility","level":2,"score":0.5293999910354614},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5073000192642212},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.5026000142097473},{"id":"https://openalex.org/C141353440","wikidata":"https://www.wikidata.org/wiki/Q182221","display_name":"Fuse (electrical)","level":2,"score":0.4560999870300293},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4034999907016754},{"id":"https://openalex.org/C160151201","wikidata":"https://www.wikidata.org/wiki/Q207946","display_name":"Arbitration","level":2,"score":0.38670000433921814},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3653999865055084},{"id":"https://openalex.org/C165838908","wikidata":"https://www.wikidata.org/wiki/Q736777","display_name":"Calibration","level":2,"score":0.3628000020980835},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.35510000586509705},{"id":"https://openalex.org/C2779545769","wikidata":"https://www.wikidata.org/wiki/Q5135364","display_name":"Closeness","level":2,"score":0.329800009727478},{"id":"https://openalex.org/C2778971668","wikidata":"https://www.wikidata.org/wiki/Q5510284","display_name":"Fusion rules","level":4,"score":0.2953999936580658},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.2946000099182129},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2922999858856201},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.288100004196167},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.2824999988079071},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.27649998664855957},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.04877","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04877","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.04877","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.04877","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7510124444961548,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"emotion":[1,220],"recognition":[2],"(MER)":[3],"benefits":[4],"from":[5,27,44,89],"combining":[6],"text,":[7],"audio,":[8],"and":[9,33,75,105,128,136,159,187,205,211,215],"vision,":[10],"yet":[11],"standard":[12],"fusion":[13,55,107,127,178],"often":[14],"fails":[15],"when":[16,72,76,108,177],"modalities":[17,176],"conflict.":[18],"Crucially,":[19],"conflicts":[20,25,42,145,168],"differ":[21],"in":[22],"resolvability:":[23],"benign":[24],"stem":[26],"missing,":[28],"weak,":[29],"or":[30,49,195],"ambiguous":[31],"cues":[32],"can":[34,170],"be":[35,171],"mitigated":[36],"by":[37],"cross-modal":[38],"calibration,":[39],"while":[40,173],"severe":[41],"arise":[43],"intrinsically":[45],"contradictory":[46],"(e.g.,":[47],"sarcasm)":[48],"misleading":[50,175],"signals,":[51],"for":[52],"which":[53],"forced":[54],"may":[56],"amplify":[57],"errors.":[58],"Recognizing":[59],"this,":[60],"we":[61],"propose":[62],"Dual-Path":[63],"Conflict":[64],"Resolution":[65],"(DCR),":[66],"a":[67,93,121,133,137],"unified":[68],"framework":[69],"that":[70,124,169,209],"learns":[71],"to":[73,77,92],"fuse":[74],"drop":[78],"modalities.":[79],"Path":[80,112],"I":[81],"(Affective":[82,114],"Fusion":[83],"Distiller,":[84],"AFD)":[85],"performs":[86],"reverse":[87],"distillation":[88],"audio/visual":[90],"teachers":[91],"textual":[94],"student":[95],"using":[96],"temporally":[97],"weighted":[98],"class":[99],"evidence,":[100],"thereby":[101],"enhancing":[102],"representation-level":[103],"calibration":[104,162],"improving":[106],"alignment":[109],"is":[110,179],"beneficial.":[111],"II":[113],"Discernment":[115],"Agent,":[116],"ADA)":[117],"formulates":[118],"MER":[119],"as":[120],"contextual":[122],"bandit":[123],"selects":[125],"among":[126],"unimodal":[129],"predictions":[130],"based":[131],"on":[132],"dual-view":[134],"state":[135],"calibration-aware":[138],"reward,":[139],"enabling":[140],"decision-level":[141],"arbitration":[142],"under":[143],"irreconcilable":[144],"without":[146],"requiring":[147],"per-modality":[148],"reliability":[149],"labels.":[150],"By":[151],"taking":[152],"into":[153],"account":[154],"the":[155],"full":[156],"multimodal":[157],"context":[158],"coupling":[160],"soft":[161],"with":[163],"hard":[164],"arbitration,":[165],"DCR":[166,190],"reconciles":[167],"aligned":[172],"bypassing":[174],"harmful.":[180],"Across":[181],"five":[182],"benchmarks":[183],"covering":[184],"both":[185],"dialogue-level":[186],"clip-level":[188],"MER,":[189],"consistently":[191],"outperforms":[192],"competitive":[193,198],"baselines":[194],"achieves":[196],"highly":[197],"results.":[199],"Further":[200],"ablations,":[201],"conflict-specific":[202],"subset":[203],"evaluation,":[204],"modality-selection":[206],"analysis":[207],"verify":[208],"AFD":[210],"ADA":[212],"are":[213],"complementary":[214],"jointly":[216],"improve":[217],"robust":[218],"conflict-aware":[219],"recognition.":[221]},"counts_by_year":[],"updated_date":"2026-05-08T13:18:25.657630","created_date":"2026-05-08T00:00:00"}
