{"id":"https://openalex.org/W7137811341","doi":"https://doi.org/10.48550/arxiv.2603.14976","title":"Anchoring Emotions in Text: Robust Multimodal Fusion for Mimicry Intensity Estimation","display_name":"Anchoring Emotions in Text: Robust Multimodal Fusion for Mimicry Intensity Estimation","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7137811341","doi":"https://doi.org/10.48550/arxiv.2603.14976"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.14976","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14976","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.14976","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120131327","display_name":"Lingsi Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhu, Lingsi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129728923","display_name":"Yuefeng Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, Yuefeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129646829","display_name":"Yunxiang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yunxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129702304","display_name":"Naixiang Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Naixiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128664826","display_name":"Guoyuan Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Guoyuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129707797","display_name":"Jun Yu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yu, Jun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129646099","display_name":"Jiaen Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Jiaen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129708282","display_name":"Wei Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101461639","display_name":"Shengping Liu","orcid":"https://orcid.org/0000-0001-9026-0436"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Shengping","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129689475","display_name":"Ximin Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Ximin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.7689999938011169,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.7689999938011169,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.029200000688433647,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10429","display_name":"EEG and Brain-Computer Interfaces","score":0.021800000220537186,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.47380000352859497},{"id":"https://openalex.org/keywords/mimicry","display_name":"Mimicry","score":0.46709999442100525},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4487000107765198},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.43459999561309814},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.38589999079704285},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.3853999972343445},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.37929999828338623},{"id":"https://openalex.org/keywords/imperfect","display_name":"Imperfect","score":0.31839999556541443}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7620999813079834},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6258000135421753},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.47380000352859497},{"id":"https://openalex.org/C7863114","wikidata":"https://www.wikidata.org/wiki/Q192627","display_name":"Mimicry","level":2,"score":0.46709999442100525},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4487000107765198},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.43459999561309814},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.38589999079704285},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.3853999972343445},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.37929999828338623},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37049999833106995},{"id":"https://openalex.org/C2780310539","wikidata":"https://www.wikidata.org/wiki/Q12547192","display_name":"Imperfect","level":2,"score":0.31839999556541443},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C2776459999","wikidata":"https://www.wikidata.org/wiki/Q2119376","display_name":"Fidelity","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.29159998893737793},{"id":"https://openalex.org/C52421305","wikidata":"https://www.wikidata.org/wiki/Q1151499","display_name":"Particle filter","level":3,"score":0.28139999508857727},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.26820001006126404},{"id":"https://openalex.org/C2779585090","wikidata":"https://www.wikidata.org/wiki/Q3457762","display_name":"Resilience (materials science)","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2540000081062317},{"id":"https://openalex.org/C115051666","wikidata":"https://www.wikidata.org/wiki/Q6522493","display_name":"Ranging","level":2,"score":0.2535000145435333},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.2531000077724457}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.14976","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14976","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.14976","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.14976","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Estimating":[0],"Emotional":[1,48],"Mimicry":[2,49],"Intensity":[3,50],"(EMI)":[4],"in":[5,14,21,137],"naturalistic":[6],"environments":[7],"is":[8],"a":[9,52,93,103,147,178],"critical":[10],"yet":[11],"challenging":[12],"task":[13],"affective":[15],"computing.":[16],"The":[17],"primary":[18],"difficulty":[19],"lies":[20],"effectively":[22,162],"modeling":[23],"the":[24,58,64,81,122,156],"complex,":[25],"nonlinear":[26],"temporal":[27],"dynamics":[28],"across":[29,184],"highly":[30,73],"heterogeneous":[31],"modalities,":[32],"especially":[33],"when":[34],"physical":[35,124],"signals":[36,71],"are":[37,72],"corrupted":[38],"or":[39],"missing.":[40],"To":[41],"tackle":[42],"this,":[43],"we":[44,79,87,101,141],"propose":[45],"TAEMI":[46,161],"(Text-Anchored":[47],"estimation),":[51],"novel":[53],"multimodal":[54],"framework":[55,176],"designed":[56],"for":[57],"10th":[59],"ABAW":[60],"Competition.":[61],"Motivated":[62],"by":[63,133],"observation":[65],"that":[66,108,160],"continuous":[67,186],"visual":[68],"and":[69,120,146,167],"acoustic":[70],"susceptible":[74],"to":[75,114,127],"transient":[76],"environmental":[77],"noise,":[78],"break":[80],"traditional":[82],"symmetric":[83],"fusion":[84],"paradigm.":[85],"Instead,":[86],"leverage":[88],"textual":[89,112],"transcript--which":[90],"inherently":[91],"encode":[92],"stable,":[94],"time-independent":[95],"semantic":[96],"prior--as":[97],"central":[98],"anchors.":[99],"Specifically,":[100],"introduce":[102],"Text-Anchored":[104],"Dual":[105],"Cross-Attention":[106],"mechanism":[107],"utilizes":[109],"these":[110],"robust":[111,169],"queries":[113],"actively":[115],"filter":[116],"out":[117],"frame-level":[118],"redundancies":[119],"align":[121],"noisy":[123],"streams.":[125],"Furthermore,":[126],"prevent":[128],"catastrophic":[129],"performance":[130],"degradation":[131],"caused":[132],"inevitably":[134],"missing":[135],"data":[136],"unconstrained":[138],"real-world":[139],"scenarios,":[140],"integrate":[142],"Learnable":[143],"Missing-Modality":[144],"Tokens":[145],"Modality":[148],"Dropout":[149],"strategy":[150],"during":[151],"training.":[152],"Extensive":[153],"experiments":[154],"on":[155],"Hume-Vidmimic2":[157],"dataset":[158],"demonstrate":[159],"captures":[163],"fine-grained":[164],"emotional":[165,187],"variations":[166],"maintains":[168],"predictive":[170],"resilience":[171],"under":[172],"imperfect":[173],"conditions.":[174],"Our":[175],"achieves":[177],"state-of-the-art":[179],"mean":[180],"Pearson":[181],"correlation":[182],"coefficient":[183],"six":[185],"dimensions,":[188],"significantly":[189],"outperforming":[190],"existing":[191],"baseline":[192],"methods.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-18T00:00:00"}
