{"id":"https://openalex.org/W7139034035","doi":"https://doi.org/10.48550/arxiv.2603.15818","title":"Conflict-Aware Multimodal Fusion for Ambivalence and Hesitancy Recognition","display_name":"Conflict-Aware Multimodal Fusion for Ambivalence and Hesitancy Recognition","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7139034035","doi":"https://doi.org/10.48550/arxiv.2603.15818"},"language":"en","primary_location":{"id":"pmh:oai:HAL:hal-05596258v1","is_oa":false,"landing_page_url":"https://hal.science/hal-05596258","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2026","raw_type":"Preprints, Working Papers, ..."},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15818","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5080484799","display_name":"Salah Eddine Bekhouche","orcid":"https://orcid.org/0000-0001-5538-7407"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Bekhouche, Salah Eddine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073329526","display_name":"Hichem Telli","orcid":"https://orcid.org/0000-0003-4600-1781"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Telli, Hichem","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089464212","display_name":"Azeddine Benlamoudi","orcid":"https://orcid.org/0000-0002-2023-2154"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Benlamoudi, Azeddine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129813817","display_name":"Salah Eddine Herrouz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Herrouz, Salah Eddine","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114889285","display_name":"Abdelmalik Taleb-Ahmed","orcid":"https://orcid.org/0000-0001-6034-7290"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taleb-Ahmed, Abdelmalik","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129860709","display_name":"Abdenour Hadid","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hadid, Abdenour","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5080484799"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9555000066757202,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.9555000066757202,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12684","display_name":"Stuttering Research and Treatment","score":0.004100000020116568,"subfield":{"id":"https://openalex.org/subfields/3203","display_name":"Clinical Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.00279999990016222,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/ambivalence","display_name":"Ambivalence","score":0.5935999751091003},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5681999921798706},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.5493999719619751},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.5231999754905701},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.519599974155426},{"id":"https://openalex.org/keywords/macro","display_name":"Macro","score":0.4596000015735626},{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.44850000739097595},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4415000081062317}],"concepts":[{"id":"https://openalex.org/C162127614","wikidata":"https://www.wikidata.org/wiki/Q5928045","display_name":"Ambivalence","level":2,"score":0.5935999751091003},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5681999921798706},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5508999824523926},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.5493999719619751},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.5231999754905701},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.5203999876976013},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.519599974155426},{"id":"https://openalex.org/C166955791","wikidata":"https://www.wikidata.org/wiki/Q629579","display_name":"Macro","level":2,"score":0.4596000015735626},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.44850000739097595},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4424999952316284},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4415000081062317},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4146000146865845},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.4034000039100647},{"id":"https://openalex.org/C48677424","wikidata":"https://www.wikidata.org/wiki/Q6888088","display_name":"Mode (computer interface)","level":2,"score":0.3871999979019165},{"id":"https://openalex.org/C2777716012","wikidata":"https://www.wikidata.org/wiki/Q5318389","display_name":"Dyad","level":2,"score":0.35910001397132874},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.35030001401901245},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.33469998836517334},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.3325999975204468},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.3109999895095825},{"id":"https://openalex.org/C2780339515","wikidata":"https://www.wikidata.org/wiki/Q3074698","display_name":"Arrow","level":2,"score":0.3093999922275543},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.29760000109672546},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.29319998621940613},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.28279998898506165},{"id":"https://openalex.org/C2776035091","wikidata":"https://www.wikidata.org/wiki/Q7928819","display_name":"Viewpoints","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C2778344882","wikidata":"https://www.wikidata.org/wiki/Q278938","display_name":"Shot (pellet)","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.25029999017715454}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:HAL:hal-05596258v1","is_oa":false,"landing_page_url":"https://hal.science/hal-05596258","pdf_url":null,"source":{"id":"https://openalex.org/S4306402512","display_name":"HAL (Le Centre pour la Communication Scientifique Directe)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1294671590","host_organization_name":"Centre National de la Recherche Scientifique","host_organization_lineage":["https://openalex.org/I1294671590"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"2026","raw_type":"Preprints, Working Papers, ..."},{"id":"doi:10.48550/arxiv.2603.15818","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15818","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15818","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15818","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.41062572598457336,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Ambivalence":[0],"and":[1,59,80,109,148,194],"hesitancy":[2],"(A/H)":[3],"are":[4],"subtle":[5],"affective":[6],"states":[7,31],"where":[8],"a":[9,67,118,160,211],"person":[10],"shows":[11],"conflicting":[12],"signals":[13],"through":[14],"different":[15],"channels":[16],"--":[17,86,93,208],"saying":[18],"one":[19],"thing":[20],"while":[21,103,131],"their":[22],"face":[23,62],"or":[24],"voice":[25],"tells":[26],"another":[27],"story.":[28],"Recognising":[29],"these":[30],"automatically":[32],"is":[33,40,54],"valuable":[34],"in":[35,49,214],"clinical":[36],"settings,":[37],"but":[38],"it":[39,57],"hard":[41],"for":[42,71],"machines":[43],"because":[44],"the":[45,50,61,111,150,165,175,179,190,197],"key":[46,119],"evidence":[47],"lives":[48],"\\emph{disagreements}":[51],"between":[52,90],"what":[53,60],"said,":[55],"how":[56],"sounds,":[58],"shows.":[63],"We":[64],"present":[65],"\\textbf{ConflictAwareAH},":[66],"multimodal":[68,138,202],"framework":[69],"built":[70],"this":[72],"problem.":[73],"Three":[74],"pre-trained":[75],"encoders":[76],"extract":[77],"video,":[78],"audio,":[79],"text":[81,146],"representations.":[82],"Pairwise":[83],"conflict":[84],"features":[85],"element-wise":[87],"absolute":[88],"differences":[89,100,105],"modality":[91],"embeddings":[92],"serve":[94],"as":[95],"\\emph{bidirectional}":[96],"cues:":[97],"large":[98],"cross-modal":[99],"flag":[101],"A/H,":[102],"small":[104],"confirm":[106,134],"behavioural":[107],"consistency":[108],"anchor":[110],"negative":[112],"class.":[113],"This":[114],"conflict-aware":[115],"design":[116],"addresses":[117],"limitation":[120],"of":[121,218],"text-dominant":[122],"approaches,":[123],"which":[124],"tend":[125],"to":[126,133],"over-detect":[127],"A/H":[128],"(high":[129],"F1-AH)":[130],"struggling":[132],"its":[135],"absence:":[136],"our":[137,183],"model":[139,167],"improves":[140],"F1-NoAH":[141],"by":[142,204],"+4.6":[143],"points":[144,207],"over":[145,205],"alone":[147],"halves":[149],"class-performance":[151],"gap.":[152],"A":[153],"complementary":[154],"\\emph{text-guided":[155],"late":[156],"fusion}":[157],"strategy":[158],"blends":[159],"text-only":[161],"auxiliary":[162],"head":[163],"with":[164],"full":[166],"at":[168],"inference,":[169],"adding":[170],"+4.1":[171],"Macro":[172,187],"F1.":[173],"On":[174],"BAH":[176],"dataset":[177],"from":[178],"ABAW10":[180],"Ambivalence/Hesitancy":[181],"Challenge,":[182],"method":[184],"reaches":[185],"\\textbf{0.694":[186],"F1}":[188],"on":[189,196,210],"labelled":[191],"test":[192],"split":[193],"\\textbf{0.715}":[195],"private":[198],"leaderboard,":[199],"outperforming":[200],"published":[201],"baselines":[203],"10":[206],"all":[209],"single":[212],"GPU":[213],"under":[215],"25":[216],"minutes":[217],"training.":[219]},"counts_by_year":[],"updated_date":"2026-05-07T13:39:58.223016","created_date":"2026-03-20T00:00:00"}
