{"id":"https://openalex.org/W7138837287","doi":"https://doi.org/10.48550/arxiv.2603.16939","title":"Solution for 10th Competition on Ambivalence/Hesitancy (AH) Video Recognition Challenge using Divergence-Based Multimodal Fusion","display_name":"Solution for 10th Competition on Ambivalence/Hesitancy (AH) Video Recognition Challenge using Divergence-Based Multimodal Fusion","publication_year":2026,"publication_date":"2026-03-15","ids":{"openalex":"https://openalex.org/W7138837287","doi":"https://doi.org/10.48550/arxiv.2603.16939"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.16939","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16939","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.16939","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130068908","display_name":"Aislan Gabriel O. Souza","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Souza, Aislan Gabriel O.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129928556","display_name":"Agostinho Freire","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Freire, Agostinho","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129813519","display_name":"Leandro Honorato Silva","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Silva, Leandro Honorato","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129839458","display_name":"Igor Lucas B. da Silva","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"da Silva, Igor Lucas B.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130075908","display_name":"Jo\u00e3o Vin\u00edcius R. de Andrade","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Andrade, Jo\u00e3o Vin\u00edcius R.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129914166","display_name":"Gabriel C. de Albuquerque","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Albuquerque, Gabriel C.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130151427","display_name":"Lucas Matheus da S. Oliveira","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Oliveira, Lucas Matheus da S.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101673605","display_name":"M\u00e1rio Stela Guerra","orcid":"https://orcid.org/0009-0006-4158-7057"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guerra, M\u00e1rio Stela","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130135684","display_name":"Luciana Machado","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Machado, Luciana","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5130068908"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.3700000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.3700000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10667","display_name":"Emotion and Mood Recognition","score":0.15690000355243683,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.1185000017285347,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.7990000247955322},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.7653999924659729},{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.6783000230789185},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6126999855041504},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6093000173568726},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5663999915122986},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.46970000863075256},{"id":"https://openalex.org/keywords/action-recognition","display_name":"Action recognition","score":0.44780001044273376}],"concepts":[{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.7990000247955322},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.7653999924659729},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7598000168800354},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7231000065803528},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.6783000230789185},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6126999855041504},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6093000173568726},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5663999915122986},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.46970000863075256},{"id":"https://openalex.org/C2987834672","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Action recognition","level":3,"score":0.44780001044273376},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.41690000891685486},{"id":"https://openalex.org/C166955791","wikidata":"https://www.wikidata.org/wiki/Q629579","display_name":"Macro","level":2,"score":0.414900004863739},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4099000096321106},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.4083999991416931},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3953999876976013},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.3952000141143799},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3637999892234802},{"id":"https://openalex.org/C2779506182","wikidata":"https://www.wikidata.org/wiki/Q7580141","display_name":"Spotting","level":2,"score":0.3440999984741211},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3305000066757202},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.30660000443458557},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.3052999973297119},{"id":"https://openalex.org/C121687571","wikidata":"https://www.wikidata.org/wiki/Q4677630","display_name":"Activity recognition","level":2,"score":0.304500013589859},{"id":"https://openalex.org/C91306197","wikidata":"https://www.wikidata.org/wiki/Q45767","display_name":"Competition (biology)","level":2,"score":0.30300000309944153},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.26899999380111694},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2522999942302704}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.16939","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16939","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.16939","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.16939","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.7569898962974548,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,15],"address":[1],"the":[2,9,80,86,98,103,120],"Ambivalence/Hesitancy":[3],"(A/H)":[4],"Video":[5],"Recognition":[6],"Challenge":[7],"at":[8],"10th":[10],"ABAW":[11],"Competition":[12],"(CVPR":[13],"2026).":[14],"propose":[16],"a":[17,56,64,92],"divergence-based":[18],"multimodal":[19],"fusion":[20,69],"that":[21,82,114],"explicitly":[22],"measures":[23],"cross-modal":[24],"conflict":[25],"between":[26,75],"visual,":[27],"audio,":[28],"and":[29,47,61],"textual":[30],"channels.":[31],"Visual":[32],"features":[33],"are":[34],"encoded":[35],"as":[36],"Action":[37],"Units":[38],"(AUs)":[39],"extracted":[40],"via":[41,44,49],"Py-Feat,":[42],"audio":[43],"Wav2Vec":[45],"2.0,":[46],"text":[48],"BERT.":[50],"Each":[51],"modality":[52,76],"is":[53,119],"processed":[54],"by":[55],"BiLSTM":[57],"with":[58],"attention":[59],"pooling":[60],"projected":[62],"into":[63],"shared":[65],"embedding":[66],"space.":[67],"The":[68],"module":[70],"computes":[71],"pairwise":[72],"absolute":[73],"differences":[74],"embeddings,":[77],"directly":[78],"capturing":[79],"incongruence":[81],"characterizes":[83],"A/H.":[84,125],"On":[85],"BAH":[87],"dataset,":[88],"our":[89],"approach":[90],"achieves":[91],"Macro":[93],"F1":[94],"of":[95,106,117,124],"0.6808":[96],"on":[97],"validation":[99],"test":[100],"set,":[101],"outperforming":[102],"challenge":[104],"baseline":[105],"0.2827.":[107],"Statistical":[108],"analysis":[109],"across":[110],"1{,}132":[111],"videos":[112],"confirms":[113],"temporal":[115],"variability":[116],"AUs":[118],"dominant":[121],"visual":[122],"discriminator":[123]},"counts_by_year":[],"updated_date":"2026-03-20T20:54:20.808490","created_date":"2026-03-20T00:00:00"}
