{"id":"https://openalex.org/W4412082248","doi":"https://doi.org/10.1109/tifs.2025.3586484","title":"Adaptive Interaction and Correction Attention Network for Audio-Visual Matching","display_name":"Adaptive Interaction and Correction Attention Network for Audio-Visual Matching","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4412082248","doi":"https://doi.org/10.1109/tifs.2025.3586484"},"language":"en","primary_location":{"id":"doi:10.1109/tifs.2025.3586484","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tifs.2025.3586484","pdf_url":null,"source":{"id":"https://openalex.org/S61310614","display_name":"IEEE Transactions on Information Forensics and Security","issn_l":"1556-6013","issn":["1556-6013","1556-6021"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Information Forensics and Security","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100784264","display_name":"Jiaxiang Wang","orcid":"https://orcid.org/0000-0003-3059-798X"},"institutions":[{"id":"https://openalex.org/I184681353","display_name":"Anhui University of Science and Technology","ror":"https://ror.org/00q9atg80","country_code":"CN","type":"education","lineage":["https://openalex.org/I184681353"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiaxiang Wang","raw_affiliation_strings":["School of Artificial Intelligence, Anhui University of Science and Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Anhui University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I184681353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017558628","display_name":"Aihua Zheng","orcid":"https://orcid.org/0000-0002-9820-4743"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Aihua Zheng","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, and the School of Artificial Intelligence, Anhui University, Hefei, China","the Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, and the School of Artificial Intelligence, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"the Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100349638","display_name":"Lei Liu","orcid":"https://orcid.org/0000-0003-2749-5528"},"institutions":[{"id":"https://openalex.org/I184681353","display_name":"Anhui University of Science and Technology","ror":"https://ror.org/00q9atg80","country_code":"CN","type":"education","lineage":["https://openalex.org/I184681353"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Liu","raw_affiliation_strings":["School of Artificial Intelligence, Anhui University of Science and Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Anhui University of Science and Technology, Hefei, China","institution_ids":["https://openalex.org/I184681353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100398932","display_name":"Chenglong Li","orcid":"https://orcid.org/0000-0002-7233-2739"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenglong Li","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, and the School of Artificial Intelligence, Anhui University, Hefei, China","the Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, and the School of Artificial Intelligence, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"the Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112749024","display_name":"Ran He","orcid":"https://orcid.org/0000-0002-3807-991X"},"institutions":[{"id":"https://openalex.org/I4210112150","display_name":"Institute of Automation","ror":"https://ror.org/022c3hy66","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210112150"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ran He","raw_affiliation_strings":["Institute of Automation, University of Chinese Academy of Sciences, Beijing, China","University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Automation, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210112150","https://openalex.org/I4210165038"]},{"raw_affiliation_string":"University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030720334","display_name":"Jin Tang","orcid":"https://orcid.org/0000-0001-8375-3590"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Tang","raw_affiliation_strings":["Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, Hefei, China","School of Computer Science and Technology, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"School of Computer Science and Technology, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100784264"],"corresponding_institution_ids":["https://openalex.org/I184681353"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.19125401,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"20","issue":null,"first_page":"7558","last_page":"7571"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9916999936103821,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9887999892234802,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11439","display_name":"Video Analysis and Summarization","score":0.9072999954223633,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8395787477493286},{"id":"https://openalex.org/keywords/audio-visual","display_name":"Audio visual","score":0.48506394028663635},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4535828232765198},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45044010877609253},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.4474157392978668},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3960537910461426},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.378091037273407},{"id":"https://openalex.org/keywords/multimedia","display_name":"Multimedia","score":0.22415491938591003}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8395787477493286},{"id":"https://openalex.org/C3017588708","wikidata":"https://www.wikidata.org/wiki/Q758901","display_name":"Audio visual","level":2,"score":0.48506394028663635},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4535828232765198},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45044010877609253},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4474157392978668},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3960537910461426},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.378091037273407},{"id":"https://openalex.org/C49774154","wikidata":"https://www.wikidata.org/wiki/Q131765","display_name":"Multimedia","level":1,"score":0.22415491938591003},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tifs.2025.3586484","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tifs.2025.3586484","pdf_url":null,"source":{"id":"https://openalex.org/S61310614","display_name":"IEEE Transactions on Information Forensics and Security","issn_l":"1556-6013","issn":["1556-6013","1556-6021"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Information Forensics and Security","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4306577167","display_name":null,"funder_award_id":"62372003","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G569029087","display_name":null,"funder_award_id":"2308085Y40","funder_id":"https://openalex.org/F4320334897","funder_display_name":"Natural Science Foundation of Anhui Province"},{"id":"https://openalex.org/G7432064593","display_name":null,"funder_award_id":"2408085QF199","funder_id":"https://openalex.org/F4320334897","funder_display_name":"Natural Science Foundation of Anhui Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334897","display_name":"Natural Science Foundation of Anhui Province","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W1925193522","https://openalex.org/W2096733369","https://openalex.org/W2106873328","https://openalex.org/W2108598243","https://openalex.org/W2146842127","https://openalex.org/W2194775991","https://openalex.org/W2726515241","https://openalex.org/W2752782242","https://openalex.org/W2775516437","https://openalex.org/W2808260522","https://openalex.org/W2808631503","https://openalex.org/W2963026686","https://openalex.org/W2963066927","https://openalex.org/W2963801643","https://openalex.org/W2963887950","https://openalex.org/W2969985801","https://openalex.org/W2984696290","https://openalex.org/W2997819898","https://openalex.org/W3024840775","https://openalex.org/W3034303554","https://openalex.org/W3034725201","https://openalex.org/W3034956129","https://openalex.org/W3093411628","https://openalex.org/W3104090442","https://openalex.org/W3118548710","https://openalex.org/W3154848313","https://openalex.org/W3169472988","https://openalex.org/W3177326298","https://openalex.org/W3182657421","https://openalex.org/W3199528201","https://openalex.org/W3200115061","https://openalex.org/W3214311327","https://openalex.org/W4224924564","https://openalex.org/W4285603046","https://openalex.org/W4312337341","https://openalex.org/W4312626422","https://openalex.org/W4312763854","https://openalex.org/W4312886874","https://openalex.org/W4313196086","https://openalex.org/W4313387422","https://openalex.org/W4318811844","https://openalex.org/W4322576470","https://openalex.org/W4360993864","https://openalex.org/W4372341093","https://openalex.org/W4383199472","https://openalex.org/W4386065291","https://openalex.org/W4386065863","https://openalex.org/W4386066416","https://openalex.org/W4386071498","https://openalex.org/W4386075642","https://openalex.org/W4388240180","https://openalex.org/W4390097682","https://openalex.org/W4393034333","https://openalex.org/W4394805464","https://openalex.org/W4394897075","https://openalex.org/W6752791795"],"related_works":["https://openalex.org/W2271369634","https://openalex.org/W3147472394","https://openalex.org/W2047100085","https://openalex.org/W2350550760","https://openalex.org/W578794879","https://openalex.org/W2625296515","https://openalex.org/W3137890128","https://openalex.org/W1984634519","https://openalex.org/W4245955731","https://openalex.org/W2393726419"],"abstract_inverted_index":{"Audio-visual":[0],"matching":[1,43,177],"techniques":[2],"aim":[3],"to":[4,86,125],"recognize":[5],"and":[6,27,57,128,146,175,184],"match":[7],"information":[8,67],"across":[9,17,194],"different":[10],"identities":[11],"by":[12],"learning":[13,39],"a":[14,53,74,154,172],"similarity":[15,166],"metric":[16,38,76,158],"modalities.":[18],"However,":[19],"modal":[20,48,88],"differences":[21,49],"arise":[22],"from":[23],"insufficient":[24],"cross-modal":[25,104],"correlations":[26],"noise":[28],"interference,":[29],"which":[30,99,120,163],"substantially":[31],"hinder":[32],"the":[33,47,93,114,131,138,165,182],"performance":[34],"of":[35,80,133,168],"traditional":[36],"deep":[37,66],"methods":[40],"in":[41,171],"audio-visual":[42],"tasks.":[44],"To":[45],"address":[46],"issue,":[50],"we":[51,91,112,152],"propose":[52,92,113],"novel":[54],"Adaptive":[55,94,115],"Interactive":[56,95],"Correction":[58,116],"Attention":[59,96,117],"Network":[60],"(AICANet).":[61],"This":[62],"network":[63],"efficiently":[64],"captures":[65],"connections,":[68],"generating":[69],"modality-consistent":[70],"feature":[71,135,169],"embeddings":[72,170],"within":[73],"unified":[75],"framework.":[77],"The":[78,202],"core":[79],"AICANet":[81,189],"is":[82,141],"its":[83,199],"two-pronged":[84],"approach":[85],"reducing":[87],"differences.":[89],"First,":[90],"(AIA)":[97],"module,":[98],"flexibly":[100],"establishes":[101],"associations":[102],"among":[103],"local":[105,134],"features":[106],"using":[107],"dynamically":[108],"generated":[109],"pseudo-labels.":[110],"Second,":[111],"(ACA)":[118],"mechanism,":[119],"employs":[121],"an":[122],"adaptive":[123],"threshold":[124],"de-interference":[126],"effectively":[127],"accurately":[129],"adjust":[130],"representation":[132],"associations.":[136],"Notably,":[137],"ACA":[139],"mechanism":[140],"suitable":[142],"for":[143],"both":[144],"intra-modal":[145],"inter-modal":[147],"refined":[148],"attention":[149],"correction.":[150],"Additionally,":[151],"design":[153],"relative":[155],"distance":[156],"stretching":[157],"loss":[159],"(<italic":[160],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[161],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">L<sub>RDSM</sub></i>),":[162],"reinforces":[164],"invariance":[167],"uniform":[173],"space":[174],"enhances":[176],"accuracy.":[178],"Extensive":[179],"tests":[180],"on":[181],"VoxCeleb":[183],"VoxCeleb2":[185],"datasets":[186],"demonstrate":[187],"that":[188],"outperforms":[190],"leading":[191],"existing":[192],"algorithms":[193],"several":[195],"evaluation":[196],"metrics,":[197],"validating":[198],"superior":[200],"performance.":[201],"codes":[203],"can":[204],"be":[205],"found":[206],"at":[207],"https://github.com/w1018979952/AICANet.":[208]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
