{"id":"https://openalex.org/W4378805087","doi":"https://doi.org/10.1109/tnnls.2023.3276796","title":"BCAN: Bidirectional Correct Attention Network for Cross-Modal Retrieval","display_name":"BCAN: Bidirectional Correct Attention Network for Cross-Modal Retrieval","publication_year":2023,"publication_date":"2023-05-31","ids":{"openalex":"https://openalex.org/W4378805087","doi":"https://doi.org/10.1109/tnnls.2023.3276796","pmid":"https://pubmed.ncbi.nlm.nih.gov/37256811"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2023.3276796","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3276796","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101810463","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0001-5159-5954"},"institutions":[{"id":"https://openalex.org/I24185976","display_name":"Sichuan University","ror":"https://ror.org/011ashp19","country_code":"CN","type":"education","lineage":["https://openalex.org/I24185976"]},{"id":"https://openalex.org/I4210125143","display_name":"Chengdu University","ror":"https://ror.org/034z67559","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210125143"]},{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":["School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China","College of Computer Science, Sichuan University, Chengdu, China"],"raw_orcid":"https://orcid.org/0000-0001-5159-5954","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China","institution_ids":["https://openalex.org/I50632499"]},{"raw_affiliation_string":"College of Computer Science, Sichuan University, Chengdu, China","institution_ids":["https://openalex.org/I4210125143","https://openalex.org/I24185976"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100410326","display_name":"Hong Liu","orcid":"https://orcid.org/0000-0002-7498-6541"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Liu","raw_affiliation_strings":["Key Laboratory of Machine Perception, Shenzhen Graduate School, Peking University, Shenzhen, China","Shenzhen Graduate School, Key Laboratory of Machine Perception, Peking University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-7498-6541","affiliations":[{"raw_affiliation_string":"Key Laboratory of Machine Perception, Shenzhen Graduate School, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Shenzhen Graduate School, Key Laboratory of Machine Perception, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046380673","display_name":"Huaqiu Wang","orcid":"https://orcid.org/0000-0002-6789-6775"},"institutions":[{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaqiu Wang","raw_affiliation_strings":["School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China"],"raw_orcid":"https://orcid.org/0000-0002-6789-6775","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Chongqing University of Technology, Chongqing, China","institution_ids":["https://openalex.org/I50632499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038040039","display_name":"Fanyang Meng","orcid":"https://orcid.org/0000-0001-5725-2178"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fanyang Meng","raw_affiliation_strings":["Peng Cheng Laboratory, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0001-5725-2178","affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100705472","display_name":"Mengyuan Liu","orcid":"https://orcid.org/0000-0002-6332-8316"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyuan Liu","raw_affiliation_strings":["Key Laboratory of Machine Perception, Shenzhen Graduate School, Peking University, Shenzhen, China","Shenzhen Graduate School, Key Laboratory of Machine Perception, Peking University, Shenzhen, China"],"raw_orcid":"https://orcid.org/0000-0002-6332-8316","affiliations":[{"raw_affiliation_string":"Key Laboratory of Machine Perception, Shenzhen Graduate School, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Shenzhen Graduate School, Key Laboratory of Machine Perception, Peking University, Shenzhen, China","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.6842,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.86329464,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":"35","issue":"10","first_page":"14247","last_page":"14258"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7550853490829468},{"id":"https://openalex.org/keywords/bridging","display_name":"Bridging (networking)","score":0.6585684418678284},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.6442062854766846},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.6414440870285034},{"id":"https://openalex.org/keywords/modal","display_name":"Modal","score":0.602512538433075},{"id":"https://openalex.org/keywords/semantic-gap","display_name":"Semantic gap","score":0.575721025466919},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.55503249168396},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.550049901008606},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.52399080991745},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.5036749243736267},{"id":"https://openalex.org/keywords/attention-network","display_name":"Attention network","score":0.5013101100921631},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.34580695629119873},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.2933928072452545},{"id":"https://openalex.org/keywords/image-retrieval","display_name":"Image retrieval","score":0.23468488454818726}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7550853490829468},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.6585684418678284},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.6442062854766846},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.6414440870285034},{"id":"https://openalex.org/C71139939","wikidata":"https://www.wikidata.org/wiki/Q910194","display_name":"Modal","level":2,"score":0.602512538433075},{"id":"https://openalex.org/C86034646","wikidata":"https://www.wikidata.org/wiki/Q474311","display_name":"Semantic gap","level":4,"score":0.575721025466919},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.55503249168396},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.550049901008606},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.52399080991745},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.5036749243736267},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.5013101100921631},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.34580695629119873},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.2933928072452545},{"id":"https://openalex.org/C1667742","wikidata":"https://www.wikidata.org/wiki/Q10927554","display_name":"Image retrieval","level":3,"score":0.23468488454818726},{"id":"https://openalex.org/C188027245","wikidata":"https://www.wikidata.org/wiki/Q750446","display_name":"Polymer chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2023.3276796","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2023.3276796","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:37256811","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/37256811","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8283459870","display_name":null,"funder_award_id":"62203476","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":67,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1527575280","https://openalex.org/W1614298861","https://openalex.org/W1773149199","https://openalex.org/W1861492603","https://openalex.org/W1905882502","https://openalex.org/W2064675550","https://openalex.org/W2100235303","https://openalex.org/W2102605133","https://openalex.org/W2106277773","https://openalex.org/W2149557440","https://openalex.org/W2150600350","https://openalex.org/W2157331557","https://openalex.org/W2210322478","https://openalex.org/W2277195237","https://openalex.org/W2524097181","https://openalex.org/W2546696630","https://openalex.org/W2552579943","https://openalex.org/W2745461083","https://openalex.org/W2752782242","https://openalex.org/W2774267535","https://openalex.org/W2883311563","https://openalex.org/W2894879246","https://openalex.org/W2896457183","https://openalex.org/W2942614241","https://openalex.org/W2961553857","https://openalex.org/W2962964995","https://openalex.org/W2963340196","https://openalex.org/W2963383990","https://openalex.org/W2963467339","https://openalex.org/W2963633722","https://openalex.org/W2964044605","https://openalex.org/W2964120214","https://openalex.org/W2964216321","https://openalex.org/W2965848243","https://openalex.org/W2976669726","https://openalex.org/W2981448908","https://openalex.org/W2982078236","https://openalex.org/W2988823324","https://openalex.org/W2990571534","https://openalex.org/W3005971801","https://openalex.org/W3015655929","https://openalex.org/W3016451726","https://openalex.org/W3021938280","https://openalex.org/W3035454331","https://openalex.org/W3035552787","https://openalex.org/W3035605030","https://openalex.org/W3080952252","https://openalex.org/W3108274592","https://openalex.org/W3110042533","https://openalex.org/W3110846182","https://openalex.org/W3119545279","https://openalex.org/W3119589206","https://openalex.org/W3121052081","https://openalex.org/W3160179442","https://openalex.org/W3195903836","https://openalex.org/W3202436960","https://openalex.org/W3213100861","https://openalex.org/W4205432963","https://openalex.org/W6631190155","https://openalex.org/W6631516269","https://openalex.org/W6636510571","https://openalex.org/W6678470764","https://openalex.org/W6684191040","https://openalex.org/W6747225742","https://openalex.org/W6755207826","https://openalex.org/W6776031226"],"related_works":["https://openalex.org/W4388870064","https://openalex.org/W2210139803","https://openalex.org/W4235186151","https://openalex.org/W2054685365","https://openalex.org/W2056057048","https://openalex.org/W2128807628","https://openalex.org/W1555966012","https://openalex.org/W4234264766","https://openalex.org/W2415426693","https://openalex.org/W3209623075"],"abstract_inverted_index":{"As":[0],"a":[1,127,148,156,175,204],"fundamental":[2],"topic":[3],"in":[4,24,28,72,280,293,315],"bridging":[5],"the":[6,17,38,47,51,57,83,88,91,136,160,165,168,182,193,198,207,223,241,247,256,264,269,285,291,294,304,333,340],"gap":[7],"between":[8,20,59,75,85,162,187,210,259,297],"vision":[9],"and":[10,26,44,61,87,113,126,164,173,184,189,212,217,261,284,324,336,344],"language,":[11],"cross-modal":[12,64],"retrieval":[13],"purposes":[14],"to":[15,46,55,103,191,221,239,267,302,339],"obtain":[16],"correspondences'":[18],"relationship":[19,84,209],"fragments,":[21],"i.e.,":[22],"subregions":[23],"images":[25,43,93,105,170,188,214,260],"words":[27,60,125],"texts.":[29],"Compared":[30],"with":[31,108,254],"earlier":[32],"methods":[33,53,335],"that":[34,327],"focus":[35,117],"on":[36,120,197,246,277,312,321],"learning":[37],"visual":[39],"semantic":[40,73,111,139,208,224,270,305],"embedding":[41,49],"from":[42,226],"sentences":[45,107,172,190,216,262],"shared":[48],"space,":[50],"existing":[52],"tend":[54],"learn":[56],"correspondences":[58],"regions":[62],"via":[63],"attention.":[65],"However,":[66],"such":[67,101,115],"attention-based":[68,334],"approaches":[69,102,116],"invariably":[70],"result":[71],"misalignment":[74,225,271,306],"subfragments":[76,86,163,211,279,314],"for":[77,100],"two":[78,227,236,300],"reasons:":[79],"1)":[80],"without":[81],"modeling":[82,181,255],"semantics":[89,166],"of":[90,129,138,159,167,243],"entire":[92,169,213],"or":[94,106,171,215],"sentences,":[95],"it":[96],"will":[97,134],"be":[98],"hard":[99],"distinguish":[104],"multiple":[109],"same":[110],"fragments":[112,298],"2)":[114],"attention":[118,151,178,194,232,244,265,276,295,311],"evenly":[119],"all":[121,332],"subfragments,":[122],"including":[123],"nonvisual":[124],"lot":[128],"redundant":[130],"regions,":[131],"which":[132,154],"also":[133],"face":[135],"problem":[137,272,307],"misalignment.":[140],"To":[141],"solve":[142,222,268,303],"these":[143],"problems,":[144],"this":[145,219],"article":[146],"proposes":[147],"bidirectional":[149],"correct":[150,177,192,231,240,251,287],"network":[152],"(BCAN),":[153],"introduces":[155],"novel":[157,176],"concept":[158,205,220],"relevance":[161],"designs":[174],"mechanism":[179,266],"by":[180,274,309],"local":[183,286],"global":[185,257],"similarity":[186,258],"weights":[195,296],"focused":[196,245],"wrong":[199,248],"fragments.":[200,249],"Specifically,":[201],"we":[202,234],"introduce":[203],"about":[206],"use":[218],"aspects.":[228],"In":[229],"our":[230,328],"mechanism,":[233],"design":[235],"independent":[237],"units":[238],"weight":[242],"Global":[250],"unit":[252,288],"(GCU)":[253],"into":[263],"caused":[273,308],"focusing":[275,310],"relevant":[278,316],"irrelevant":[281,313],"pairs":[282,317],"(RI)":[283],"(LCU)":[289],"consider":[290],"difference":[292],"among":[299],"steps":[301],"(IR).":[318],"Extensive":[319],"experiments":[320],"large-scale":[322],"MS-COCO":[323],"Flickr30K":[325],"show":[326],"proposed":[329],"method":[330],"outperforms":[331],"is":[337],"competitive":[338],"state-of-the-art.":[341],"Our":[342],"code":[343],"pretrained":[345],"model":[346],"are":[347],"publicly":[348],"available":[349],"at:":[350],"https://github.com/liuyyy111/BCAN.":[351]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
