{"id":"https://openalex.org/W3196281958","doi":"https://doi.org/10.1109/icip42928.2021.9506438","title":"Attend, Correct And Focus: A Bidirectional Correct Attention Network For Image-Text Matching","display_name":"Attend, Correct And Focus: A Bidirectional Correct Attention Network For Image-Text Matching","publication_year":2021,"publication_date":"2021-08-23","ids":{"openalex":"https://openalex.org/W3196281958","doi":"https://doi.org/10.1109/icip42928.2021.9506438","mag":"3196281958"},"language":"en","primary_location":{"id":"doi:10.1109/icip42928.2021.9506438","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip42928.2021.9506438","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101810463","display_name":"Yang Liu","orcid":"https://orcid.org/0000-0001-5159-5954"},"institutions":[{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yang Liu","raw_affiliation_strings":["Chongqing University of Technology,School of Artificial Intelligence","School of Artificial Intelligence, Chongqing University of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Chongqing University of Technology,School of Artificial Intelligence","institution_ids":["https://openalex.org/I50632499"]},{"raw_affiliation_string":"School of Artificial Intelligence, Chongqing University of Technology","institution_ids":["https://openalex.org/I50632499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046380673","display_name":"Huaqiu Wang","orcid":"https://orcid.org/0000-0002-6789-6775"},"institutions":[{"id":"https://openalex.org/I50632499","display_name":"Chongqing University of Technology","ror":"https://ror.org/04vgbd477","country_code":"CN","type":"education","lineage":["https://openalex.org/I50632499"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaqiu Wang","raw_affiliation_strings":["Chongqing University of Technology,School of Artificial Intelligence","School of Artificial Intelligence, Chongqing University of Technology"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Chongqing University of Technology,School of Artificial Intelligence","institution_ids":["https://openalex.org/I50632499"]},{"raw_affiliation_string":"School of Artificial Intelligence, Chongqing University of Technology","institution_ids":["https://openalex.org/I50632499"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038040039","display_name":"Fanyang Meng","orcid":"https://orcid.org/0000-0001-5725-2178"},"institutions":[{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fanyang Meng","raw_affiliation_strings":["Peng Cheng Laboratory"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peng Cheng Laboratory","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100705472","display_name":"Mengyuan Liu","orcid":"https://orcid.org/0000-0002-6332-8316"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengyuan Liu","raw_affiliation_strings":["Sun Yat-sen University,School of Intelligent Systems Engineering","School of Intelligent Systems Engineering, Sun Yat-sen University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Sun Yat-sen University,School of Intelligent Systems Engineering","institution_ids":["https://openalex.org/I157773358"]},{"raw_affiliation_string":"School of Intelligent Systems Engineering, Sun Yat-sen University","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100410326","display_name":"Hong Liu","orcid":"https://orcid.org/0000-0002-7498-6541"},"institutions":[{"id":"https://openalex.org/I20231570","display_name":"Peking University","ror":"https://ror.org/02v51f717","country_code":"CN","type":"education","lineage":["https://openalex.org/I20231570"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hong Liu","raw_affiliation_strings":["Peking University,Key Laboratory of Machine Perception, Shenzhen Graduate School","Key Laboratory of Machine Perception, Shenzhen Graduate School, Peking University"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Peking University,Key Laboratory of Machine Perception, Shenzhen Graduate School","institution_ids":["https://openalex.org/I20231570"]},{"raw_affiliation_string":"Key Laboratory of Machine Perception, Shenzhen Graduate School, Peking University","institution_ids":["https://openalex.org/I20231570"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.2911,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.5602329,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"2673","last_page":"2677"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8467297554016113},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.805307924747467},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.7310467958450317},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6356557011604309},{"id":"https://openalex.org/keywords/attention-network","display_name":"Attention network","score":0.63017737865448},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6163343191146851},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5812703371047974},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5574929118156433},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5139855742454529},{"id":"https://openalex.org/keywords/semantic-matching","display_name":"Semantic matching","score":0.4870936870574951},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.48153287172317505},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.09236103296279907}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8467297554016113},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.805307924747467},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.7310467958450317},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6356557011604309},{"id":"https://openalex.org/C2993807640","wikidata":"https://www.wikidata.org/wiki/Q103709453","display_name":"Attention network","level":2,"score":0.63017737865448},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6163343191146851},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5812703371047974},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5574929118156433},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5139855742454529},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.4870936870574951},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48153287172317505},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.09236103296279907},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icip42928.2021.9506438","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icip42928.2021.9506438","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Image Processing (ICIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6200000047683716,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1527575280","https://openalex.org/W1773149199","https://openalex.org/W1861492603","https://openalex.org/W1905882502","https://openalex.org/W2149557440","https://openalex.org/W2546696630","https://openalex.org/W2745461083","https://openalex.org/W2774267535","https://openalex.org/W2950096400","https://openalex.org/W2952524542","https://openalex.org/W2962964995","https://openalex.org/W2963445828","https://openalex.org/W2964042428","https://openalex.org/W2965809241","https://openalex.org/W2965848243","https://openalex.org/W2982078236","https://openalex.org/W3035454331","https://openalex.org/W6631516269","https://openalex.org/W6639102338","https://openalex.org/W6747225742","https://openalex.org/W6749537441"],"related_works":["https://openalex.org/W1972035260","https://openalex.org/W4301594054","https://openalex.org/W2794488505","https://openalex.org/W3125889879","https://openalex.org/W3124422538","https://openalex.org/W1986106996","https://openalex.org/W4285012873","https://openalex.org/W2122517733","https://openalex.org/W1595649729","https://openalex.org/W3196281958"],"abstract_inverted_index":{"Image-text":[0],"matching":[1],"task":[2],"aims":[3],"to":[4,18,24,39,63,68,80,97],"learn":[5,19],"the":[6,20,29,65,82,99,115],"fine-grained":[7],"correspondences":[8,21],"between":[9,31],"images":[10],"and":[11,33,60,111,127],"sentences.":[12],"Existing":[13],"methods":[14,126],"use":[15],"attention":[16,66,83,100],"mechanism":[17],"by":[22,121],"attending":[23],"all":[25],"fragments":[26,32,87,104],"without":[27],"considering":[28],"relationship":[30],"global":[34,58,77],"semantics,":[35],"which":[36,56],"inevitably":[37],"lead":[38],"semantic":[40,71],"misalignment":[41],"among":[42],"irrelevant":[43,89,103],"fragments.":[44],"To":[45],"this":[46],"end,":[47],"we":[48,74],"propose":[49],"a":[50,76],"Bidirectional":[51],"Correct":[52],"Attention":[53],"Network":[54],"(BCAN),":[55],"leverages":[57],"similarities":[59,62],"local":[61,92],"reassign":[64],"weight,":[67],"avoid":[69],"such":[70],"misalignment.":[72],"Specifically,":[73],"introduce":[75],"correct":[78,81,93,98],"unit":[79,94],"focused":[84,101],"on":[85,102,109],"relevant":[86,106],"in":[88,105],"semantics.":[90,107],"A":[91],"is":[95],"used":[96],"Experiments":[108],"Flickr30K":[110],"MSCOCO":[112],"datasets":[113],"verify":[114],"effectiveness":[116],"of":[117],"our":[118],"proposed":[119],"BCAN":[120],"outperforming":[122],"both":[123],"previous":[124],"attention-based":[125],"state-of-the-art":[128],"methods.":[129],"Code":[130],"can":[131],"be":[132],"found":[133],"at:":[134],"https://github.com/liuyyy111/BCAN.":[135]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
