{"id":"https://openalex.org/W3199894437","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534069","title":"FA-IATI: A Framework of Frequency Adaptive and Iterative Attention Interaction for Image-Text Matching","display_name":"FA-IATI: A Framework of Frequency Adaptive and Iterative Attention Interaction for Image-Text Matching","publication_year":2021,"publication_date":"2021-07-18","ids":{"openalex":"https://openalex.org/W3199894437","doi":"https://doi.org/10.1109/ijcnn52387.2021.9534069","mag":"3199894437"},"language":"en","primary_location":{"id":"doi:10.1109/ijcnn52387.2021.9534069","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534069","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5034674934","display_name":"Youxuan Qin","orcid":null},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Youxuan Qin","raw_affiliation_strings":["School of Computer Science and Technology, (ShanDong Academy of Sciences),Qilu University of Technology,Jinan,China","Qilu University of Technology, School of Computer Science and Technology, (ShanDong Academy of Sciences), Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, (ShanDong Academy of Sciences),Qilu University of Technology,Jinan,China","institution_ids":["https://openalex.org/I152269853"]},{"raw_affiliation_string":"Qilu University of Technology, School of Computer Science and Technology, (ShanDong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I152269853"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102993611","display_name":"Jing Zhao","orcid":"https://orcid.org/0000-0002-8169-2867"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Zhao","raw_affiliation_strings":["School of Computer Science and Technology, (ShanDong Academy of Sciences),Qilu University of Technology,Jinan,China","Qilu University of Technology, School of Computer Science and Technology, (ShanDong Academy of Sciences), Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, (ShanDong Academy of Sciences),Qilu University of Technology,Jinan,China","institution_ids":["https://openalex.org/I152269853"]},{"raw_affiliation_string":"Qilu University of Technology, School of Computer Science and Technology, (ShanDong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I152269853"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100351350","display_name":"Ming Li","orcid":"https://orcid.org/0000-0001-9017-2057"},"institutions":[{"id":"https://openalex.org/I134738993","display_name":"Shandong University of Traditional Chinese Medicine","ror":"https://ror.org/0523y5c19","country_code":"CN","type":"education","lineage":["https://openalex.org/I134738993"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ming Li","raw_affiliation_strings":["Shandong University of Traditional Chinese Medicine,School of Intelligence and Information Engineering,Jinan,China","School of Intelligence and Information Engineering, Shandong University of Traditional Chinese Medicine, Jinan, China"],"affiliations":[{"raw_affiliation_string":"Shandong University of Traditional Chinese Medicine,School of Intelligence and Information Engineering,Jinan,China","institution_ids":["https://openalex.org/I134738993"]},{"raw_affiliation_string":"School of Intelligence and Information Engineering, Shandong University of Traditional Chinese Medicine, Jinan, China","institution_ids":["https://openalex.org/I134738993"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060129397","display_name":"Chao Sun","orcid":"https://orcid.org/0000-0002-8778-0665"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Sun","raw_affiliation_strings":["School of Computer Science and Technology, (ShanDong Academy of Sciences),Qilu University of Technology,Jinan,China","Qilu University of Technology, School of Computer Science and Technology, (ShanDong Academy of Sciences), Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, (ShanDong Academy of Sciences),Qilu University of Technology,Jinan,China","institution_ids":["https://openalex.org/I152269853"]},{"raw_affiliation_string":"Qilu University of Technology, School of Computer Science and Technology, (ShanDong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I152269853"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5034674934"],"corresponding_institution_ids":["https://openalex.org/I152269853"],"apc_list":null,"apc_paid":null,"fwci":0.0961,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.39619281,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"8"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9944999814033508,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7518178224563599},{"id":"https://openalex.org/keywords/matching","display_name":"Matching (statistics)","score":0.6444315910339355},{"id":"https://openalex.org/keywords/semantic-matching","display_name":"Semantic matching","score":0.6050424575805664},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5173044204711914},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4786359369754791},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4726373553276062},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.46992194652557373},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44452497363090515},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.441854327917099},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.4344252347946167},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3654790222644806},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32611969113349915},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.2367781102657318},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11350730061531067}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7518178224563599},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.6444315910339355},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.6050424575805664},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5173044204711914},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4786359369754791},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4726373553276062},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.46992194652557373},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44452497363090515},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.441854327917099},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.4344252347946167},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3654790222644806},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32611969113349915},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.2367781102657318},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11350730061531067},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/ijcnn52387.2021.9534069","is_oa":false,"landing_page_url":"https://doi.org/10.1109/ijcnn52387.2021.9534069","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 International Joint Conference on Neural Networks (IJCNN)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.5099999904632568,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G1565240383","display_name":null,"funder_award_id":"2019YFB1404700","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W68733909","https://openalex.org/W123527740","https://openalex.org/W1514535095","https://openalex.org/W1529533208","https://openalex.org/W1756422141","https://openalex.org/W1821462560","https://openalex.org/W1861492603","https://openalex.org/W2158937425","https://openalex.org/W2295158492","https://openalex.org/W2302086703","https://openalex.org/W2466714650","https://openalex.org/W2499696929","https://openalex.org/W2519887557","https://openalex.org/W2546696630","https://openalex.org/W2557283755","https://openalex.org/W2745461083","https://openalex.org/W2774267535","https://openalex.org/W2778100917","https://openalex.org/W2883311563","https://openalex.org/W2890531016","https://openalex.org/W2919115771","https://openalex.org/W2953022248","https://openalex.org/W2956018683","https://openalex.org/W2962949934","https://openalex.org/W2962964995","https://openalex.org/W2963389687","https://openalex.org/W2963393391","https://openalex.org/W2963899908","https://openalex.org/W2964015378","https://openalex.org/W2964120214","https://openalex.org/W2964152081","https://openalex.org/W2964157791","https://openalex.org/W2965848243","https://openalex.org/W2988823324","https://openalex.org/W3029678209","https://openalex.org/W3035454331","https://openalex.org/W3128443161","https://openalex.org/W3173240144","https://openalex.org/W4299801216","https://openalex.org/W6605003669","https://openalex.org/W6630875275","https://openalex.org/W6637805884","https://openalex.org/W6638523607","https://openalex.org/W6639102338","https://openalex.org/W6685183736","https://openalex.org/W6724366048","https://openalex.org/W6726873649","https://openalex.org/W6747225742","https://openalex.org/W6749537441","https://openalex.org/W6754778999","https://openalex.org/W6789964533"],"related_works":["https://openalex.org/W3238102","https://openalex.org/W1380946","https://openalex.org/W12239746","https://openalex.org/W4090223","https://openalex.org/W6368054","https://openalex.org/W4603406","https://openalex.org/W7765441","https://openalex.org/W7122632","https://openalex.org/W6534656","https://openalex.org/W11006606"],"abstract_inverted_index":{"The":[0],"matching":[1,28,66,163],"relationship":[2],"between":[3,96],"language":[4],"and":[5,16,37,60,83,110,120,136,154,169],"vision,":[6],"which":[7],"extensively":[8],"involves":[9],"various":[10],"fields":[11],"such":[12],"as":[13],"search":[14],"engines":[15],"social":[17],"media,":[18],"is":[19],"a":[20,57],"hot":[21],"topic":[22],"that":[23,125],"researchers":[24],"are":[25],"exploring.":[26],"Existing":[27],"methods":[29],"pay":[30],"more":[31],"attention":[32,62,100],"to":[33,91],"alignment":[34,114],"of":[35,41,73,118,133],"features":[36,105],"lack":[38],"the":[39,46,52,71,93,116,130,140,148],"reasoning":[40],"high-level":[42],"semantic":[43,76,113],"concepts,":[44],"especially":[45],"difference":[47],"in":[48],"visual":[49,75],"expression,":[50],"inside":[51],"modal.":[53],"Therefore,":[54],"we":[55,79],"propose":[56],"frequency":[58],"adaptive":[59],"iterative":[61,108],"interaction":[63,101],"for":[64],"image-text":[65],"(FA-IATI)":[67],"framework,":[68],"starting":[69],"from":[70],"perspective":[72],"capturing":[74],"relationships.":[77],"Specifically,":[78],"adaptively":[80],"aggregate":[81],"low-frequency":[82],"high-frequency":[84],"signals":[85],"by":[86],"using":[87],"graph":[88],"convolutional":[89],"networks":[90],"enhance":[92],"contextual":[94],"information":[95],"image":[97,121,155],"regions.":[98,122],"An":[99],"module":[102],"generates":[103],"global":[104],"through":[106],"an":[107],"mechanism":[109],"gradually":[111],"achieves":[112,129],"during":[115],"aggregation":[117],"words":[119],"Experiments":[123],"show":[124],"our":[126],"FA-IATI":[127,165],"model":[128,150],"best":[131],"results":[132],"98.4%":[134],"(R@10)":[135,138],"94.9%":[137],"on":[139,151],"MS":[141],"COCO":[142],"dataset":[143],"(using":[144],"1Ktesting)":[145],"compared":[146],"with":[147,159],"baseline":[149],"text":[152],"query":[153],"query,":[156],"respectively.":[157],"Compared":[158],"other":[160],"current":[161],"advanced":[162],"models,":[164],"has":[166],"superior":[167],"performance":[168],"strong":[170],"competitiveness.":[171]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
