{"id":"https://openalex.org/W3087338569","doi":"https://doi.org/10.1109/tnnls.2020.3017530","title":"Rich Visual Knowledge-Based Augmentation Network for Visual Question Answering","display_name":"Rich Visual Knowledge-Based Augmentation Network for Visual Question Answering","publication_year":2020,"publication_date":"2020-09-17","ids":{"openalex":"https://openalex.org/W3087338569","doi":"https://doi.org/10.1109/tnnls.2020.3017530","mag":"3087338569","pmid":"https://pubmed.ncbi.nlm.nih.gov/32941156"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2020.3017530","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2020.3017530","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014009259","display_name":"Liyang Zhang","orcid":"https://orcid.org/0000-0003-2675-9763"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Liyang Zhang","raw_affiliation_strings":["Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039387461","display_name":"Shuaicheng Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726805","display_name":"Megvii (China)","ror":"https://ror.org/040b32p69","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726805"]},{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuaicheng Liu","raw_affiliation_strings":["Megvii Technology Ltd., Chengdu, China","School of Information and Communication Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Megvii Technology Ltd., Chengdu, China","institution_ids":["https://openalex.org/I4401726805"]},{"raw_affiliation_string":"School of Information and Communication Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101442435","display_name":"Donghao Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726805","display_name":"Megvii (China)","ror":"https://ror.org/040b32p69","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726805"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Donghao Liu","raw_affiliation_strings":["Megvii Technology Ltd., Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Megvii Technology Ltd., Chengdu, China","institution_ids":["https://openalex.org/I4401726805"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087623065","display_name":"Pengpeng Zeng","orcid":"https://orcid.org/0000-0002-0672-3790"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Pengpeng Zeng","raw_affiliation_strings":["Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101598763","display_name":"Xiangpeng Li","orcid":"https://orcid.org/0000-0001-5350-5780"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiangpeng Li","raw_affiliation_strings":["Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036987388","display_name":"Jingkuan Song","orcid":"https://orcid.org/0000-0002-2549-8322"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingkuan Song","raw_affiliation_strings":["Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066645546","display_name":"Lianli Gao","orcid":"https://orcid.org/0000-0002-2522-6394"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lianli Gao","raw_affiliation_strings":["Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Future Media Center, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]},{"raw_affiliation_string":"School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5014009259"],"corresponding_institution_ids":["https://openalex.org/I150229711"],"apc_list":null,"apc_paid":null,"fwci":3.3374,"has_fulltext":false,"cited_by_count":76,"citation_normalized_percentile":{"value":0.9377101,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":100},"biblio":{"volume":"32","issue":"10","first_page":"4362","last_page":"4373"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9968000054359436,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.9019513130187988},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.784688413143158},{"id":"https://openalex.org/keywords/open-domain","display_name":"Open domain","score":0.6092882752418518},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5467575192451477},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.5443285703659058},{"id":"https://openalex.org/keywords/domain-knowledge","display_name":"Domain knowledge","score":0.529306173324585},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4998760223388672},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4762444794178009},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.46405211091041565},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.44530928134918213},{"id":"https://openalex.org/keywords/commonsense-knowledge","display_name":"Commonsense knowledge","score":0.41970184445381165},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.38416439294815063},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.13722988963127136}],"concepts":[{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.9019513130187988},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.784688413143158},{"id":"https://openalex.org/C2993776861","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Open domain","level":3,"score":0.6092882752418518},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5467575192451477},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.5443285703659058},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.529306173324585},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4998760223388672},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4762444794178009},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.46405211091041565},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.44530928134918213},{"id":"https://openalex.org/C30542707","wikidata":"https://www.wikidata.org/wiki/Q1603203","display_name":"Commonsense knowledge","level":3,"score":0.41970184445381165},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38416439294815063},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.13722988963127136},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2020.3017530","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2020.3017530","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:32941156","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/32941156","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.8299999833106995}],"awards":[{"id":"https://openalex.org/G1390112858","display_name":null,"funder_award_id":"2019JDTD0005","funder_id":"https://openalex.org/F4320333335","funder_display_name":"Sichuan Province Science and Technology Support Program"},{"id":"https://openalex.org/G3623292902","display_name":null,"funder_award_id":"61632007","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4883897726","display_name":null,"funder_award_id":"61872067","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7095600686","display_name":null,"funder_award_id":"61602049","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7314976618","display_name":null,"funder_award_id":"61872064","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7422496417","display_name":null,"funder_award_id":"ZYGX2019J073","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G8027008232","display_name":null,"funder_award_id":"61772116","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8213391892","display_name":null,"funder_award_id":"2019YFH0016","funder_id":"https://openalex.org/F4320333335","funder_display_name":"Sichuan Province Science and Technology Support Program"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320333335","display_name":"Sichuan Province Science and Technology Support Program","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":65,"referenced_works":["https://openalex.org/W102708294","https://openalex.org/W179875071","https://openalex.org/W639708223","https://openalex.org/W1514535095","https://openalex.org/W1686810756","https://openalex.org/W1933349210","https://openalex.org/W2064675550","https://openalex.org/W2122865749","https://openalex.org/W2142192571","https://openalex.org/W2147527908","https://openalex.org/W2189070436","https://openalex.org/W2194775991","https://openalex.org/W2250210237","https://openalex.org/W2250539671","https://openalex.org/W2560730294","https://openalex.org/W2560920409","https://openalex.org/W2561529111","https://openalex.org/W2613718673","https://openalex.org/W2739107216","https://openalex.org/W2745461083","https://openalex.org/W2904452845","https://openalex.org/W2905224888","https://openalex.org/W2948434896","https://openalex.org/W2950096400","https://openalex.org/W2950577311","https://openalex.org/W2962731754","https://openalex.org/W2962749469","https://openalex.org/W2962861647","https://openalex.org/W2962958773","https://openalex.org/W2963176022","https://openalex.org/W2963341956","https://openalex.org/W2963383024","https://openalex.org/W2963403868","https://openalex.org/W2963477107","https://openalex.org/W2963521239","https://openalex.org/W2963576560","https://openalex.org/W2963644680","https://openalex.org/W2963738886","https://openalex.org/W2964121744","https://openalex.org/W2964138017","https://openalex.org/W2964207259","https://openalex.org/W2964303913","https://openalex.org/W2964308564","https://openalex.org/W2966683369","https://openalex.org/W2979382951","https://openalex.org/W2981582341","https://openalex.org/W3008062779","https://openalex.org/W3046423960","https://openalex.org/W6630875275","https://openalex.org/W6631190155","https://openalex.org/W6636510571","https://openalex.org/W6637373629","https://openalex.org/W6678053269","https://openalex.org/W6679434410","https://openalex.org/W6682137061","https://openalex.org/W6686883664","https://openalex.org/W6689414982","https://openalex.org/W6739901393","https://openalex.org/W6748581942","https://openalex.org/W6752083267","https://openalex.org/W6755207826","https://openalex.org/W6757374366","https://openalex.org/W6758609666","https://openalex.org/W6763534971","https://openalex.org/W6765766786"],"related_works":["https://openalex.org/W2951097643","https://openalex.org/W2391533720","https://openalex.org/W4309395021","https://openalex.org/W4307481286","https://openalex.org/W3215363805","https://openalex.org/W204133468","https://openalex.org/W2991310128","https://openalex.org/W2395174199","https://openalex.org/W4226441484","https://openalex.org/W2516703895"],"abstract_inverted_index":{"Visual":[0],"question":[1,87],"answering":[2],"(VQA)":[3],"that":[4,124,134,150],"involves":[5],"understanding":[6],"an":[7,64,121],"image":[8],"and":[9,30,97,167],"paired":[10],"questions":[11,46,59],"develops":[12],"very":[13],"quickly":[14],"with":[15],"the":[16,38,41,53,86,104,111,130,135],"boost":[17],"of":[18,40,137],"deep":[19],"learning":[20],"in":[21],"relevant":[22],"research":[23],"fields,":[24],"such":[25,63,133],"as":[26],"natural":[27],"language":[28],"processing":[29],"computer":[31],"vision.":[32],"Existing":[33],"works":[34],"highly":[35],"rely":[36],"on":[37,156],"knowledge":[39,56,83,100,139,173],"data":[42,54,160],"set.":[43],"However,":[44],"some":[45],"require":[47],"more":[48,92],"professional":[49],"cues":[50],"other":[51],"than":[52],"set":[55],"to":[57,84,102,129,177],"answer":[58],"correctly.":[60],"To":[61],"address":[62],"issue,":[65],"we":[66,90,119],"propose":[67],"a":[68,72,99],"novel":[69],"framework":[70],"named":[71],"knowledge-based":[73],"augmentation":[74],"network":[75],"(KAN)":[76],"for":[77,110],"VQA.":[78],"We":[79],"introduce":[80,98],"object-related":[81],"open-domain":[82,172],"assist":[85],"answering.":[88],"Concretely,":[89],"extract":[91],"visual":[93],"information":[94],"from":[95],"images":[96],"graph":[101],"provide":[103],"necessary":[105],"common":[106],"sense":[107],"or":[108],"experience":[109],"reasoning":[112],"process.":[113],"For":[114],"these":[115],"two":[116],"augmented":[117],"inputs,":[118],"design":[120],"attention":[122],"module":[123],"can":[125,143],"adjust":[126],"itself":[127],"according":[128],"specific":[131],"questions,":[132],"importance":[136],"external":[138],"against":[140],"detected":[141],"objects":[142],"be":[144],"balanced":[145],"adaptively.":[146],"Extensive":[147],"experiments":[148],"show":[149],"our":[151,171],"KAN":[152],"achieves":[153],"state-of-the-art":[154],"performance":[155],"three":[157],"challenging":[158],"VQA":[159,163,178],"sets,":[161],"i.e.,":[162],"v2,":[164,166],"VQA-CP":[165],"FVQA.":[168],"In":[169],"addition,":[170],"is":[174,181],"also":[175],"beneficial":[176],"baselines.":[179],"Code":[180],"available":[182],"at":[183],"https://github.com/yyyanglz/KAN.":[184]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":19},{"year":2024,"cited_by_count":20},{"year":2023,"cited_by_count":18},{"year":2022,"cited_by_count":11},{"year":2021,"cited_by_count":5}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
