{"id":"https://openalex.org/W4395065450","doi":"https://doi.org/10.48550/arxiv.2404.13947","title":"Self-Bootstrapped Visual-Language Model for Knowledge Selection and Question Answering","display_name":"Self-Bootstrapped Visual-Language Model for Knowledge Selection and Question Answering","publication_year":2024,"publication_date":"2024-04-22","ids":{"openalex":"https://openalex.org/W4395065450","doi":"https://doi.org/10.48550/arxiv.2404.13947"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2404.13947","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.13947","pdf_url":"https://arxiv.org/pdf/2404.13947","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2404.13947","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5094185904","display_name":"Dongze Hao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hao, Dongze","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043193778","display_name":"Qunbo Wang","orcid":"https://orcid.org/0000-0002-5607-7854"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Qunbo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040424302","display_name":"Longteng Guo","orcid":"https://orcid.org/0000-0002-4340-4000"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Longteng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020010429","display_name":"Jie Jiang","orcid":"https://orcid.org/0000-0003-3985-8701"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Jie","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100748638","display_name":"Jing Liu","orcid":"https://orcid.org/0000-0002-7594-3244"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Jing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9391000270843506,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10876","display_name":"Fault Detection and Control Systems","score":0.9391000270843506,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bootstrapping","display_name":"Bootstrapping (finance)","score":0.9118492603302002},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.6754178404808044},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.6463080644607544},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.47558653354644775},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.36212795972824097},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28516700863838196},{"id":"https://openalex.org/keywords/econometrics","display_name":"Econometrics","score":0.17458337545394897},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1304090917110443}],"concepts":[{"id":"https://openalex.org/C207609745","wikidata":"https://www.wikidata.org/wiki/Q4944086","display_name":"Bootstrapping (finance)","level":2,"score":0.9118492603302002},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.6754178404808044},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.6463080644607544},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.47558653354644775},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.36212795972824097},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28516700863838196},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.17458337545394897},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1304090917110443}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2404.13947","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.13947","pdf_url":"https://arxiv.org/pdf/2404.13947","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2404.13947","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2404.13947","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2404.13947","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2404.13947","pdf_url":"https://arxiv.org/pdf/2404.13947","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1283858192","display_name":null,"funder_award_id":"U21B2043","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1508456709","display_name":null,"funder_award_id":"62102416","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4729153174","display_name":null,"funder_award_id":"2023ZD0121200","funder_id":"https://openalex.org/F4320329860","funder_display_name":"National Science and Technology Major Project"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321605","display_name":"Government of Jiangsu Province","ror":"https://ror.org/004svx814"},{"id":"https://openalex.org/F4320329860","display_name":"National Science and Technology Major Project","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4395065450.pdf","grobid_xml":"https://content.openalex.org/works/W4395065450.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W1534274833","https://openalex.org/W3117246195","https://openalex.org/W156620619","https://openalex.org/W2616249226","https://openalex.org/W2098233217","https://openalex.org/W2914363205","https://openalex.org/W2997844990","https://openalex.org/W1598221548"],"abstract_inverted_index":{"While":[0],"large":[1],"visual-language":[2,110],"models":[3],"(LVLM)":[4],"have":[5],"shown":[6],"promising":[7],"results":[8],"on":[9,174,203],"traditional":[10],"visual":[11],"question":[12],"answering":[13],"benchmarks,":[14],"it":[15],"is":[16,82,219],"still":[17],"challenging":[18,205],"for":[19],"them":[20,158],"to":[21,51,55,86,112,159,163,189],"answer":[22,59,88,121],"complex":[23],"VQA":[24,208],"problems":[25],"which":[26,69],"requires":[27],"diverse":[28],"world":[29],"knowledge.":[30],"Motivated":[31],"by":[32,118,136,142],"the":[33,39,57,79,89,92,95,109,114,137,148,153,161,167,175,178,187,198,201,204],"research":[34],"of":[35,41,75,94,126,169,177,200,215],"retrieval-augmented":[36],"generation":[37],"in":[38,65,147],"field":[40],"natural":[42,66],"language":[43,67],"processing,":[44],"we":[45,102],"use":[46,157],"Dense":[47],"Passage":[48],"Retrieval":[49],"(DPR)":[50],"retrieve":[52],"related":[53],"knowledge":[54,81,116,146,150,171],"help":[56],"model":[58,111],"questions.":[60,122],"However,":[61],"DPR":[62,119],"conduct":[63],"retrieving":[64],"space,":[68],"may":[70],"not":[71,83],"ensure":[72],"comprehensive":[73],"acquisition":[74],"image":[76],"information.":[77],"Thus,":[78],"retrieved":[80,117,149],"truly":[84],"conducive":[85],"helping":[87],"question,":[90],"affecting":[91],"performance":[93,199],"overall":[96],"system.":[97],"To":[98],"address":[99],"this":[100],"issue,":[101],"propose":[103],"a":[104,212],"novel":[105],"framework":[106,124,195],"that":[107],"leverages":[108],"select":[113,190],"key":[115,145,170,191],"and":[120,130,139,155,180,184],"The":[123],"consists":[125],"two":[127],"modules:":[128],"Selector":[129,188],"Answerer,":[131],"where":[132],"both":[133],"are":[134],"initialized":[135],"LVLM":[138],"parameter-efficiently":[140],"finetuned":[141],"self-bootstrapping:":[143],"find":[144],"documents":[151,172],"using":[152],"Selector,":[154],"then":[156,185],"finetune":[160,186],"Answerer":[162,179],"predict":[164],"answers;":[165],"obtain":[166],"pseudo-labels":[168],"based":[173],"predictions":[176],"weak":[181],"supervision":[182],"labels,":[183],"knowledge;":[192],"repeat.":[193],"Our":[194,217],"significantly":[196],"enhances":[197],"baseline":[202],"open-domain":[206],"Knowledge-based":[207],"benchmark,":[209],"OK-VQA,":[210],"achieving":[211],"state-of-the-art":[213],"accuracy":[214],"62.83%.":[216],"code":[218],"publicly":[220],"available":[221],"at":[222],"https://github.com/haodongze/Self-KSel-QAns.":[223]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2024-04-24T00:00:00"}
