{"id":"https://openalex.org/W7128398860","doi":"https://doi.org/10.48550/arxiv.2602.06050","title":"Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering","display_name":"Relevance-aware Multi-context Contrastive Decoding for Retrieval-augmented Visual Question Answering","publication_year":2026,"publication_date":"2026-01-14","ids":{"openalex":"https://openalex.org/W7128398860","doi":"https://doi.org/10.48550/arxiv.2602.06050"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.06050","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5001493781","display_name":"Jongha Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Kim, Jongha","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110502130","display_name":"B. Ko","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ko, Byungoh","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084675431","display_name":"Jeehye Na","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Na, Jeehye","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125423765","display_name":"Jinsung Yoon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoon, Jinsung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125390144","display_name":"Hyunwoo J. Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kim, Hyunwoo J.","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5001493781"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9926000237464905,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.0027000000700354576,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.0010999999940395355,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.8654000163078308},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6238999962806702},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.5547000169754028},{"id":"https://openalex.org/keywords/question-answering","display_name":"Question answering","score":0.5414999723434448},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4661000072956085},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.33329999446868896}],"concepts":[{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.8654000163078308},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6991999745368958},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6238999962806702},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.5547000169754028},{"id":"https://openalex.org/C44291984","wikidata":"https://www.wikidata.org/wiki/Q1074173","display_name":"Question answering","level":2,"score":0.5414999723434448},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5235999822616577},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48030000925064087},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4661000072956085},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.33329999446868896},{"id":"https://openalex.org/C204397858","wikidata":"https://www.wikidata.org/wiki/Q4437907","display_name":"List decoding","level":5,"score":0.30730000138282776},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.29440000653266907},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.28119999170303345},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.27320000529289246},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.25690001249313354},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2547000050544739}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.06050","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.06050","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.06050","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.06050","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"score":0.6204025745391846,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Despite":[0],"the":[1,60,104,121,140,157,173,178,181,184],"remarkable":[2],"capabilities":[3],"of":[4,63,124,160],"Large":[5],"Vision":[6],"Language":[7],"Models":[8],"(LVLMs),":[9],"they":[10,50],"still":[11],"lack":[12],"detailed":[13],"knowledge":[14],"about":[15],"specific":[16],"entities.":[17],"Retrieval-augmented":[18],"Generation":[19],"(RAG)":[20],"is":[21,97,170,189],"a":[22,76,84],"widely":[23],"adopted":[24],"solution":[25],"that":[26,41,129,168],"enhances":[27],"LVLMs":[28,161],"by":[29,87,155],"providing":[30],"additional":[31,163],"contexts":[32,57,117],"from":[33,114],"an":[34],"external":[35],"Knowledge":[36],"Base.":[37],"However,":[38],"we":[39,69],"observe":[40],"previous":[42],"decoding":[43,78,134,158],"methods":[44,135],"for":[45,80],"RAG":[46],"are":[47],"sub-optimal":[48],"as":[49],"fail":[51],"to":[52,103,172,183],"sufficiently":[53],"leverage":[54],"multiple":[55,115,137],"relevant":[56,116],"and":[58],"suppress":[59],"negative":[61,122],"effects":[62,123],"irrelevant":[64,125],"contexts.":[65],"To":[66],"this":[67],"end,":[68],"propose":[70],"Relevance-aware":[71],"Multi-context":[72],"Contrastive":[73],"Decoding":[74],"(RMCD),":[75],"novel":[77],"method":[79,159],"RAG.":[81],"RMCD":[82,109,130,150,169],"outputs":[83,89],"final":[85],"prediction":[86],"combining":[88],"predicted":[90],"with":[91],"each":[92,95],"context,":[93],"where":[94],"output":[96],"weighted":[98],"based":[99],"on":[100,143],"its":[101],"relevance":[102],"question.":[105],"By":[106],"doing":[107],"so,":[108],"effectively":[110],"aggregates":[111],"useful":[112],"information":[113],"while":[118],"also":[119,166],"counteracting":[120],"ones.":[126],"Experiments":[127],"show":[128,167],"consistently":[131,176],"outperforms":[132],"other":[133],"across":[136,180],"LVLMs,":[138],"achieving":[139],"best":[141,179],"performance":[142],"three":[144],"knowledge-intensive":[145],"visual":[146],"question-answering":[147],"benchmarks.":[148],"Also,":[149],"can":[151],"be":[152],"simply":[153],"applied":[154],"replacing":[156],"without":[162],"training.":[164],"Analyses":[165],"robust":[171],"retrieval":[174,186],"results,":[175],"performing":[177],"weakest":[182],"strongest":[185],"results.":[187],"Code":[188],"available":[190],"at":[191],"https://github.com/mlvlab/RMCD.":[192]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-10T00:00:00"}
