{"id":"https://openalex.org/W7155192189","doi":"https://doi.org/10.48550/arxiv.2604.19412","title":"VCE: A zero-cost hallucination mitigation method of LVLMs via visual contrastive editing","display_name":"VCE: A zero-cost hallucination mitigation method of LVLMs via visual contrastive editing","publication_year":2026,"publication_date":"2026-04-21","ids":{"openalex":"https://openalex.org/W7155192189","doi":"https://doi.org/10.48550/arxiv.2604.19412"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.19412","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19412","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.19412","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134276702","display_name":"Yanbin Huang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Huang, Yanbin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134207770","display_name":"Yisen Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Yisen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134252818","display_name":"Guiyao Tie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tie, Guiyao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065871371","display_name":"Xiaoye Qu","orcid":"https://orcid.org/0000-0002-4907-3978"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qu, Xiaoye","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134309524","display_name":"Pan Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Pan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134257048","display_name":"Hongfei Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Hongfei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005852517","display_name":"Zhaofan Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, Zhaofan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101409441","display_name":"Hao Sun","orcid":"https://orcid.org/0000-0001-7797-8718"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Hao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134294175","display_name":"XueLong Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Xuelong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.3582000136375427,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.3582000136375427,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13397","display_name":"Hallucinations in medical conditions","score":0.07209999859333038,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T11094","display_name":"Face Recognition and Perception","score":0.050999999046325684,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/singular-value-decomposition","display_name":"Singular value decomposition","score":0.614300012588501},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5910000205039978},{"id":"https://openalex.org/keywords/visual-hallucination","display_name":"Visual Hallucination","score":0.541100025177002},{"id":"https://openalex.org/keywords/decomposition","display_name":"Decomposition","score":0.37220001220703125},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.367900013923645},{"id":"https://openalex.org/keywords/linear-subspace","display_name":"Linear subspace","score":0.34299999475479126},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.31380000710487366}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7088000178337097},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6413000226020813},{"id":"https://openalex.org/C22789450","wikidata":"https://www.wikidata.org/wiki/Q420904","display_name":"Singular value decomposition","level":2,"score":0.614300012588501},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5910000205039978},{"id":"https://openalex.org/C2908998935","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Visual Hallucination","level":2,"score":0.541100025177002},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4253000020980835},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.41670000553131104},{"id":"https://openalex.org/C124681953","wikidata":"https://www.wikidata.org/wiki/Q339062","display_name":"Decomposition","level":2,"score":0.37220001220703125},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.367900013923645},{"id":"https://openalex.org/C12362212","wikidata":"https://www.wikidata.org/wiki/Q728435","display_name":"Linear subspace","level":2,"score":0.34299999475479126},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.31380000710487366},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.3133000135421753},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2773999869823456},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.2696000039577484},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2687000036239624},{"id":"https://openalex.org/C178253425","wikidata":"https://www.wikidata.org/wiki/Q162668","display_name":"Visual perception","level":3,"score":0.26249998807907104},{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.26159998774528503},{"id":"https://openalex.org/C155092808","wikidata":"https://www.wikidata.org/wiki/Q182557","display_name":"Computational linguistics","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.25200000405311584}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.19412","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19412","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.19412","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.19412","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"vision-language":[1],"models":[2],"(LVLMs)":[3],"frequently":[4],"suffer":[5],"from":[6,53],"Object":[7],"Hallucination":[8],"(OH),":[9],"wherein":[10],"they":[11],"generate":[12,64],"descriptions":[13],"containing":[14],"objects":[15],"that":[16,47,60,85,127,153],"are":[17],"not":[18],"actually":[19],"present":[20],"in":[21,30,147],"the":[22,48,93,107,164],"input":[23],"image.":[24],"This":[25],"phenomenon":[26],"is":[27,42],"particularly":[28],"problematic":[29],"real-world":[31],"applications":[32],"such":[33],"as":[34,135],"medical":[35],"imaging":[36],"and":[37,87,115,143],"autonomous":[38],"driving,":[39],"where":[40],"accuracy":[41],"critical.":[43],"Recent":[44],"studies":[45],"suggest":[46],"hallucination":[49,113,158],"problem":[50],"may":[51],"stem":[52],"language":[54],"priors:":[55],"biases":[56],"learned":[57],"during":[58],"pretraining":[59],"cause":[61],"LVLMs":[62],"to":[63,96,111,120],"words":[65],"based":[66],"on":[67],"their":[68],"statistical":[69],"co-occurrence.":[70],"To":[71],"mitigate":[72],"this":[73],"problem,":[74],"we":[75,105],"propose":[76],"Visual":[77],"Contrastive":[78],"Editing":[79],"(VCE),":[80],"a":[81,136],"novel":[82],"post-hoc":[83],"method":[84],"identifies":[86],"suppresses":[88],"hallucinatory":[89],"tendencies":[90],"by":[91],"analyzing":[92],"model's":[94,108,165],"response":[95],"contrastive":[97],"visual":[98],"perturbations.":[99],"Using":[100],"Singular":[101],"Value":[102],"Decomposition":[103],"(SVD),":[104],"decompose":[106],"activation":[109],"patterns":[110],"isolate":[112],"subspaces":[114],"apply":[116],"targeted":[117],"parameter":[118],"edits":[119],"attenuate":[121],"its":[122],"influence.":[123],"Unlike":[124],"existing":[125],"approaches":[126],"require":[128],"fine-tuning":[129],"or":[130],"labeled":[131],"data,":[132],"VCE":[133,154],"operates":[134],"label-free":[137],"intervention,":[138],"making":[139],"it":[140],"both":[141],"scalable":[142],"practical":[144],"for":[145],"deployment":[146],"resource-constrained":[148],"settings.":[149],"Experimental":[150],"results":[151],"demonstrate":[152],"effectively":[155],"reduces":[156],"object":[157],"across":[159],"multiple":[160],"benchmarks":[161],"while":[162],"maintaining":[163],"original":[166],"computational":[167],"efficiency.":[168]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-23T00:00:00"}
