{"id":"https://openalex.org/W4413469110","doi":"https://doi.org/10.1109/tmm.2025.3599076","title":"Mitigating Hallucinations in Large Vision-Language Models via Reasoning Uncertainty-Guided Refinement","display_name":"Mitigating Hallucinations in Large Vision-Language Models via Reasoning Uncertainty-Guided Refinement","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4413469110","doi":"https://doi.org/10.1109/tmm.2025.3599076"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3599076","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3599076","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5043867916","display_name":"Shenshen Li","orcid":"https://orcid.org/0000-0002-6340-012X"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shenshen Li","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China","Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009074046","display_name":"Xing Xu","orcid":"https://orcid.org/0000-0001-5685-3123"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xing Xu","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China","Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057871676","display_name":"Wei Meng","orcid":"https://orcid.org/0000-0001-5186-419X"},"institutions":[{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenxin Meng","raw_affiliation_strings":["Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108085750","display_name":"Jingkuan Song","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jingkuan Song","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China","Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017577255","display_name":"Chong Peng","orcid":"https://orcid.org/0000-0002-6942-7358"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chong Peng","raw_affiliation_strings":["Meituan, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Shanghai, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5000395470","display_name":"Hengtao Shen","orcid":"https://orcid.org/0000-0001-8330-2204"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]},{"id":"https://openalex.org/I150229711","display_name":"University of Electronic Science and Technology of China","ror":"https://ror.org/04qr3zq92","country_code":"CN","type":"education","lineage":["https://openalex.org/I150229711"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Tao Shen","raw_affiliation_strings":["School of Computer Science and Technology, Tongji University, Shanghai, China","Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]},{"raw_affiliation_string":"Center for Future Media and School of Computer Science and Engineering, University of Electronic Science and Technology of China, Chengdu, China","institution_ids":["https://openalex.org/I150229711"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5043867916"],"corresponding_institution_ids":["https://openalex.org/I116953780","https://openalex.org/I150229711"],"apc_list":null,"apc_paid":null,"fwci":6.8844,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.96663822,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"27","issue":null,"first_page":"7380","last_page":"7391"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9575999975204468,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13702","display_name":"Machine Learning in Healthcare","score":0.9575999975204468,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11775","display_name":"COVID-19 diagnosis using AI","score":0.9147999882698059,"subfield":{"id":"https://openalex.org/subfields/2741","display_name":"Radiology, Nuclear Medicine and Imaging"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.911300003528595,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7884110808372498},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.48687997460365295},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4655372202396393},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.45687615871429443},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33284151554107666}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7884110808372498},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.48687997460365295},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4655372202396393},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.45687615871429443},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33284151554107666}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3599076","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3599076","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.5199999809265137}],"awards":[{"id":"https://openalex.org/G3626616767","display_name":null,"funder_award_id":"62476201","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5347999826","display_name":null,"funder_award_id":"62222203","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":34,"referenced_works":["https://openalex.org/W1578800471","https://openalex.org/W1861492603","https://openalex.org/W2277195237","https://openalex.org/W2591669147","https://openalex.org/W2962735233","https://openalex.org/W3111984153","https://openalex.org/W3119635706","https://openalex.org/W3203255241","https://openalex.org/W4307232305","https://openalex.org/W4312933868","https://openalex.org/W4322730934","https://openalex.org/W4323338370","https://openalex.org/W4386038408","https://openalex.org/W4386076314","https://openalex.org/W4387968696","https://openalex.org/W4389519587","https://openalex.org/W4389523832","https://openalex.org/W4391287688","https://openalex.org/W4393160204","https://openalex.org/W4400647053","https://openalex.org/W4400810332","https://openalex.org/W4402670231","https://openalex.org/W4402671548","https://openalex.org/W4402683883","https://openalex.org/W4402704633","https://openalex.org/W4402726945","https://openalex.org/W4402727764","https://openalex.org/W4402727851","https://openalex.org/W4402753774","https://openalex.org/W4404544903","https://openalex.org/W4404784276","https://openalex.org/W4405596328","https://openalex.org/W4410536678","https://openalex.org/W4414198367"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W4387369504","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Despite":[0],"demonstrating":[1],"impressive":[2],"capabilities":[3],"in":[4,55,117,203],"comprehending":[5],"multi-modal":[6],"contexts,":[7],"large":[8],"vision-language":[9],"models":[10,73,145],"(LVLMs)":[11],"are":[12],"invariably":[13],"prone":[14],"to":[15,86,161,192],"generate":[16],"unreliable":[17],"answers,":[18],"i.e.,":[19],"hallucinations.":[20,87],"Existing":[21],"methods":[22,39],"mainly":[23],"mitigate":[24,200],"this":[25,90,152],"hallucination":[26],"by":[27,58,138,184],"introducing":[28],"specific":[29],"designed":[30],"datasets":[31,47],"or":[32],"employing":[33],"contrastive":[34],"decoding":[35],"techniques.":[36],"However,":[37],"these":[38],"heavily":[40],"rely":[41],"on":[42,60,151,216],"the":[43,52,72,77,132,140,147,157,163,174],"quality":[44],"of":[45,177],"constructed":[46],"and":[48,63,146,169,180,199],"negative":[49],"samples,":[50],"overlooking":[51],"inherent":[53],"ambiguity":[54],"reasoning":[56,67,134,164,185],"caused":[57],"over-reliance":[59],"linguistic":[61],"priors":[62],"data":[64],"complexity,":[65],"termed":[66],"uncertainty.":[68],"This":[69],"oversight":[70],"hinders":[71],"from":[74,119],"effectively":[75],"identifying":[76],"causal":[78,133,144],"relationships":[79,135],"behind":[80],"each":[81],"token,":[82],"increasing":[83],"their":[84],"susceptibility":[85],"To":[88],"address":[89],"issue,":[91],"we":[92,129,154,187],"propose":[93],"a":[94],"novel":[95],"framework":[96],"named":[97],"<bold":[98,103,108],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[99,101,104,106,109,111],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">R</b><italic":[100,110],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">easoning</i>":[102],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">U</b><italic":[105],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">ncertainty-guided</i>":[107],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">efinement":[112],"(RUR)</i>":[113],"for":[114],"mitigating":[115],"hallucinations":[116,202],"LVLMs":[118],"an":[120],"uncertainty":[121,126,165,198],"perspective.":[122],"Specifically,":[123],"unlike":[124],"conventional":[125],"quantification":[127],"methods,":[128],"first":[130],"extract":[131],"between":[136,142],"tokens":[137,179,195],"exploiting":[139],"link":[141],"structural":[143],"Transformer":[148],"architecture.":[149],"Based":[150],"relationship,":[153],"then":[155],"employ":[156],"Subjective":[158],"Logic":[159],"principle":[160],"model":[162],"at":[166],"both":[167],"token":[168],"sentence":[170],"levels,":[171],"which":[172],"reflects":[173],"unreliability":[175],"degree":[176],"generated":[178],"sentences.":[181,204],"Finally,":[182],"guided":[183],"uncertainty,":[186],"develop":[188],"multi-level":[189],"uncertainty-based":[190],"adjustment":[191],"eliminate":[193],"deceptive":[194],"exhibiting":[196],"severe":[197],"potential":[201],"Extensive":[205],"experiments":[206],"demonstrate":[207],"that":[208],"our":[209],"RUR":[210],"method":[211],"consistently":[212],"achieves":[213],"state-of-the-art":[214],"performance":[215],"five":[217],"benchmarks.":[218]},"counts_by_year":[{"year":2026,"cited_by_count":3}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
