{"id":"https://openalex.org/W4413146493","doi":"https://doi.org/10.1109/cvpr52734.2025.02782","title":"HalLoc: Token-level Localization of Hallucinations for Vision Language Models","display_name":"HalLoc: Token-level Localization of Hallucinations for Vision Language Models","publication_year":2025,"publication_date":"2025-06-10","ids":{"openalex":"https://openalex.org/W4413146493","doi":"https://doi.org/10.1109/cvpr52734.2025.02782"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr52734.2025.02782","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.02782","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028403649","display_name":"EunKyu Park","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Eunkyu Park","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067888301","display_name":"Minyeong Kim","orcid":"https://orcid.org/0000-0002-3207-4616"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Minyeong Kim","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100664729","display_name":"Gunhee Kim","orcid":"https://orcid.org/0000-0002-9543-7453"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Gunhee Kim","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5028403649"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":null,"apc_paid":null,"fwci":1.5558,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.85501061,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"29893","last_page":"29903"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10094","display_name":"Epilepsy research and treatment","score":0.92330002784729,"subfield":{"id":"https://openalex.org/subfields/2738","display_name":"Psychiatry and Mental health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}},"topics":[{"id":"https://openalex.org/T10094","display_name":"Epilepsy research and treatment","score":0.92330002784729,"subfield":{"id":"https://openalex.org/subfields/2738","display_name":"Psychiatry and Mental health"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7342202067375183},{"id":"https://openalex.org/keywords/security-token","display_name":"Security token","score":0.7078283429145813},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.47946298122406006},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.43851327896118164},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3312312960624695},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3311503827571869},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.2137000560760498}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7342202067375183},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.7078283429145813},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47946298122406006},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.43851327896118164},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3312312960624695},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3311503827571869},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2137000560760498}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr52734.2025.02782","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.02782","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.49000000953674316,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Hallucinations":[0],"pose":[1],"a":[2,65,113,143],"significant":[3],"challenge":[4],"to":[5,32,43],"the":[6,49,95,154],"reliability":[7,136],"of":[8,97,142,156],"large":[9],"vision-language":[10,157],"models,":[11,30],"making":[12],"their":[13],"detection":[14,23,123,147],"essential":[15],"for":[16,45,68,152],"ensuring":[17],"accuracy":[18],"in":[19,159],"critical":[20],"applications.":[21,161],"Current":[22],"methods":[24],"often":[25],"rely":[26],"on":[27,117],"computationally":[28],"intensive":[29],"leading":[31],"high":[33],"latency":[34],"and":[35,53,88,165],"resource":[36],"demands.":[37],"Their":[38],"definitive":[39],"outcomes":[40],"also":[41],"fail":[42],"account":[44],"real-world":[46,160],"scenarios":[47],"where":[48],"line":[50],"between":[51],"hallucinated":[52],"truthful":[54],"information":[55],"is":[56],"unclear.":[57],"To":[58],"address":[59],"these":[60],"issues,":[61],"we":[62,111],"propose":[63],"HalLoc,":[64,118],"dataset":[66,93,164],"designed":[67],"efficient,":[69],"probabilistic":[70],"hallucination":[71,80,122,146],"detection.":[72],"It":[73],"features":[74],"150K":[75],"token-level":[76],"annotated":[77],"samples,":[78],"including":[79],"types,":[81],"across":[82],"Visual":[83],"Question":[84],"Answering":[85],"(VQA),":[86],"instruction-following,":[87],"image":[89],"captioning":[90],"tasks.":[91],"This":[92],"facilitates":[94],"development":[96],"models":[98,158],"that":[99],"detect":[100],"hallucinations":[101],"with":[102],"graded":[103],"confidence,":[104],"enabling":[105],"more":[106],"informed":[107],"user":[108],"interactions.":[109],"Additionally,":[110],"introduce":[112],"baseline":[114],"model":[115,127],"trained":[116],"offering":[119],"low-overhead,":[120],"concurrent":[121],"during":[124],"generation.":[125],"The":[126,140,162],"can":[128],"be":[129],"seamlessly":[130],"integrated":[131],"into":[132],"existing":[133],"VLMs,":[134],"improving":[135],"while":[137],"preserving":[138],"efficiency.":[139],"prospect":[141],"robust":[144],"plug-and-play":[145],"module":[148],"opens":[149],"new":[150],"avenues":[151],"enhancing":[153],"trustworthiness":[155],"HalLoc":[163],"code":[166],"are":[167],"publicly":[168],"available":[169],"at:":[170],"https://github.com/dbsltm/cvpr25_halloc.":[171]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2025-12-28T23:10:05.387466","created_date":"2025-10-10T00:00:00"}
