{"id":"https://openalex.org/W7151584744","doi":"https://doi.org/10.48550/arxiv.2604.04692","title":"Is a Picture Worth a Thousand Words? Adaptive Multimodal Fact-Checking with Visual Evidence Necessity","display_name":"Is a Picture Worth a Thousand Words? Adaptive Multimodal Fact-Checking with Visual Evidence Necessity","publication_year":2026,"publication_date":"2026-04-06","ids":{"openalex":"https://openalex.org/W7151584744","doi":"https://doi.org/10.48550/arxiv.2604.04692"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.04692","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04692","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.04692","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114337163","display_name":"Jaeyoon Jung","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jung, Jaeyoon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133144789","display_name":"Yejun Yoon","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoon, Yejun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5069120214","display_name":"Kunwoo Park","orcid":"https://orcid.org/0000-0003-2913-9711"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Park, Kunwoo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5114337163"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.661300003528595,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.661300003528595,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.07069999724626541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.04320000112056732,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6872000098228455},{"id":"https://openalex.org/keywords/multimodal-interaction","display_name":"Multimodal interaction","score":0.38530001044273376},{"id":"https://openalex.org/keywords/visual-attention","display_name":"Visual attention","score":0.3303999900817871},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.296999990940094},{"id":"https://openalex.org/keywords/interpretability","display_name":"Interpretability","score":0.2662999927997589},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.2621999979019165}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7224000096321106},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6872000098228455},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.489300012588501},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.42149999737739563},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.38530001044273376},{"id":"https://openalex.org/C2986089797","wikidata":"https://www.wikidata.org/wiki/Q6501338","display_name":"Visual attention","level":3,"score":0.3303999900817871},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3287000060081482},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3046000003814697},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.296999990940094},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2694999873638153},{"id":"https://openalex.org/C2781067378","wikidata":"https://www.wikidata.org/wiki/Q17027399","display_name":"Interpretability","level":2,"score":0.2662999927997589},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2621999979019165},{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.25769999623298645},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2547999918460846},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.2540000081062317}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.04692","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04692","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.04692","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.04692","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.5888186097145081,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Automated":[0],"fact-checking":[1,61],"is":[2,25,85],"a":[3,8,22,59,91],"crucial":[4],"task":[5],"that":[6,26,42,63,112],"supports":[7],"responsible":[9],"information":[10],"ecosystem.":[11],"While":[12],"recent":[13],"research":[14],"has":[15],"progressed":[16],"from":[17],"text-only":[18],"to":[19],"multimodal":[20,47,60],"fact-checking,":[21],"prevailing":[23],"assumption":[24,39],"incorporating":[27,113],"visual":[28,77,83,118],"evidence":[29,48,84,101,119],"universally":[30],"improves":[31],"performance.":[32,130],"In":[33],"this":[34,38,54],"work,":[35],"we":[36,56],"challenge":[37],"and":[40,90,102,136],"show":[41,111],"the":[43,73,99,103,114,122],"indiscriminate":[44],"use":[45,75],"of":[46,76,117],"can":[49],"reduce":[50],"accuracy.":[51],"To":[52],"address":[53],"challenge,":[55],"propose":[57],"AMuFC,":[58],"framework":[62],"employs":[64],"two":[65],"collaborative":[66],"vision-language":[67],"models":[68],"with":[69],"distinct":[70],"roles":[71],"for":[72,87],"adaptive":[74],"evidence:":[78],"an":[79],"Analyzer":[80],"determines":[81],"whether":[82],"necessary":[86],"claim":[88,94],"verification,":[89],"Verifier":[92],"predicts":[93],"veracity":[95],"conditioned":[96],"on":[97,108],"both":[98],"retrieved":[100],"Analyzer's":[104,115],"assessment.":[105],"Experimental":[106],"results":[107],"three":[109],"datasets":[110,137],"assessment":[116],"necessity":[120],"into":[121],"Verifier's":[123],"prediction":[124],"yields":[125],"substantial":[126],"improvements":[127],"in":[128],"verification":[129],"We":[131],"will":[132],"release":[133],"all":[134],"code":[135],"at":[138],"https://github.com/ssu-humane/AMuFC.":[139]},"counts_by_year":[],"updated_date":"2026-05-15T06:05:50.897203","created_date":"2026-04-08T00:00:00"}
