{"id":"https://openalex.org/W4405030341","doi":"https://doi.org/10.48550/arxiv.2411.19466","title":"ForgerySleuth: Empowering Multimodal Large Language Models for Image Manipulation Detection","display_name":"ForgerySleuth: Empowering Multimodal Large Language Models for Image Manipulation Detection","publication_year":2024,"publication_date":"2024-11-29","ids":{"openalex":"https://openalex.org/W4405030341","doi":"https://doi.org/10.48550/arxiv.2411.19466"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2411.19466","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.19466","pdf_url":"https://arxiv.org/pdf/2411.19466","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2411.19466","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102744130","display_name":"Zhihao Sun","orcid":"https://orcid.org/0009-0000-4018-6194"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sun, Zhihao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101694702","display_name":"Haoran Jiang","orcid":"https://orcid.org/0000-0002-1533-1887"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Haoran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076186276","display_name":"Haoran Chen","orcid":"https://orcid.org/0009-0006-1067-7391"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Haoran","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023326846","display_name":"Yixin Cao","orcid":"https://orcid.org/0000-0001-7157-6961"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Yixin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044665993","display_name":"Xipeng Qiu","orcid":"https://orcid.org/0000-0001-7163-5247"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qiu, Xipeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026167547","display_name":"Zuxuan Wu","orcid":"https://orcid.org/0000-0002-8689-5807"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Zuxuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5047962986","display_name":"Yu\u2013Gang Jiang","orcid":"https://orcid.org/0000-0002-1907-8567"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiang, Yu-Gang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5102744130"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9133999943733215,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9133999943733215,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5752837061882019},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.5546688437461853},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48191550374031067},{"id":"https://openalex.org/keywords/image-manipulation","display_name":"Image manipulation","score":0.4780583679676056},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.45971420407295227},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.4150083661079407}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5752837061882019},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.5546688437461853},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48191550374031067},{"id":"https://openalex.org/C2987933465","wikidata":"https://www.wikidata.org/wiki/Q141130","display_name":"Image manipulation","level":3,"score":0.4780583679676056},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.45971420407295227},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4150083661079407}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2411.19466","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.19466","pdf_url":"https://arxiv.org/pdf/2411.19466","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2411.19466","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2411.19466","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2411.19466","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2411.19466","pdf_url":"https://arxiv.org/pdf/2411.19466","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G37568934","display_name":null,"funder_award_id":"Grant","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Multimodal":[0],"large":[1],"language":[2],"models":[3],"have":[4],"unlocked":[5],"new":[6],"possibilities":[7],"for":[8,98],"various":[9],"multimodal":[10],"tasks.":[11],"However,":[12],"their":[13],"potential":[14],"in":[15,118],"image":[16,83],"manipulation":[17,84],"detection":[18,85],"remains":[19],"unexplored.":[20],"When":[21],"directly":[22],"applied":[23],"to":[24,48,80,93],"the":[25,67,71,82,99,106],"IMD":[26],"task,":[27],"M-LLMs":[28,47],"often":[29],"produce":[30],"reasoning":[31,78],"texts":[32],"that":[33,60,112],"suffer":[34],"from":[35],"hallucinations":[36],"and":[37,53,77,110,121],"overthinking.":[38],"To":[39],"address":[40],"this,":[41],"we":[42,65],"propose":[43],"ForgerySleuth,":[44],"which":[45,74],"leverages":[46],"perform":[49],"comprehensive":[50],"clue":[51],"fusion":[52],"generate":[54],"segmentation":[55],"outputs":[56],"indicating":[57],"specific":[58],"regions":[59],"are":[61],"tampered":[62],"with.":[63],"Moreover,":[64],"construct":[66],"ForgeryAnalysis":[68,109],"dataset":[69,97],"through":[70],"Chain-of-Clues":[72],"prompt,":[73],"includes":[75],"analysis":[76],"text":[79],"upgrade":[81],"task.":[86],"A":[87],"data":[88],"engine":[89],"is":[90],"also":[91],"introduced":[92],"build":[94],"a":[95],"larger-scale":[96],"pre-training":[100],"phase.":[101],"Our":[102],"extensive":[103],"experiments":[104],"demonstrate":[105],"effectiveness":[107],"of":[108],"show":[111],"ForgerySleuth":[113],"significantly":[114],"outperforms":[115],"existing":[116],"methods":[117],"generalization,":[119],"robustness,":[120],"explainability.":[122]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2024-12-05T00:00:00"}
