{"id":"https://openalex.org/W4399418571","doi":"https://doi.org/10.1145/3652583.3657600","title":"Enhancing Cheapfake Detection: An Approach Using Prompt Engineering and Interleaved Text-Image Model","display_name":"Enhancing Cheapfake Detection: An Approach Using Prompt Engineering and Interleaved Text-Image Model","publication_year":2024,"publication_date":"2024-05-30","ids":{"openalex":"https://openalex.org/W4399418571","doi":"https://doi.org/10.1145/3652583.3657600"},"language":"en","primary_location":{"id":"doi:10.1145/3652583.3657600","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3657600","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3657600","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3657600","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103159113","display_name":"Dang Vu","orcid":"https://orcid.org/0009-0003-3268-024X"},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":true,"raw_author_name":"Dang Vu","raw_affiliation_strings":["University of Science &amp; Vietnam National University, Ho Chi Minh City, Vietnam"],"raw_orcid":"https://orcid.org/0009-0003-3268-024X","affiliations":[{"raw_affiliation_string":"University of Science &amp; Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032725043","display_name":"M. L. Nguyen","orcid":"https://orcid.org/0009-0008-3746-389X"},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Minh-Nhat Nguyen","raw_affiliation_strings":["University of Science &amp; Vietnam National University, Ho Chi Minh City, Vietnam"],"raw_orcid":"https://orcid.org/0009-0008-3746-389X","affiliations":[{"raw_affiliation_string":"University of Science &amp; Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5083265206","display_name":"Quoc-Trung Nguyen","orcid":"https://orcid.org/0009-0001-5959-6107"},"institutions":[{"id":"https://openalex.org/I123565023","display_name":"Vietnam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38","country_code":"VN","type":"education","lineage":["https://openalex.org/I123565023"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Quoc-Trung Nguyen","raw_affiliation_strings":["University of Science &amp; Vietnam National University, Ho Chi Minh City, Vietnam"],"raw_orcid":"https://orcid.org/0009-0001-5959-6107","affiliations":[{"raw_affiliation_string":"University of Science &amp; Vietnam National University, Ho Chi Minh City, Vietnam","institution_ids":["https://openalex.org/I123565023"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5103159113"],"corresponding_institution_ids":["https://openalex.org/I123565023"],"apc_list":null,"apc_paid":null,"fwci":5.3722,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":{"value":0.95200678,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1306","last_page":"1311"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9972000122070312,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8081092238426208},{"id":"https://openalex.org/keywords/misinformation","display_name":"Misinformation","score":0.7472079992294312},{"id":"https://openalex.org/keywords/closed-captioning","display_name":"Closed captioning","score":0.6788045167922974},{"id":"https://openalex.org/keywords/transparency","display_name":"Transparency (behavior)","score":0.591235876083374},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5467939376831055},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5029510855674744},{"id":"https://openalex.org/keywords/social-media","display_name":"Social media","score":0.48542556166648865},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.48129311203956604},{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.44450801610946655},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.42019781470298767},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3671446442604065},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.33052313327789307},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32911941409111023},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.26738181710243225},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.18700039386749268}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8081092238426208},{"id":"https://openalex.org/C2776990098","wikidata":"https://www.wikidata.org/wiki/Q13579947","display_name":"Misinformation","level":2,"score":0.7472079992294312},{"id":"https://openalex.org/C157657479","wikidata":"https://www.wikidata.org/wiki/Q2367247","display_name":"Closed captioning","level":3,"score":0.6788045167922974},{"id":"https://openalex.org/C2780233690","wikidata":"https://www.wikidata.org/wiki/Q535347","display_name":"Transparency (behavior)","level":2,"score":0.591235876083374},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5467939376831055},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5029510855674744},{"id":"https://openalex.org/C518677369","wikidata":"https://www.wikidata.org/wiki/Q202833","display_name":"Social media","level":2,"score":0.48542556166648865},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.48129311203956604},{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.44450801610946655},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.42019781470298767},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3671446442604065},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.33052313327789307},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32911941409111023},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.26738181710243225},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.18700039386749268},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3652583.3657600","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3657600","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3657600","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3652583.3657600","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3652583.3657600","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3652583.3657600","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2024 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320322308","display_name":"KU Leuven","ror":"https://ror.org/05f950310"},{"id":"https://openalex.org/F4320326592","display_name":"Viet Nam National University Ho Chi Minh City","ror":"https://ror.org/00waaqh38"},{"id":"https://openalex.org/F4320335839","display_name":"National Institute of Information and Communications Technology","ror":"https://ror.org/016bgq349"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399418571.pdf","grobid_xml":"https://content.openalex.org/works/W4399418571.grobid-xml"},"referenced_works_count":12,"referenced_works":["https://openalex.org/W3042631625","https://openalex.org/W3136860328","https://openalex.org/W4212774754","https://openalex.org/W4225323055","https://openalex.org/W4283511515","https://openalex.org/W4304092670","https://openalex.org/W4304098634","https://openalex.org/W4309589453","https://openalex.org/W4384833492","https://openalex.org/W4384833574","https://openalex.org/W4399418452","https://openalex.org/W6821254711"],"related_works":["https://openalex.org/W4210416330","https://openalex.org/W3164229987","https://openalex.org/W3215212336","https://openalex.org/W4290852288","https://openalex.org/W3217388757","https://openalex.org/W3122720459","https://openalex.org/W4298897568","https://openalex.org/W4289422896","https://openalex.org/W1938708284","https://openalex.org/W4380190185"],"abstract_inverted_index":{"Misinformation":[0],"is":[1,20,26],"a":[2,49,86,108],"widespread":[3],"problem":[4],"in":[5],"the":[6,14,53,59,123],"wake":[7],"of":[8,13,18,58,114],"flourishing":[9],"social":[10],"media.":[11],"One":[12],"most":[15],"common":[16],"forms":[17],"misinformation":[19],"cheapfakes":[21,47,75],"-":[22,76],"multimedia":[23],"content":[24],"that":[25,89],"manipulated":[27],"with":[28,72,78,97],"simple":[29],"techniques":[30],"such":[31],"as":[32],"miscaptioning":[33],"to":[34,41,52],"create":[35],"misleading":[36,79],"or":[37,80],"false":[38],"narratives.":[39],"Due":[40],"their":[42],"simplicity":[43],"and":[44,56,134],"appealing":[45],"nature,":[46],"pose":[48],"formidable":[50],"threat":[51],"reliability,":[54],"transparency":[55],"integrity":[57],"Internet.":[60],"The":[61],"ACM":[62],"ICMR":[63],"2024":[64],"Grand":[65],"Challenge":[66],"on":[67,101,107],"Detecting":[68],"Cheapfakes":[69],"tasks":[70],"participants":[71],"detecting":[73],"out-of-context":[74],"images":[77],"irrelevant":[81],"captions.":[82],"This":[83],"paper":[84],"introduces":[85],"lightweight":[87],"approach":[88],"enhances":[90],"cheapfake":[91],"detection":[92],"by":[93],"combining":[94],"Prompt":[95],"Engineering":[96],"image":[98],"captioning":[99],"running":[100],"an":[102,112],"interleaved":[103],"image-text":[104],"model.":[105],"Testing":[106],"public":[109],"dataset":[110],"gives":[111],"accuracy":[113],"82.9%.":[115],"Despite":[116],"its":[117],"modest":[118],"accuracy,":[119],"our":[120],"method":[121],"demonstrates":[122],"potential":[124],"for":[125,131],"applying":[126],"better":[127],"mixed-media":[128],"learning":[129],"models":[130],"context":[132],"understanding":[133],"Visual":[135],"Question":[136],"Answering.":[137]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
