{"id":"https://openalex.org/W4415428510","doi":"https://doi.org/10.3233/faia251285","title":"LAMM-ViT: AI Face Detection via Layer-Aware Modulation of Region-Guided Attention","display_name":"LAMM-ViT: AI Face Detection via Layer-Aware Modulation of Region-Guided Attention","publication_year":2025,"publication_date":"2025-10-21","ids":{"openalex":"https://openalex.org/W4415428510","doi":"https://doi.org/10.3233/faia251285"},"language":null,"primary_location":{"id":"doi:10.3233/faia251285","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251285","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"type":"book-chapter","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://doi.org/10.3233/faia251285","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5022437227","display_name":"Jun Zhang","orcid":"https://orcid.org/0000-0001-5168-9942"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jiangling Zhang","raw_affiliation_strings":["Wuhan University of Technology"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101177133","display_name":"Weijie Zhu","orcid":"https://orcid.org/0009-0000-0830-8331"},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weijie Zhu","raw_affiliation_strings":["Wuhan University of Technology"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109747583","display_name":"Jirui Huang","orcid":null},"institutions":[{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jirui Huang","raw_affiliation_strings":["Wuhan University of Technology"],"affiliations":[{"raw_affiliation_string":"Wuhan University of Technology","institution_ids":["https://openalex.org/I196699116"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003775716","display_name":"Yaxiong Chen","orcid":"https://orcid.org/0000-0002-2903-6723"},"institutions":[{"id":"https://openalex.org/I4210149102","display_name":"Sanya University","ror":"https://ror.org/04fa2qd52","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210149102"]},{"id":"https://openalex.org/I196699116","display_name":"Wuhan University of Technology","ror":"https://ror.org/03fe7t173","country_code":"CN","type":"education","lineage":["https://openalex.org/I196699116"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yaxiong Chen","raw_affiliation_strings":["Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya 572000, China","School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan 430070, China"],"affiliations":[{"raw_affiliation_string":"Sanya Science and Education Innovation Park, Wuhan University of Technology, Sanya 572000, China","institution_ids":["https://openalex.org/I4210149102","https://openalex.org/I196699116"]},{"raw_affiliation_string":"School of Computer Science and Artificial Intelligence, Wuhan University of Technology, Wuhan 430070, China","institution_ids":["https://openalex.org/I196699116"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5022437227"],"corresponding_institution_ids":["https://openalex.org/I196699116"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.66692059,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.7774999737739563,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10057","display_name":"Face and Expression Recognition","score":0.7774999737739563,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.7681999802589417,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.7024000287055969,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5131000280380249},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.47940000891685486},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4496000111103058},{"id":"https://openalex.org/keywords/facial-expression","display_name":"Facial expression","score":0.4302999973297119},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4228000044822693},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.41830000281333923},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.39969998598098755},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.3880999982357025}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7786999940872192},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6136999726295471},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5131000280380249},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.47940000891685486},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4537999927997589},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4496000111103058},{"id":"https://openalex.org/C195704467","wikidata":"https://www.wikidata.org/wiki/Q327968","display_name":"Facial expression","level":2,"score":0.4302999973297119},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4228000044822693},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.41830000281333923},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.39969998598098755},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.3880999982357025},{"id":"https://openalex.org/C123079801","wikidata":"https://www.wikidata.org/wiki/Q750240","display_name":"Modulation (music)","level":2,"score":0.3589000105857849},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3375999927520752},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.33239999413490295},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3224000036716461},{"id":"https://openalex.org/C4641261","wikidata":"https://www.wikidata.org/wiki/Q11681085","display_name":"Face detection","level":4,"score":0.3111000061035156},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.303600013256073},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2867000102996826},{"id":"https://openalex.org/C193415008","wikidata":"https://www.wikidata.org/wiki/Q639681","display_name":"Network architecture","level":2,"score":0.28139999508857727},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.28130000829696655},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.2808000147342682},{"id":"https://openalex.org/C194544171","wikidata":"https://www.wikidata.org/wiki/Q21105679","display_name":"Gating","level":2,"score":0.2736999988555908},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.26570001244544983},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.2603999972343445}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3233/faia251285","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251285","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},{"id":"pmh:doi:10.48550/arxiv.2505.07734","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"}],"best_oa_location":{"id":"doi:10.3233/faia251285","is_oa":true,"landing_page_url":"https://doi.org/10.3233/faia251285","pdf_url":null,"source":{"id":"https://openalex.org/S4210201731","display_name":"Frontiers in artificial intelligence and applications","issn_l":"0922-6389","issn":["0922-6389","1879-8314"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by-nc","license_id":"https://openalex.org/licenses/cc-by-nc","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Frontiers in Artificial Intelligence and Applications","raw_type":"book-chapter"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Detecting":[0],"AI-synthetic":[1],"faces":[2],"presents":[3],"a":[4,53],"critical":[5],"challenge:":[6],"it":[7],"is":[8,200],"hard":[9],"to":[10,83,91,186],"capture":[11,139],"consistent":[12],"structural":[13],"relationships":[14],"between":[15],"facial":[16,59,81,97],"regions":[17],"across":[18,95,132],"diverse":[19,147],"generation":[20,148],"techniques.":[21],"Current":[22],"methods,":[23],"which":[24],"focus":[25,131],"on":[26,115],"specific":[27],"artifacts":[28],"rather":[29],"than":[30],"fundamental":[31],"inconsistencies,":[32],"often":[33],"fail":[34],"when":[35],"confronted":[36],"with":[37],"novel":[38],"generative":[39],"models.":[40],"To":[41],"address":[42],"this":[43],"limitation,":[44],"we":[45],"introduce":[46],"Layer-aware":[47,71],"Mask":[48,72],"Modulation":[49,73],"Vision":[50,54],"Transformer":[51,55],"(LAMM-ViT),":[52],"designed":[56],"for":[57,191],"robust":[58],"forgery":[60,143],"detection.":[61],"This":[62,135],"model":[63,90],"integrates":[64],"distinct":[65],"Region-Guided":[66],"Multi-Head":[67],"Attention":[68],"(RG-MHA)":[69],"and":[70,111,153,173,188],"(LAMM)":[74],"components":[75],"within":[76],"each":[77],"layer.":[78],"RG-MHA":[79],"utilizes":[80],"landmarks":[82],"create":[84],"regional":[85,130],"attention":[86],"masks,":[87],"guiding":[88],"the":[89,100,122,138],"scrutinize":[92],"architectural":[93],"inconsistencies":[94],"different":[96],"areas.":[98],"Crucially,":[99],"separate":[101],"LAMM":[102],"module":[103],"dynamically":[104],"generates":[105],"layer-specific":[106],"parameters,":[107],"including":[108],"mask":[109],"weights":[110],"gating":[112],"values,":[113],"based":[114],"network":[116,133],"context.":[117],"These":[118,180],"parameters":[119],"then":[120],"modulate":[121],"behavior":[123],"of":[124,129,140],"RG-MHA,":[125],"enabling":[126],"adaptive":[127],"adjustment":[128],"depths.":[134],"architecture":[136],"facilitates":[137],"subtle,":[141],"hierarchical":[142],"cues":[144],"ubiquitous":[145],"among":[146],"techniques,":[149],"such":[150],"as":[151],"GANs":[152],"Diffusion":[154],"Models.":[155],"In":[156],"cross-model":[157],"generalization":[158],"tests,":[159],"LAMM-ViT":[160],"demonstrates":[161],"superior":[162],"performance,":[163],"achieving":[164],"94.09%":[165],"mean":[166,175],"ACC":[167],"(a":[168,177],"+5.45%":[169],"improvement":[170],"over":[171],"SoTA)":[172],"98.62%":[174],"AP":[176],"+3.09%":[178],"improvement).":[179],"results":[181],"demonstrate":[182],"LAMM-ViT\u2019s":[183],"exceptional":[184],"ability":[185],"generalize":[187],"its":[189],"potential":[190],"reliable":[192],"deployment":[193],"against":[194],"evolving":[195],"synthetic":[196],"media":[197],"threats.The":[198],"code":[199],"available":[201],"at":[202],"https://github.com/WHUT-ZJL/LAMM-ViT.":[203]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2025-10-24T00:00:00"}
