{"id":"https://openalex.org/W7159674818","doi":"https://doi.org/10.48550/arxiv.2604.27875","title":"Frequency-Aware Semantic Fusion with Gated Injection for AI-generated Image Detection","display_name":"Frequency-Aware Semantic Fusion with Gated Injection for AI-generated Image Detection","publication_year":2026,"publication_date":"2026-04-30","ids":{"openalex":"https://openalex.org/W7159674818","doi":"https://doi.org/10.48550/arxiv.2604.27875"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.27875","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.27875","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.27875","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008993224","display_name":"Shuchang Zhou","orcid":"https://orcid.org/0000-0002-7294-5869"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhou, Shuchang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134941013","display_name":"Shangkun Wu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, Shangkun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134937438","display_name":"Jiwei Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Jiwei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134943956","display_name":"Ke Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Ke","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134986911","display_name":"Ran Ran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ran, Ran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134983842","display_name":"Caiyan Qin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Qin, Caiyan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134993010","display_name":"Yang Yang","orcid":"https://orcid.org/0000-0002-4833-8575"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5008993224"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.39719998836517334,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.39719998836517334,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.12409999966621399,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.12300000339746475,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.6241999864578247},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5745999813079834},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.538100004196167},{"id":"https://openalex.org/keywords/discriminator","display_name":"Discriminator","score":0.5285000205039978},{"id":"https://openalex.org/keywords/abstraction","display_name":"Abstraction","score":0.5091000199317932},{"id":"https://openalex.org/keywords/generalization","display_name":"Generalization","score":0.4729999899864197},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.46560001373291016},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.4578000009059906},{"id":"https://openalex.org/keywords/frequency-domain","display_name":"Frequency domain","score":0.4544999897480011},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.43810001015663147}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7904999852180481},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6434999704360962},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.6241999864578247},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5745999813079834},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.538100004196167},{"id":"https://openalex.org/C2779803651","wikidata":"https://www.wikidata.org/wiki/Q5282088","display_name":"Discriminator","level":3,"score":0.5285000205039978},{"id":"https://openalex.org/C124304363","wikidata":"https://www.wikidata.org/wiki/Q673661","display_name":"Abstraction","level":2,"score":0.5091000199317932},{"id":"https://openalex.org/C177148314","wikidata":"https://www.wikidata.org/wiki/Q170084","display_name":"Generalization","level":2,"score":0.4729999899864197},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.46560001373291016},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.4578000009059906},{"id":"https://openalex.org/C19118579","wikidata":"https://www.wikidata.org/wiki/Q786423","display_name":"Frequency domain","level":2,"score":0.4544999897480011},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.43810001015663147},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.42500001192092896},{"id":"https://openalex.org/C165064840","wikidata":"https://www.wikidata.org/wiki/Q1321061","display_name":"Matching (statistics)","level":2,"score":0.4081999957561493},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.38519999384880066},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.382099986076355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3580999970436096},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.35019999742507935},{"id":"https://openalex.org/C2221639","wikidata":"https://www.wikidata.org/wiki/Q2877","display_name":"Discrete cosine transform","level":3,"score":0.3449999988079071},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3294999897480011},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.31850001215934753},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.304500013589859},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.30059999227523804},{"id":"https://openalex.org/C2779010991","wikidata":"https://www.wikidata.org/wiki/Q2720909","display_name":"Artifact (error)","level":2,"score":0.2921999990940094},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C2911011789","wikidata":"https://www.wikidata.org/wiki/Q130741","display_name":"Hallucinating","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.2741999924182892},{"id":"https://openalex.org/C2776836416","wikidata":"https://www.wikidata.org/wiki/Q1364844","display_name":"False alarm","level":2,"score":0.26739999651908875},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.2619999945163727},{"id":"https://openalex.org/C2778493491","wikidata":"https://www.wikidata.org/wiki/Q7449072","display_name":"Semantic matching","level":3,"score":0.25839999318122864},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.2524999976158142},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.25119999051094055},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.25119999051094055}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.27875","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.27875","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.27875","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.27875","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"AI-generated":[0],"images":[1],"are":[2],"becoming":[3],"increasingly":[4],"realistic":[5],"and":[6,23,68,75,116,120,150,171,182],"diverse,":[7],"posing":[8],"significant":[9],"challenges":[10],"for":[11],"generalizable":[12,121],"detection.":[13],"While":[14],"Vision":[15],"Foundation":[16],"Models":[17],"(VFMs)":[18],"provide":[19],"rich":[20],"semantic":[21],"representations":[22],"frequency-based":[24],"methods":[25],"capture":[26],"complementary":[27],"artifact":[28],"cues,":[29],"existing":[30],"approaches":[31],"that":[32,102,177],"combine":[33],"these":[34,81],"modalities":[35],"still":[36],"suffer":[37],"from":[38],"limited":[39],"generalization,":[40],"with":[41,65,142,146,163],"notable":[42],"performance":[43,181],"degradation":[44],"on":[45,113],"unseen":[46],"generative":[47],"models.":[48],"We":[49,123],"attribute":[50],"this":[51],"limitation":[52],"to":[53,91,110,133,168],"two":[54],"key":[55],"factors:":[56],"frequency":[57,77,108,136],"shortcut":[58],"bias":[59],"toward":[60],"easily":[61],"distinguishable":[62],"cues":[63,137],"associated":[64],"specific":[66],"generators":[67],"cross-domain":[69],"representation":[70,152],"conflict":[71],"between":[72],"high-level":[73],"semantics":[74],"low-level":[76],"patterns.":[78],"To":[79],"address":[80],"issues,":[82],"we":[83,95,155],"propose":[84,156],"a":[85,97,126,157,164],"Frequency-aware":[86],"Gated":[87,128],"Injection":[88,130],"Network":[89],"(FGINet)":[90],"improve":[92],"generalization.":[93],"Specifically,":[94],"design":[96],"Band-Masked":[98],"Frequency":[99,129],"Encoder":[100],"(BMFE)":[101],"applies":[103],"cross-band":[104],"masking":[105],"in":[106],"the":[107,139],"domain":[109],"reduce":[111],"reliance":[112],"generator-specific":[114],"patterns":[115],"encourage":[117],"more":[118],"diverse":[119],"representations.":[122,173],"further":[124],"introduce":[125],"Layer-wise":[127],"(LGFI)":[131],"mechanism":[132],"progressively":[134],"inject":[135],"into":[138],"VFM":[140],"backbone":[141],"adaptive":[143],"gating,":[144],"aligning":[145],"its":[147],"hierarchical":[148],"abstraction":[149],"alleviating":[151],"conflict.":[153],"Moreover,":[154],"Hyperspherical":[158],"Compactness":[159],"Learning":[160],"(HCL)":[161],"framework":[162],"cosine":[165],"margin":[166],"objective":[167],"learn":[169],"compact":[170],"well-separated":[172],"Extensive":[174],"experiments":[175],"demonstrate":[176],"FGINet":[178],"achieves":[179],"state-of-the-art":[180],"strong":[183],"generalization":[184],"across":[185],"multiple":[186],"challenging":[187],"datasets.":[188]},"counts_by_year":[],"updated_date":"2026-05-02T06:10:54.344120","created_date":"2026-05-02T00:00:00"}
