{"id":"https://openalex.org/W4416798407","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249178","title":"NE-PADD: Leveraging Named Entity Knowledge for Robust Partial Audio Deepfake Detection via Attention Aggregation","display_name":"NE-PADD: Leveraging Named Entity Knowledge for Robust Partial Audio Deepfake Detection via Attention Aggregation","publication_year":2025,"publication_date":"2025-10-22","ids":{"openalex":"https://openalex.org/W4416798407","doi":"https://doi.org/10.1109/apsipaasc65261.2025.11249178"},"language":null,"primary_location":{"id":"doi:10.1109/apsipaasc65261.2025.11249178","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120619678","display_name":"Huhong Xian","orcid":null},"institutions":[{"id":"https://openalex.org/I2722730","display_name":"Inner Mongolia University","ror":"https://ror.org/0106qb496","country_code":"CN","type":"education","lineage":["https://openalex.org/I2722730"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Huhong Xian","raw_affiliation_strings":["Inner Mongolia University,Hohhot,China"],"affiliations":[{"raw_affiliation_string":"Inner Mongolia University,Hohhot,China","institution_ids":["https://openalex.org/I2722730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100448456","display_name":"Rui Liu","orcid":"https://orcid.org/0000-0002-2967-6296"},"institutions":[{"id":"https://openalex.org/I2722730","display_name":"Inner Mongolia University","ror":"https://ror.org/0106qb496","country_code":"CN","type":"education","lineage":["https://openalex.org/I2722730"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Liu","raw_affiliation_strings":["Inner Mongolia University,Hohhot,China"],"affiliations":[{"raw_affiliation_string":"Inner Mongolia University,Hohhot,China","institution_ids":["https://openalex.org/I2722730"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001303929","display_name":"Berrak \u015ei\u015fman","orcid":"https://orcid.org/0000-0001-8078-3305"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]},{"id":"https://openalex.org/I4210098364","display_name":"Institute for Language and Speech Processing","ror":"https://ror.org/00z24kr14","country_code":"GR","type":"nonprofit","lineage":["https://openalex.org/I4210098364"]}],"countries":["GR","US"],"is_corresponding":false,"raw_author_name":"Berrak Sisman","raw_affiliation_strings":["Johns Hopkins University,Center for Language and Speech Processing (CLSP),USA"],"affiliations":[{"raw_affiliation_string":"Johns Hopkins University,Center for Language and Speech Processing (CLSP),USA","institution_ids":["https://openalex.org/I4210098364","https://openalex.org/I145311948"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5032690182","display_name":"Haizhou Li","orcid":"https://orcid.org/0000-0001-9158-9401"},"institutions":[{"id":"https://openalex.org/I4210116924","display_name":"Chinese University of Hong Kong, Shenzhen","ror":"https://ror.org/02d5ks197","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633","https://openalex.org/I180726961","https://openalex.org/I4210116924"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haizhou Li","raw_affiliation_strings":["School of Artificial Intelligence, The Chinese University of Hong Kong,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, The Chinese University of Hong Kong,Shenzhen,China","institution_ids":["https://openalex.org/I4210116924"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5120619678"],"corresponding_institution_ids":["https://openalex.org/I2722730"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.2069717,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2199","last_page":"2204"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.26019999384880066,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.26019999384880066,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.2046000063419342,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.05689999833703041,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.6955000162124634},{"id":"https://openalex.org/keywords/entity-linking","display_name":"Entity linking","score":0.6428999900817871},{"id":"https://openalex.org/keywords/named-entity-recognition","display_name":"Named-entity recognition","score":0.6398000121116638},{"id":"https://openalex.org/keywords/named-entity","display_name":"Named entity","score":0.47769999504089355},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.3953000009059906}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8765000104904175},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.6955000162124634},{"id":"https://openalex.org/C96711827","wikidata":"https://www.wikidata.org/wiki/Q17012245","display_name":"Entity linking","level":3,"score":0.6428999900817871},{"id":"https://openalex.org/C2779135771","wikidata":"https://www.wikidata.org/wiki/Q403574","display_name":"Named-entity recognition","level":3,"score":0.6398000121116638},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5315999984741211},{"id":"https://openalex.org/C2777889803","wikidata":"https://www.wikidata.org/wiki/Q25047676","display_name":"Named entity","level":2,"score":0.47769999504089355},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.46230000257492065},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.3953000009059906},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.36739999055862427},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36320000886917114},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.33059999346733093},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.30410000681877136},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.2978000044822693},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/apsipaasc65261.2025.11249178","is_oa":false,"landing_page_url":"https://doi.org/10.1109/apsipaasc65261.2025.11249178","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Asia Pacific Signal and Information Processing Association Annual Summit and Conference (APSIPA ASC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2519091744","https://openalex.org/W2964243274","https://openalex.org/W3095918555","https://openalex.org/W3163475957","https://openalex.org/W3163596559","https://openalex.org/W3196774886","https://openalex.org/W3197457172","https://openalex.org/W3200876013","https://openalex.org/W3201773091","https://openalex.org/W4221141917","https://openalex.org/W4225939199","https://openalex.org/W4313306150","https://openalex.org/W4372259784","https://openalex.org/W4372260053","https://openalex.org/W4375869244","https://openalex.org/W4385245566","https://openalex.org/W4392903271","https://openalex.org/W4402112367","https://openalex.org/W4408345868","https://openalex.org/W4408346014","https://openalex.org/W4408353590"],"related_works":[],"abstract_inverted_index":{"Different":[0],"from":[1,34,107,123],"traditional":[2],"sentence-level":[3],"audio":[4,9,60],"deepfake":[5,10,61],"detection":[6,11,62],"(ADD),":[7],"partial":[8,59],"(PADD)":[12],"requires":[13],"frame-level":[14],"positioning":[15],"of":[16,19,68,153,172],"the":[17,143,154,170],"location":[18],"fake":[20],"speech.":[21],"While":[22],"some":[23],"progress":[24],"has":[25],"been":[26],"made":[27],"in":[28,130],"this":[29,44],"area,":[30],"leveraging":[31],"semantic":[32],"information":[33],"audio,":[35],"especially":[36],"named":[37,54,92,132,174],"entities,":[38],"remains":[39],"an":[40,120,137],"underexplored":[41],"aspect.":[42],"To":[43],"end,":[45],"we":[46,80],"propose":[47],"a":[48,149],"novel":[49],"method,":[50],"NE-PADD,":[51],"which":[52],"leverages":[53],"entity":[55,93,133,175],"knowledge":[56,176],"for":[57,111],"robust":[58,98],"through":[63],"attention":[64,83,106,125,156],"aggregation.":[65],"NE-PADD":[66],"consists":[67],"two":[69,82,155],"parallel":[70],"branches:":[71],"Speech":[72],"Named":[73],"Entity":[74],"Recognition":[75],"(SpeechNER)":[76],"and":[77,109,147,168],"PADD.":[78,178],"Specifically,":[79],"introduce":[81],"aggregation":[84,157],"mechanisms":[85],"to":[86,127],"help":[87],"PADD":[88,99,110,129],"models":[89],"better":[90],"understand":[91],"knowledge,":[94],"thus":[95],"achieving":[96],"more":[97,112],"performance.":[100],"(1)":[101],"Attention":[102,116],"Fusion":[103],"(AF)":[104],"combines":[105],"SpeechNER":[108],"accurate":[113],"weights.":[114],"(2)":[115],"Transfer":[117],"(AT)":[118],"uses":[119],"auxiliary":[121],"loss":[122],"their":[124],"distributions":[126],"guide":[128],"learning":[131],"semantics.":[134],"We":[135],"construct":[136],"appropriative":[138],"PartialSpoofNER":[139],"dataset":[140,146],"based":[141],"on":[142],"existing":[144],"PartialSpoof":[145],"conduct":[148],"detailed":[150],"comparative":[151],"analysis":[152],"methods.":[158],"Experiments":[159],"demonstrate":[160],"that":[161],"our":[162],"method":[163],"exceeds":[164],"all":[165],"advanced":[166],"baselines":[167],"demonstrates":[169],"effectiveness":[171],"fusing":[173],"during":[177],"The":[179],"code":[180],"is":[181],"available":[182],"at":[183],"https://github.com/AI-S2-Lab/NE-PADD.":[184]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-11-28T00:00:00"}
