{"id":"https://openalex.org/W7131084170","doi":"https://doi.org/10.1109/iccvw69036.2025.00169","title":"Phoneme-Level Analysis for Person-of-Interest Speech Deepfake Detection","display_name":"Phoneme-Level Analysis for Person-of-Interest Speech Deepfake Detection","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W7131084170","doi":"https://doi.org/10.1109/iccvw69036.2025.00169"},"language":null,"primary_location":{"id":"doi:10.1109/iccvw69036.2025.00169","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00169","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Davide Salvi","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Davide Salvi","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Viola Negroni","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Viola Negroni","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Sara Mandelli","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Sara Mandelli","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Paolo Bestagini","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Paolo Bestagini","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"last","author":{"id":null,"display_name":"Stefano Tubaro","orcid":null},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Stefano Tubaro","raw_affiliation_strings":["Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy"],"affiliations":[{"raw_affiliation_string":"Politecnico di Milano,Dipartimento di Elettronica, Informazione e Bioingegneria (DEIB),Italy","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I93860229"],"apc_list":null,"apc_paid":null,"fwci":2.5147,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.93763658,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1597","last_page":"1606"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.25040000677108765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.25040000677108765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10775","display_name":"Generative Adversarial Networks and Image Synthesis","score":0.16410000622272491,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.15860000252723694,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.6686999797821045},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5745000243186951},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.5478000044822693},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.5446000099182129},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4609000086784363},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.4277999997138977},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.353300005197525}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7944999933242798},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.6686999797821045},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5745000243186951},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.5478000044822693},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.5446000099182129},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5228000283241272},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.47780001163482666},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4609000086784363},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.4277999997138977},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.374099999666214},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.353300005197525},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3357999920845032},{"id":"https://openalex.org/C204201278","wikidata":"https://www.wikidata.org/wiki/Q1332614","display_name":"Voice activity detection","level":3,"score":0.3206999897956848},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.3149000108242035},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.3124000132083893},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.3052999973297119},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.25429999828338623},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iccvw69036.2025.00169","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccvw69036.2025.00169","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision Workshops (ICCVW)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":42,"referenced_works":["https://openalex.org/W90720583","https://openalex.org/W1494198834","https://openalex.org/W2125534887","https://openalex.org/W2327501763","https://openalex.org/W2749090340","https://openalex.org/W2801514793","https://openalex.org/W2884483159","https://openalex.org/W2936802426","https://openalex.org/W2940385840","https://openalex.org/W3034530968","https://openalex.org/W3036198682","https://openalex.org/W3127781933","https://openalex.org/W3135809943","https://openalex.org/W3200527256","https://openalex.org/W3201773091","https://openalex.org/W4210730577","https://openalex.org/W4213449918","https://openalex.org/W4214876496","https://openalex.org/W4225527248","https://openalex.org/W4297841787","https://openalex.org/W4311591887","https://openalex.org/W4311737082","https://openalex.org/W4375869230","https://openalex.org/W4381708595","https://openalex.org/W4385466335","https://openalex.org/W4385801058","https://openalex.org/W4392910532","https://openalex.org/W4393170828","https://openalex.org/W4393372892","https://openalex.org/W4396785992","https://openalex.org/W4399556715","https://openalex.org/W4402111459","https://openalex.org/W4402915903","https://openalex.org/W4403331203","https://openalex.org/W4403791925","https://openalex.org/W4406803348","https://openalex.org/W4408054937","https://openalex.org/W4408353669","https://openalex.org/W4408354307","https://openalex.org/W4409369335","https://openalex.org/W4410815513","https://openalex.org/W4417054079"],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,130],"generative":[3],"AI":[4],"have":[5,28],"made":[6],"the":[7,55,78],"creation":[8],"of":[9,40,110],"speech":[10,24,71],"deepfakes":[11],"widely":[12],"accessible,":[13],"posing":[14],"serious":[15],"challenges":[16],"to":[17,88,119],"digital":[18],"trust.":[19],"To":[20],"counter":[21],"this,":[22],"various":[23],"deepfake":[25,72,147],"detection":[26,73,109],"strategies":[27],"been":[29],"proposed,":[30],"including":[31],"Person-of-Interest":[32],"(POI)":[33],"approaches,":[34],"which":[35],"focus":[36],"on":[37,135],"identifying":[38],"impersonations":[39],"specific":[41],"individuals":[42],"by":[43],"modeling":[44],"and":[45,61,126],"analyzing":[46],"their":[47,52],"unique":[48],"vocal":[49],"traits.":[50],"Despite":[51],"excellent":[53],"performance,":[54],"existing":[56],"methods":[57],"offer":[58],"limited":[59],"granularity":[60],"lack":[62],"interpretability.":[63],"In":[64,94],"this":[65,105,138],"work,":[66],"we":[67],"propose":[68],"a":[69,90,98,141],"POI-based":[70],"method":[74,115],"that":[75],"operates":[76],"at":[77],"phoneme":[79,136],"level.":[80],"Our":[81],"approach":[82],"decomposes":[83],"reference":[84],"audio":[85],"into":[86],"phonemes":[87,96],"construct":[89],"detailed":[91],"speaker":[92],"profile.":[93],"inference,":[95],"from":[97],"test":[99],"sample":[100],"are":[101],"individually":[102],"compared":[103],"against":[104],"profile,":[106],"enabling":[107],"fine-grained":[108],"synthetic":[111],"artifacts.":[112],"The":[113],"proposed":[114],"achieves":[116],"comparable":[117],"accuracy":[118],"traditional":[120],"approaches":[121],"while":[122],"offering":[123],"superior":[124],"robustness":[125],"interpretability,":[127],"key":[128],"aspects":[129],"multimedia":[131],"forensics.":[132],"By":[133],"focusing":[134],"analysis,":[137],"work":[139],"explores":[140],"novel":[142],"direction":[143],"for":[144],"explainable,":[145],"speaker-centric":[146],"detection.":[148]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-27T14:29:43.386196","created_date":"2025-12-10T00:00:00"}
