{"id":"https://openalex.org/W4391766598","doi":"https://doi.org/10.48550/arxiv.2402.06304","title":"A New Approach to Voice Authenticity","display_name":"A New Approach to Voice Authenticity","publication_year":2024,"publication_date":"2024-02-09","ids":{"openalex":"https://openalex.org/W4391766598","doi":"https://doi.org/10.48550/arxiv.2402.06304"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2402.06304","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.06304","pdf_url":"https://arxiv.org/pdf/2402.06304","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2402.06304","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064235660","display_name":"Nicolas M. M\u00fcller","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"M\u00fcller, Nicolas M.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032526628","display_name":"Piotr Kawa","orcid":"https://orcid.org/0000-0002-2025-0547"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kawa, Piotr","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045272769","display_name":"Shen Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Shen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5093917312","display_name":"Matthias Neu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Neu, Matthias","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113469351","display_name":"Jennifer Williams","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Williams, Jennifer","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011742469","display_name":"Philip Sperl","orcid":"https://orcid.org/0000-0002-7901-7168"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sperl, Philip","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5091848694","display_name":"Konstantin B\u00f6ttinger","orcid":"https://orcid.org/0000-0002-9337-7506"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"B\u00f6ttinger, Konstantin","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5064235660"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.8644000291824341,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.8644000291824341,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.43060630559921265},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.39861011505126953},{"id":"https://openalex.org/keywords/communication","display_name":"Communication","score":0.32388609647750854},{"id":"https://openalex.org/keywords/aesthetics","display_name":"Aesthetics","score":0.32026195526123047},{"id":"https://openalex.org/keywords/sociology","display_name":"Sociology","score":0.308623731136322},{"id":"https://openalex.org/keywords/art","display_name":"Art","score":0.24821266531944275},{"id":"https://openalex.org/keywords/philosophy","display_name":"Philosophy","score":0.1393449902534485}],"concepts":[{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.43060630559921265},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.39861011505126953},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.32388609647750854},{"id":"https://openalex.org/C107038049","wikidata":"https://www.wikidata.org/wiki/Q35986","display_name":"Aesthetics","level":1,"score":0.32026195526123047},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.308623731136322},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.24821266531944275},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.1393449902534485}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2402.06304","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.06304","pdf_url":"https://arxiv.org/pdf/2402.06304","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},{"id":"doi:10.48550/arxiv.2402.06304","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2402.06304","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2402.06304","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2402.06304","pdf_url":"https://arxiv.org/pdf/2402.06304","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320331012","display_name":"Bayerische Staatsministerium f\u00fcr Wirtschaft, Landesentwicklung und Energie","ror":null},{"id":"https://openalex.org/F4320337041","display_name":"Department of Artificial Intelligence, Korea University","ror":null}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4391766598.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2748952813","https://openalex.org/W2361156571","https://openalex.org/W2352945052","https://openalex.org/W2609183841","https://openalex.org/W2356786183","https://openalex.org/W2377200558","https://openalex.org/W2373944280","https://openalex.org/W2384031875","https://openalex.org/W2377618934","https://openalex.org/W2358230173"],"abstract_inverted_index":{"Voice":[0],"faking,":[1],"driven":[2],"primarily":[3],"by":[4],"recent":[5],"advances":[6],"in":[7,56,76,143],"text-to-speech":[8],"(TTS)":[9],"synthesis":[10,128],"technology,":[11],"poses":[12],"significant":[13],"societal":[14],"challenges.":[15],"Currently,":[16],"the":[17,57,98,144,176],"prevailing":[18],"assumption":[19],"is":[20,42,111,167],"that":[21,38,159,171],"unaltered":[22],"human":[23],"speech":[24,31,179],"can":[25,49,67,83],"be":[26,50,68],"considered":[27],"genuine,":[28],"while":[29],"fake":[30,164],"comes":[32],"from":[33,97],"TTS":[34,127],"synthesis.":[35],"We":[36,132],"argue":[37,158],"this":[39,89],"binary":[40,99],"distinction":[41],"oversimplified.":[43],"For":[44],"instance,":[45],"altered":[46],"playback":[47],"speeds":[48],"used":[51],"for":[52,72,147],"malicious":[53],"purposes,":[54],"like":[55,120],"'Drunken":[58],"Nancy":[59],"Pelosi'":[60],"incident.":[61],"Similarly,":[62],"editing":[63,82],"of":[64,101,178],"audio":[65,102,162],"clips":[66],"done":[69],"ethically,":[70],"e.g.,":[71],"brevity":[73],"or":[74,79,106,165],"summarization":[75],"news":[77],"reporting":[78],"podcasts,":[80],"but":[81],"also":[84],"create":[85],"misleading":[86],"narratives.":[87],"In":[88],"paper,":[90],"we":[91,149,157],"propose":[92],"a":[93,138,168],"conceptual":[94],"shift":[95],"away":[96],"paradigm":[100],"being":[103],"either":[104],"'fake'":[105],"'real'.":[107],"Instead,":[108],"our":[109],"focus":[110],"on":[112],"pinpointing":[113],"'voice":[114],"edits',":[115],"which":[116,148],"encompass":[117],"traditional":[118],"modifications":[119],"filters":[121],"and":[122,129,136],"cuts,":[123],"as":[124,126,163],"well":[125],"VC":[130],"systems.":[131,153],"delineate":[133],"6":[134],"categories":[135],"curate":[137],"new":[139],"challenge":[140],"dataset":[141],"rooted":[142],"M-AILABS":[145],"corpus,":[146],"present":[150],"baseline":[151],"detection":[152],"And":[154],"most":[155],"importantly,":[156],"merely":[160],"categorizing":[161],"real":[166],"dangerous":[169],"over-simplification":[170],"will":[172],"fail":[173],"to":[174],"move":[175],"field":[177],"technology":[180],"forward.":[181]},"counts_by_year":[],"updated_date":"2026-03-10T16:38:18.471706","created_date":"2025-10-10T00:00:00"}
