{"id":"https://openalex.org/W4405754882","doi":"https://doi.org/10.1109/metroxraine62247.2024.10795959","title":"Towards a Predictive Model of Speech Signatures: Insights from Spectral Analysis and Generative AI Models","display_name":"Towards a Predictive Model of Speech Signatures: Insights from Spectral Analysis and Generative AI Models","publication_year":2024,"publication_date":"2024-10-21","ids":{"openalex":"https://openalex.org/W4405754882","doi":"https://doi.org/10.1109/metroxraine62247.2024.10795959"},"language":"en","primary_location":{"id":"doi:10.1109/metroxraine62247.2024.10795959","is_oa":false,"landing_page_url":"https://doi.org/10.1109/metroxraine62247.2024.10795959","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Metrology for eXtended Reality, Artificial Intelligence and Neural Engineering (MetroXRAINE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004167892","display_name":"Stefano Regondi","orcid":"https://orcid.org/0000-0002-5335-3374"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Stefano Regondi","raw_affiliation_strings":["Nemo Lab"],"affiliations":[{"raw_affiliation_string":"Nemo Lab","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068979918","display_name":"Raffaele Pugliese","orcid":"https://orcid.org/0000-0001-7669-4457"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Raffaele Pugliese","raw_affiliation_strings":["Nemo Lab"],"affiliations":[{"raw_affiliation_string":"Nemo Lab","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5072968890","display_name":"Atieh Mahroo","orcid":"https://orcid.org/0000-0002-2962-3661"},"institutions":[{"id":"https://openalex.org/I4210155236","display_name":"National Research Council","ror":"https://ror.org/04zaypm56","country_code":"IT","type":"funder","lineage":["https://openalex.org/I4210155236"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Atieh Mahroo","raw_affiliation_strings":["Institute of Intelligent Industrial, Technologies and Systems for Advanced Manufacturing (STIIMA), National Research Council of Italy, (CNR)"],"affiliations":[{"raw_affiliation_string":"Institute of Intelligent Industrial, Technologies and Systems for Advanced Manufacturing (STIIMA), National Research Council of Italy, (CNR)","institution_ids":["https://openalex.org/I4210155236"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004167892"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21419641,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"782","last_page":"786"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9842000007629395,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9330000281333923,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9082000255584717,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6917538642883301},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6380123496055603},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4977741539478302},{"id":"https://openalex.org/keywords/spectral-analysis","display_name":"Spectral analysis","score":0.49722960591316223},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.49454209208488464},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4285365343093872},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.38233423233032227},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.05428719520568848}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6917538642883301},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6380123496055603},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4977741539478302},{"id":"https://openalex.org/C2983668108","wikidata":"https://www.wikidata.org/wiki/Q280453","display_name":"Spectral analysis","level":3,"score":0.49722960591316223},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.49454209208488464},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4285365343093872},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.38233423233032227},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.05428719520568848},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C32891209","wikidata":"https://www.wikidata.org/wiki/Q483666","display_name":"Spectroscopy","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/metroxraine62247.2024.10795959","is_oa":false,"landing_page_url":"https://doi.org/10.1109/metroxraine62247.2024.10795959","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Metrology for eXtended Reality, Artificial Intelligence and Neural Engineering (MetroXRAINE)","raw_type":"proceedings-article"},{"id":"pmh:oai:boa.unimib.it:10281/573625","is_oa":false,"landing_page_url":"https://hdl.handle.net/10281/573625","pdf_url":null,"source":{"id":"https://openalex.org/S4306401259","display_name":"BOA (University of Milano-Bicocca)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I66752286","host_organization_name":"University of Milano-Bicocca","host_organization_lineage":["https://openalex.org/I66752286"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/conferenceObject"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Gender equality","id":"https://metadata.un.org/sdg/5","score":0.4000000059604645}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W2088382258","https://openalex.org/W3137249133","https://openalex.org/W3217636171","https://openalex.org/W4200484186","https://openalex.org/W4211091296","https://openalex.org/W4214531455","https://openalex.org/W4295514200","https://openalex.org/W4307955901","https://openalex.org/W4311591823","https://openalex.org/W4377820918","https://openalex.org/W4382599495","https://openalex.org/W4384261732","https://openalex.org/W4386293515","https://openalex.org/W4392004446","https://openalex.org/W6748881466","https://openalex.org/W6783867762"],"related_works":["https://openalex.org/W4365211920","https://openalex.org/W3014948380","https://openalex.org/W4391584540","https://openalex.org/W4380551139","https://openalex.org/W4317695495","https://openalex.org/W4395044357","https://openalex.org/W4287117424","https://openalex.org/W4387506531","https://openalex.org/W2087346071","https://openalex.org/W2967848559"],"abstract_inverted_index":{"This":[0,204],"study":[1],"delves":[2],"into":[3],"a":[4,39,97],"comprehensive":[5],"analysis":[6,48],"and":[7,56,67,106,113,130,144,166,201,216],"identification":[8],"of":[9,16,49,53,59,89,101,118,133,168,190,198,220],"potential":[10],"vocal":[11,177],"cues":[12],"influencing":[13],"the":[14,28,57,87,128,149,152,188,196,207,218],"perception":[15,88],"authenticity":[17],"versus":[18],"artificiality":[19,92],"in":[20,93,142,148,181,211],"speech.":[21],"Our":[22],"primary":[23],"aim":[24,79],"is":[25,80],"to":[26,81,154],"pinpoint":[27],"pivotal":[29,83],"parameters":[30],"distinguishing":[31,103],"genuine":[32],"voices":[33,109,157],"from":[34,75,158],"artificially":[35,107],"synthesized":[36],"ones.":[37],"Employing":[38],"multifaceted":[40],"approach,":[41],"we":[42],"leverage":[43],"advanced":[44],"methodologies":[45],"encompassing":[46],"spectral":[47],"speech":[50],"signals,":[51],"discernment":[52],"prosodic":[54],"patterns,":[55],"application":[58],"cutting-edge":[60],"machine":[61],"learning":[62],"techniques":[63],"such":[64,172],"as":[65,173],"Hifi-GAN":[66],"generative":[68],"AI.":[69],"By":[70],"examining":[71],"voice":[72,135],"data":[73,202],"sourced":[74],"diverse":[76],"origins,":[77],"our":[78],"uncover":[82],"markers":[84],"that":[85],"impact":[86],"truthfulness":[90],"or":[91,176],"voices,":[94],"ultimately":[95],"constructing":[96],"predictive":[98],"model":[99],"capable":[100],"reliably":[102],"between":[104],"authentic":[105,156],"crafted":[108],"across":[110],"both":[111],"pathological":[112],"non-pathological":[114],"conditions.":[115],"The":[116],"culmination":[117],"this":[119,184],"research":[120,185],"holds":[121],"significant":[122],"implications":[123],"not":[124],"only":[125],"for":[126,139,209],"advancing":[127],"scientific":[129],"technological":[131],"understanding":[132],"human":[134],"distinctiveness":[136],"but":[137],"also":[138],"practical":[140],"applications":[141],"healthcare":[143,150,214],"security":[145,182,212],"domains.":[146],"Indeed,":[147],"field":[151],"ability":[153],"discern":[155],"artificial":[159],"ones":[160],"could":[161,186,205],"facilitate":[162],"more":[163],"accurate":[164],"diagnosis":[165],"monitoring":[167],"conditions":[169],"affecting":[170],"speech,":[171],"neurodegenerative":[174],"diseases":[175],"cord":[178],"disorders.":[179],"Additionally,":[180],"contexts,":[183],"enhance":[187],"reliability":[189,219],"voice-based":[191,221],"authentication":[192],"systems,":[193],"thereby":[194],"bolstering":[195,217],"integrity":[197],"sensitive":[199],"communications":[200],"transmission.":[203],"pave":[206],"way":[208],"advancements":[210],"protocols,":[213],"applications,":[215],"technologies.":[222]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
