{"id":"https://openalex.org/W3198730944","doi":"https://doi.org/10.21437/interspeech.2021-1610","title":"ADEPT: A Dataset for Evaluating Prosody Transfer","display_name":"ADEPT: A Dataset for Evaluating Prosody Transfer","publication_year":2021,"publication_date":"2021-08-27","ids":{"openalex":"https://openalex.org/W3198730944","doi":"https://doi.org/10.21437/interspeech.2021-1610","mag":"3198730944"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2021-1610","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-1610","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5083188961","display_name":"Alexandra Torresquintero","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alexandra Torresquintero","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038517086","display_name":"Tian Huey Teh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian Huey Teh","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087090605","display_name":"Christopher G. R. Wallis","orcid":"https://orcid.org/0000-0001-7383-4186"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Christopher G.R. Wallis","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008306627","display_name":"Marlene Staib","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Marlene Staib","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024033876","display_name":"Devang S Ram Mohan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Devang S. Ram Mohan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017825726","display_name":"Vivian Hu","orcid":"https://orcid.org/0000-0002-5548-9283"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vivian Hu","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068657700","display_name":"Lorenzo Foglianti","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lorenzo Foglianti","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5007377741","display_name":"Jiameng Gao","orcid":"https://orcid.org/0000-0003-4161-938X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jiameng Gao","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062516688","display_name":"Simon King","orcid":"https://orcid.org/0000-0002-2694-2843"},"institutions":[{"id":"https://openalex.org/I98677209","display_name":"University of Edinburgh","ror":"https://ror.org/01nrxwf90","country_code":"GB","type":"education","lineage":["https://openalex.org/I98677209"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Simon King","raw_affiliation_strings":["Papercup Technologies Ltd., United Kingdom","University of Edinburgh, United Kingdom"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Papercup Technologies Ltd., United Kingdom","institution_ids":[]},{"raw_affiliation_string":"University of Edinburgh, United Kingdom","institution_ids":["https://openalex.org/I98677209"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.4198,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.69827321,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"3880","last_page":"3884"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prosody","display_name":"Prosody","score":0.9509506821632385},{"id":"https://openalex.org/keywords/naturalness","display_name":"Naturalness","score":0.889567494392395},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7145721912384033},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6207827925682068},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5648623108863831},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5310397744178772},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.478400319814682},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4598570466041565},{"id":"https://openalex.org/keywords/sample","display_name":"Sample (material)","score":0.4271010458469391},{"id":"https://openalex.org/keywords/natural","display_name":"Natural (archaeology)","score":0.4151949882507324},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.06451457738876343}],"concepts":[{"id":"https://openalex.org/C542774811","wikidata":"https://www.wikidata.org/wiki/Q10880526","display_name":"Prosody","level":2,"score":0.9509506821632385},{"id":"https://openalex.org/C134537474","wikidata":"https://www.wikidata.org/wiki/Q17144832","display_name":"Naturalness","level":2,"score":0.889567494392395},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7145721912384033},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6207827925682068},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5648623108863831},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5310397744178772},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.478400319814682},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4598570466041565},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.4271010458469391},{"id":"https://openalex.org/C2776608160","wikidata":"https://www.wikidata.org/wiki/Q4785462","display_name":"Natural (archaeology)","level":2,"score":0.4151949882507324},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.06451457738876343},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/interspeech.2021-1610","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2021-1610","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2021","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.ed.ac.uk:publications/68da9bd1-92ac-4ca0-8eae-740225e5061a","is_oa":false,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/68da9bd1-92ac-4ca0-8eae-740225e5061a","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":24,"referenced_works":["https://openalex.org/W336605389","https://openalex.org/W2020738862","https://openalex.org/W2030438891","https://openalex.org/W2041771838","https://openalex.org/W2071138147","https://openalex.org/W2118657004","https://openalex.org/W2120847449","https://openalex.org/W2277581165","https://openalex.org/W2611773338","https://openalex.org/W2948238043","https://openalex.org/W2964138190","https://openalex.org/W2964243274","https://openalex.org/W2972473628","https://openalex.org/W2991417167","https://openalex.org/W3016021263","https://openalex.org/W3019748000","https://openalex.org/W3022876224","https://openalex.org/W3081488690","https://openalex.org/W3176247099","https://openalex.org/W3196843885","https://openalex.org/W4241454614","https://openalex.org/W4246892066","https://openalex.org/W4295731579","https://openalex.org/W4298304696"],"related_works":["https://openalex.org/W2029561777","https://openalex.org/W172797710","https://openalex.org/W3165080709","https://openalex.org/W2945105049","https://openalex.org/W4392904630","https://openalex.org/W169399214","https://openalex.org/W1949369849","https://openalex.org/W2621401062","https://openalex.org/W2054460271","https://openalex.org/W2312868712"],"abstract_inverted_index":{"Text-to-speech":[0],"is":[1,18],"now":[2],"able":[3,103],"to":[4,13,19,36,104,139],"achieve":[5],"near-human":[6],"naturalness":[7],"and":[8,54,79,82,92,109],"research":[9],"focus":[10],"has":[11],"shifted":[12],"increasing":[14],"expressivity.One":[15],"popular":[16],"method":[17,56],"transfer":[20,35,52,121],"the":[21,42,126,137],"prosody":[22,34,51,71,120,146],"from":[23],"a":[24,45,55,61,115,129],"reference":[25,65],"speech":[26,67],"sample.There":[27],"have":[28],"been":[29],"considerable":[30],"advances":[31],"in":[32],"using":[33,136],"generate":[37],"more":[38],"expressive":[39],"speech,":[40],"but":[41],"field":[43],"lacks":[44],"clear":[46],"definition":[47],"of":[48,63,131],"what":[49],"successful":[50],"means":[53],"for":[57,69],"measuring":[58],"it.We":[59],"introduce":[60],"dataset":[62],"prosodically-varied":[64],"natural":[66],"samples":[68,73],"evaluating":[70],"transfer.The":[72],"include":[74],"global":[75],"variations":[76,84,99],"reflecting":[77,85],"emotion":[78],"interpersonal":[80],"attitude,":[81,89],"local":[83],"topical":[86],"emphasis,":[87],"propositional":[88],"syntactic":[90],"phrasing":[91],"marked":[93],"tonicity.The":[94],"corpus":[95,138],"only":[96],"includes":[97],"prosodic":[98],"that":[100,144],"listeners":[101],"are":[102],"distinguish":[105],"with":[106,128],"reasonable":[107],"accuracy,":[108],"we":[110],"report":[111],"these":[112],"figures":[113],"as":[114],"benchmark":[116],"against":[117],"which":[118],"text-to-speech":[119],"can":[122],"be":[123],"compared.We":[124],"conclude":[125],"paper":[127],"demonstration":[130],"our":[132],"proposed":[133],"evaluation":[134],"methodology,":[135],"evaluate":[140],"two":[141],"textto-speech":[142],"models":[143],"perform":[145],"transfer.":[147]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
