{"id":"https://openalex.org/W1589684606","doi":"https://doi.org/10.21437/interspeech.2011-701","title":"Rapid adaptation of foreign-accented HMM-based speech synthesis","display_name":"Rapid adaptation of foreign-accented HMM-based speech synthesis","publication_year":2011,"publication_date":"2011-08-27","ids":{"openalex":"https://openalex.org/W1589684606","doi":"https://doi.org/10.21437/interspeech.2011-701","mag":"1589684606"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2011-701","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2011-701","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2011","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://www.pure.ed.ac.uk/ws/files/15322997/Rapid_Adaptation_of_Foreign_accented_HMM_based_Speech_Synthesis.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023689975","display_name":"Reima Karhila","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Reima Karhila","raw_affiliation_strings":["Helsinki University of Technology"],"affiliations":[{"raw_affiliation_string":"Helsinki University of Technology","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060282305","display_name":"Mirjam Wester","orcid":"https://orcid.org/0000-0002-3199-0081"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mirjam Wester","raw_affiliation_strings":["School of Informatics"],"affiliations":[{"raw_affiliation_string":"School of Informatics","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5023689975"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.3207,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.8329064,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2801","last_page":"2804"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stress","display_name":"Stress (linguistics)","score":0.8384073972702026},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6310739517211914},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5675965547561646},{"id":"https://openalex.org/keywords/identity","display_name":"Identity (music)","score":0.5603215098381042},{"id":"https://openalex.org/keywords/perception","display_name":"Perception","score":0.5519782304763794},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.4842959940433502},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.47671765089035034},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4569757878780365},{"id":"https://openalex.org/keywords/speaker-diarisation","display_name":"Speaker diarisation","score":0.4356222450733185},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.434982031583786},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.35750246047973633},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.33617717027664185},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.19568803906440735},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.07126539945602417}],"concepts":[{"id":"https://openalex.org/C2776756274","wikidata":"https://www.wikidata.org/wiki/Q181767","display_name":"Stress (linguistics)","level":2,"score":0.8384073972702026},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6310739517211914},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5675965547561646},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.5603215098381042},{"id":"https://openalex.org/C26760741","wikidata":"https://www.wikidata.org/wiki/Q160402","display_name":"Perception","level":2,"score":0.5519782304763794},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.4842959940433502},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.47671765089035034},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4569757878780365},{"id":"https://openalex.org/C149838564","wikidata":"https://www.wikidata.org/wiki/Q7574248","display_name":"Speaker diarisation","level":3,"score":0.4356222450733185},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.434982031583786},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.35750246047973633},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.33617717027664185},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.19568803906440735},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.07126539945602417},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.21437/interspeech.2011-701","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2011-701","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2011","raw_type":"proceedings-article"},{"id":"pmh:oai:pure.ed.ac.uk:publications/fe33d053-adab-4a37-b585-acce24e130c6","is_oa":true,"landing_page_url":"http://hdl.handle.net/20.500.11820/fe33d053-adab-4a37-b585-acce24e130c6","pdf_url":"https://www.pure.ed.ac.uk/ws/files/15322997/Rapid_Adaptation_of_Foreign_accented_HMM_based_Speech_Synthesis.pdf","source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.220.9527","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.220.9527","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cstr.inf.ed.ac.uk/downloads/publications/2011/karhila_wester_interspeech_2011.pdf","raw_type":"text"},{"id":"pmh:oai:pure.ed.ac.uk:openaire/fe33d053-adab-4a37-b585-acce24e130c6","is_oa":true,"landing_page_url":"https://www.research.ed.ac.uk/en/publications/fe33d053-adab-4a37-b585-acce24e130c6","pdf_url":null,"source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Karhila, R & Wester, M 2011, Rapid Adaptation of Foreign-accented HMM-based Speech Synthesis. in Proc. Interspeech. < http://www.isca-speech.org/archive/interspeech_2011/i11_2801.html >","raw_type":"contributionToPeriodical"}],"best_oa_location":{"id":"pmh:oai:pure.ed.ac.uk:publications/fe33d053-adab-4a37-b585-acce24e130c6","is_oa":true,"landing_page_url":"http://hdl.handle.net/20.500.11820/fe33d053-adab-4a37-b585-acce24e130c6","pdf_url":"https://www.pure.ed.ac.uk/ws/files/15322997/Rapid_Adaptation_of_Foreign_accented_HMM_based_Speech_Synthesis.pdf","source":{"id":"https://openalex.org/S4406922455","display_name":"Edinburgh Research Explorer","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":""},"sustainable_development_goals":[{"score":0.6200000047683716,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"},{"score":0.4000000059604645,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W1589684606.pdf"},"referenced_works_count":14,"referenced_works":["https://openalex.org/W118315650","https://openalex.org/W152891837","https://openalex.org/W1484402186","https://openalex.org/W1572989473","https://openalex.org/W1962947832","https://openalex.org/W1984905644","https://openalex.org/W1995565802","https://openalex.org/W2061406848","https://openalex.org/W2106647610","https://openalex.org/W2152776867","https://openalex.org/W2153914468","https://openalex.org/W2169066045","https://openalex.org/W2905660394","https://openalex.org/W4246488987"],"related_works":["https://openalex.org/W2206035908","https://openalex.org/W4247736853","https://openalex.org/W2162158162","https://openalex.org/W1493012537","https://openalex.org/W1999004162","https://openalex.org/W2175373321","https://openalex.org/W2125642021","https://openalex.org/W1521049138","https://openalex.org/W2938358845","https://openalex.org/W2997340161"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"findings":[3],"of":[4,8,25,42,105,145],"listeners":[5,63,153,165],"\u2019":[6,154],"perception":[7],"speaker":[9,27,52,59,123,155,179],"identity":[10,24],"in":[11,72,170],"synthetic":[12,49,69,107,172],"speech.":[13],"Specifically,":[14],"we":[15],"investigated":[16],"what":[17],"the":[18,22,48,82,87,102,106,116,126,143,146,160,171],"effect":[19],"is":[20],"on":[21,182],"perceived":[23,103,183],"a":[26,43],"when":[28,125,138],"using":[29,131,139],"differently":[30],"accented":[31],"average":[32,147],"voice":[33,148],"models":[34],"and":[35,39,68,74],"limited":[36],"amounts":[37],"(five":[38],"fifteen":[40,134],"sentences)":[41],"speaker\u2019s":[44],"data":[45],"to":[46,57,77,100],"create":[47],"stimuli.":[50,109,173],"A":[51],"discrimination":[53,124,156],"task":[54,95,163],"was":[55,96],"used":[56],"measure":[58,101],"identity.":[60],"Native":[61],"English":[62,73],"were":[64,75,84],"presented":[65],"with":[66],"natural":[67],"speech":[70,108,187],"stimuli":[71,127],"asked":[76],"decide":[78],"whether":[79],"they":[80],"thought":[81],"sentences":[83,136],"spoken":[85],"by":[86],"same":[88],"person":[89],"or":[90,133],"not.":[91],"An":[92],"accent":[93,144,161],"rating":[94,162],"also":[97],"carried":[98],"out":[99],"accents":[104,169],"The":[110],"results":[111],"show":[112],"that":[113],"listeners,":[114],"for":[115],"most":[117],"part,":[118],"perform":[119],"as":[120,137],"well":[121],"at":[122],"have":[128],"been":[129],"created":[130],"five":[132],"adaptation":[135,190],"105":[140],"sentences.":[141],"Furthermore,":[142],"model":[149],"does":[150],"not":[151,176],"affect":[152],"performance":[157],"even":[158],"though":[159],"shows":[164],"are":[166],"perceiving":[167],"different":[168],"Listeners":[174],"do":[175],"base":[177],"their":[178],"similarity":[180],"decisions":[181],"accent.":[184],"Index":[185],"Terms:":[186],"synthesis,":[188],"rapid":[189],"1.":[191]},"counts_by_year":[{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
