{"id":"https://openalex.org/W4297570641","doi":"https://doi.org/10.21437/interspeech.2022-10922","title":"SOMOS: The Samsung Open MOS Dataset for the Evaluation of Neural Text-to-Speech Synthesis","display_name":"SOMOS: The Samsung Open MOS Dataset for the Evaluation of Neural Text-to-Speech Synthesis","publication_year":2022,"publication_date":"2022-09-16","ids":{"openalex":"https://openalex.org/W4297570641","doi":"https://doi.org/10.21437/interspeech.2022-10922"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2022-10922","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-10922","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037667852","display_name":"Georgia Maniati","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Georgia Maniati","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015840293","display_name":"Alexandra Vioni","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alexandra Vioni","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052196585","display_name":"Nikolaos Ellinas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nikolaos Ellinas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047616042","display_name":"Karolos Nikitaras","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Karolos Nikitaras","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061031679","display_name":"Konstantinos Klapsas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Konstantinos Klapsas","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5110947099","display_name":"June Sig Sung","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"June Sig Sung","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041656238","display_name":"Gunu Jho","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gunu Jho","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091595884","display_name":"Aimilios Chalamandaris","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aimilios Chalamandaris","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5027494724","display_name":"Pirros Tsiakoulis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pirros Tsiakoulis","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5037667852"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.2949,"has_fulltext":false,"cited_by_count":27,"citation_normalized_percentile":{"value":0.90211977,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"2388","last_page":"2392"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8027297258377075},{"id":"https://openalex.org/keywords/naturalness","display_name":"Naturalness","score":0.7272965312004089},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6607628464698792},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.634368360042572},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.5920501351356506},{"id":"https://openalex.org/keywords/mean-opinion-score","display_name":"Mean opinion score","score":0.5651041865348816},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5465407967567444},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.5022971630096436},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.4974348843097687},{"id":"https://openalex.org/keywords/face","display_name":"Face (sociological concept)","score":0.4791768789291382},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.44096970558166504},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4341309368610382},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36526164412498474},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.07327461242675781}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8027297258377075},{"id":"https://openalex.org/C134537474","wikidata":"https://www.wikidata.org/wiki/Q17144832","display_name":"Naturalness","level":2,"score":0.7272965312004089},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6607628464698792},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.634368360042572},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.5920501351356506},{"id":"https://openalex.org/C62897895","wikidata":"https://www.wikidata.org/wiki/Q1915482","display_name":"Mean opinion score","level":3,"score":0.5651041865348816},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5465407967567444},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.5022971630096436},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.4974348843097687},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.4791768789291382},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.44096970558166504},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4341309368610382},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36526164412498474},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.07327461242675781},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2022-10922","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2022-10922","pdf_url":null,"source":{"id":"https://openalex.org/S4363604309","display_name":"Interspeech 2022","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"public-domain","license_id":"https://openalex.org/licenses/public-domain","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2022","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W1914543332","https://openalex.org/W2946856121","https://openalex.org/W2108985546","https://openalex.org/W2038801705","https://openalex.org/W2433276473","https://openalex.org/W2077992636","https://openalex.org/W1537411440","https://openalex.org/W2535215250","https://openalex.org/W290673751","https://openalex.org/W2688184458"],"abstract_inverted_index":{"In":[0],"this":[1,147],"work,":[2],"we":[3],"present":[4],"the":[5,8,35,55,106,112,159,164],"SOMOS":[6,160],"dataset,":[7],"first":[9],"large-scale":[10],"mean":[11],"opinion":[12],"scores":[13],"(MOS)":[14],"dataset":[15,63,161],"consisting":[16],"of":[17,37,50,54,153],"solely":[18],"neural":[19,71,85],"text-to-speech":[20],"(TTS)":[21],"samples.":[22],"It":[23,48],"can":[24,41],"be":[25],"employed":[26],"to":[27,142,172],"train":[28],"automatic":[29],"MOS":[30,128,155],"prediction":[31,156],"systems":[32,82],"focused":[33],"on":[34,111,131,158],"assessment":[36],"modern":[38],"synthesizers,":[39],"and":[40,74,120,123,138,162],"stimulate":[42],"advancements":[43],"in":[44],"acoustic":[45,72,86,113],"model":[46],"evaluation.":[47],"consists":[49],"20K":[51],"synthetic":[52],"utterances":[53,117],"LJ":[56],"Speech":[57],"voice,":[58],"a":[59,66],"public":[60],"domain":[61,122],"speech":[62],"which":[64,92],"is":[65,99],"common":[67],"benchmark":[68],"for":[69,101,146],"building":[70],"models":[73,87,91,157,168],"vocoders.":[75],"Utterances":[76],"are":[77],"generated":[78],"from":[79],"200":[80],"TTS":[81,174],"including":[83],"vanilla":[84],"as":[88,90],"well":[89],"allow":[93],"prosodic":[94],"variations.":[95],"An":[96],"LPCNet":[97],"vocoder":[98],"used":[100],"all":[102],"systems,":[103],"so":[104],"that":[105,166],"samples'":[107],"variation":[108],"depends":[109],"only":[110],"models.":[114],"The":[115],"synthesized":[116],"provide":[118,150],"balanced":[119],"adequate":[121],"length":[124],"coverage.":[125],"We":[126,149],"collect":[127],"naturalness":[129],"evaluations":[130],"3":[132],"English":[133],"Amazon":[134],"Mechanical":[135],"Turk":[136],"locales":[137],"share":[139],"practices":[140],"leading":[141],"reliable":[143],"crowdsourced":[144],"annotations":[145],"task.":[148],"baseline":[151],"results":[152],"state-of-the-art":[154],"show":[163],"limitations":[165],"such":[167],"face":[169],"when":[170],"assigned":[171],"evaluate":[173],"utterances.":[175]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":7}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
