{"id":"https://openalex.org/W4313225802","doi":"https://doi.org/10.1109/o-cocosda202257103.2022.9997860","title":"The Speech Labeling and Modeling Toolkit (SLMTK) Version 1.0","display_name":"The Speech Labeling and Modeling Toolkit (SLMTK) Version 1.0","publication_year":2022,"publication_date":"2022-11-01","ids":{"openalex":"https://openalex.org/W4313225802","doi":"https://doi.org/10.1109/o-cocosda202257103.2022.9997860"},"language":"en","primary_location":{"id":"doi:10.1109/o-cocosda202257103.2022.9997860","is_oa":false,"landing_page_url":"https://doi.org/10.1109/o-cocosda202257103.2022.9997860","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 25th Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101446417","display_name":"Chen-Yu Chiang","orcid":"https://orcid.org/0000-0003-4997-8774"},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Chen-Yu Chiang","raw_affiliation_strings":["National Taipei University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089113904","display_name":"Wu-Hao Li","orcid":null},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Wu-Hao Li","raw_affiliation_strings":["National Taipei University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031455640","display_name":"Yen-Ting Lin","orcid":"https://orcid.org/0000-0003-2970-2455"},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yen-Ting Lin","raw_affiliation_strings":["National Taipei University,Taiwan","udnDigital Co., Ltd,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]},{"raw_affiliation_string":"udnDigital Co., Ltd,Taiwan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058007471","display_name":"Jia-Jyu Su","orcid":null},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Jia-Jyu Su","raw_affiliation_strings":["National Taipei University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100726716","display_name":"Wei\u2010Cheng Chen","orcid":"https://orcid.org/0000-0001-9680-7500"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei-Cheng Chen","raw_affiliation_strings":["AcoustInTek Co., Ltd,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AcoustInTek Co., Ltd,Taiwan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065628907","display_name":"Cheng-Che Kao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cheng-Che Kao","raw_affiliation_strings":["AcoustInTek Co., Ltd,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AcoustInTek Co., Ltd,Taiwan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039009330","display_name":"Shu-Lei Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shu-Lei Lin","raw_affiliation_strings":["National Taipei University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102919914","display_name":"Pin-Han Lin","orcid":"https://orcid.org/0009-0007-0282-1944"},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Pin-Han Lin","raw_affiliation_strings":["National Taipei University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091029429","display_name":"Shao-Wei Hong","orcid":null},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Shao-Wei Hong","raw_affiliation_strings":["National Taipei University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050372484","display_name":"Guan-Ting Liou","orcid":null},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Guan-Ting Liou","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041739103","display_name":"Wen-Yang Chang","orcid":"https://orcid.org/0000-0002-2377-4127"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wen-Yang Chang","raw_affiliation_strings":["AcoustInTek Co., Ltd,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AcoustInTek Co., Ltd,Taiwan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028209484","display_name":"Jen-Chieh Chiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jen-Chieh Chiang","raw_affiliation_strings":["AcoustInTek Co., Ltd,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"AcoustInTek Co., Ltd,Taiwan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031455640","display_name":"Yen-Ting Lin","orcid":"https://orcid.org/0000-0003-2970-2455"},"institutions":[{"id":"https://openalex.org/I99613584","display_name":"National Taipei University","ror":"https://ror.org/03e29r284","country_code":"TW","type":"education","lineage":["https://openalex.org/I99613584"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yen-Ting Lin","raw_affiliation_strings":["National Taipei University,Taiwan","udnDigital Co., Ltd,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Taipei University,Taiwan","institution_ids":["https://openalex.org/I99613584"]},{"raw_affiliation_string":"udnDigital Co., Ltd,Taiwan","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071941088","display_name":"Yih\u2010Ru Wang","orcid":"https://orcid.org/0000-0002-4483-1418"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Yih-Ru Wang","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015529786","display_name":"Sin\u2010Horng Chen","orcid":"https://orcid.org/0000-0002-9820-2318"},"institutions":[{"id":"https://openalex.org/I148366613","display_name":"National Yang Ming Chiao Tung University","ror":"https://ror.org/00se2k293","country_code":"TW","type":"education","lineage":["https://openalex.org/I148366613"]}],"countries":["TW"],"is_corresponding":false,"raw_author_name":"Sin-Horng Chen","raw_affiliation_strings":["National Yang Ming Chiao Tung University,Taiwan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"National Yang Ming Chiao Tung University,Taiwan","institution_ids":["https://openalex.org/I148366613"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":15,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6937,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.76116218,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9937000274658203,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/prosody","display_name":"Prosody","score":0.8982486724853516},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7507063150405884},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.7440741658210754},{"id":"https://openalex.org/keywords/mandarin-chinese","display_name":"Mandarin Chinese","score":0.6911106109619141},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.665447473526001},{"id":"https://openalex.org/keywords/syllable","display_name":"Syllable","score":0.627313494682312},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5119472742080688},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.5051863789558411},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.41710174083709717},{"id":"https://openalex.org/keywords/acoustic-model","display_name":"Acoustic model","score":0.41355741024017334},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.39976680278778076},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.29307934641838074}],"concepts":[{"id":"https://openalex.org/C542774811","wikidata":"https://www.wikidata.org/wiki/Q10880526","display_name":"Prosody","level":2,"score":0.8982486724853516},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7507063150405884},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.7440741658210754},{"id":"https://openalex.org/C138954614","wikidata":"https://www.wikidata.org/wiki/Q9192","display_name":"Mandarin Chinese","level":2,"score":0.6911106109619141},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.665447473526001},{"id":"https://openalex.org/C109089402","wikidata":"https://www.wikidata.org/wiki/Q8188","display_name":"Syllable","level":2,"score":0.627313494682312},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5119472742080688},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.5051863789558411},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.41710174083709717},{"id":"https://openalex.org/C155635449","wikidata":"https://www.wikidata.org/wiki/Q4674699","display_name":"Acoustic model","level":3,"score":0.41355741024017334},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.39976680278778076},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.29307934641838074},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/o-cocosda202257103.2022.9997860","is_oa":false,"landing_page_url":"https://doi.org/10.1109/o-cocosda202257103.2022.9997860","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 25th Conference of the Oriental COCOSDA International Committee for the Co-ordination and Standardisation of Speech Databases and Assessment Techniques (O-COCOSDA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.6700000166893005,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1524333225","https://openalex.org/W2019862519","https://openalex.org/W2136320814","https://openalex.org/W2146921187","https://openalex.org/W2153914468","https://openalex.org/W2504361220","https://openalex.org/W2537421476","https://openalex.org/W2747874407","https://openalex.org/W2761478804","https://openalex.org/W2808301194","https://openalex.org/W2889234690","https://openalex.org/W2936103087","https://openalex.org/W2943395818","https://openalex.org/W2946200149","https://openalex.org/W2951418500","https://openalex.org/W2963609956","https://openalex.org/W2964243274","https://openalex.org/W2996317213","https://openalex.org/W3011026433","https://openalex.org/W3033411150","https://openalex.org/W3044514286","https://openalex.org/W3048768961","https://openalex.org/W3049756574","https://openalex.org/W3183102188","https://openalex.org/W6631362777","https://openalex.org/W6736996214","https://openalex.org/W6757079273","https://openalex.org/W6763832098","https://openalex.org/W6771405711","https://openalex.org/W6778823374"],"related_works":["https://openalex.org/W2396586136","https://openalex.org/W1505084104","https://openalex.org/W2599935372","https://openalex.org/W10581632","https://openalex.org/W1927421023","https://openalex.org/W3149582125","https://openalex.org/W1984347656","https://openalex.org/W157238252","https://openalex.org/W2169632867","https://openalex.org/W2161314515"],"abstract_inverted_index":{"This":[0],"paper":[1],"introduces":[2],"the":[3,37,46,87,139,175,178],"Speech":[4],"Labeling":[5],"and":[6,19,26,36,63,75,104,114,134,147,169],"Modeling":[7],"Toolkit":[8],"version":[9],"1.0":[10,31,123,161],"(SLMTK":[11],"1.0),":[12],"which":[13],"facilitates":[14],"automatic":[15],"labeling":[16,149],"of":[17,60,71,78,86,150,177],"text":[18,49],"speech":[20,27,35,82,119,153],"for":[21,81,118,132,166],"constructing":[22,128],"text-to-speech":[23],"(TTS)":[24],"systems":[25,131],"analysis.":[28],"The":[29,40,84,121,159],"SLMTK":[30,122,160],"supports":[32],"mixed":[33],"Mandarin-English":[34],"associated":[38],"texts.":[39],"following":[41],"seven":[42,88],"steps":[43,89],"then":[44],"process":[45],"inputs:":[47],"1)":[48,92],"analysis,":[50],"2)":[51,95],"acoustic":[52,79,96,116],"feature":[53],"extraction,":[54],"3)":[55,98],"linguistic-speech":[56,99],"alignment,":[57,100],"4)":[58,101],"integration":[59],"syllable-based":[61,102],"linguistic":[62,93,103],"prosodic-acoustic":[64,105],"features,":[65,97,106],"5)":[66,107],"prosody":[67,72,108,111,156],"labeling,":[68],"6)":[69,110],"construction":[70,77],"generation":[73,112],"model,":[74,113],"7)":[76,115],"models":[80,117],"synthesis.":[83,120],"outputs":[85],"are,":[90],"respectively,":[91],"labels,":[94],"tags,":[109],"has":[124,141],"been":[125,143],"applied":[126,144],"to":[127,145,154,173],"personalized":[129],"TTS":[130],"augmentative":[133],"alternative":[135],"communication.":[136],"In":[137],"addition,":[138],"toolkit":[140],"also":[142],"phonetic":[146],"prosodic":[148],"L2":[151],"Mandarin":[152],"facilitate":[155],"analysis":[157],"studies.":[158],"is":[162],"available":[163],"at":[164],"https://slmtk.ce.ntpu.edu.tw":[165],"non-commercial":[167],"use":[168],"welcomes":[170],"all":[171],"parties":[172],"enrich":[174],"functions":[176],"SLMTK.":[179]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
