{"id":"https://openalex.org/W2894690744","doi":"https://doi.org/10.21437/sltu.2018-35","title":"Building an ASR System for Mboshi Using A Cross-Language Definition of Acoustic Units Approach","display_name":"Building an ASR System for Mboshi Using A Cross-Language Definition of Acoustic Units Approach","publication_year":2018,"publication_date":"2018-08-29","ids":{"openalex":"https://openalex.org/W2894690744","doi":"https://doi.org/10.21437/sltu.2018-35","mag":"2894690744"},"language":"en","primary_location":{"id":"doi:10.21437/sltu.2018-35","is_oa":false,"landing_page_url":"https://doi.org/10.21437/sltu.2018-35","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th Workshop on Spoken Language Technologies for Under-Resourced Languages (SLTU 2018)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048860892","display_name":"Odette Scharenborg","orcid":"https://orcid.org/0000-0003-0693-8852"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]},{"id":"https://openalex.org/I98358874","display_name":"Delft University of Technology","ror":"https://ror.org/02e2c7k09","country_code":"NL","type":"education","lineage":["https://openalex.org/I98358874"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Odette Scharenborg","raw_affiliation_strings":["Centre for Language Studies, Radboud University, Nijmegen, the Netherlands","Multimedia Computing Group, Delft University of Technology, Delft, the Netherlands"],"affiliations":[{"raw_affiliation_string":"Centre for Language Studies, Radboud University, Nijmegen, the Netherlands","institution_ids":["https://openalex.org/I145872427"]},{"raw_affiliation_string":"Multimedia Computing Group, Delft University of Technology, Delft, the Netherlands","institution_ids":["https://openalex.org/I98358874"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5060929395","display_name":"Patrick Ebel","orcid":"https://orcid.org/0000-0002-4437-2821"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Patrick Ebel","raw_affiliation_strings":["Centre for Language Studies, Radboud University, Nijmegen, the Netherlands"],"affiliations":[{"raw_affiliation_string":"Centre for Language Studies, Radboud University, Nijmegen, the Netherlands","institution_ids":["https://openalex.org/I145872427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004778663","display_name":"Mark Hasegawa\u2010Johnson","orcid":"https://orcid.org/0000-0002-5631-2893"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mark Hasegawa-Johnson","raw_affiliation_strings":["ECE Department & Beckman Institute, University of Illinois, Urbana-Champaign, IL, USA"],"affiliations":[{"raw_affiliation_string":"ECE Department & Beckman Institute, University of Illinois, Urbana-Champaign, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5050632169","display_name":"Najim Dehak","orcid":"https://orcid.org/0000-0002-4489-5753"},"institutions":[{"id":"https://openalex.org/I145311948","display_name":"Johns Hopkins University","ror":"https://ror.org/00za53h95","country_code":"US","type":"education","lineage":["https://openalex.org/I145311948"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Najim Dehak","raw_affiliation_strings":["Center for Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA"],"affiliations":[{"raw_affiliation_string":"Center for Language and Speech Processing, Johns Hopkins University, Baltimore, MD, USA","institution_ids":["https://openalex.org/I145311948"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5048860892"],"corresponding_institution_ids":["https://openalex.org/I145872427","https://openalex.org/I98358874"],"apc_list":null,"apc_paid":null,"fwci":0.8462,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.80766972,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"167","last_page":"171"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/initialization","display_name":"Initialization","score":0.8687926530838013},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8227774500846863},{"id":"https://openalex.org/keywords/retraining","display_name":"Retraining","score":0.8078315258026123},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6013443470001221},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.524914562702179},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.5112063884735107},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.498826265335083},{"id":"https://openalex.org/keywords/layer","display_name":"Layer (electronics)","score":0.4754871129989624},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4404739737510681},{"id":"https://openalex.org/keywords/training-set","display_name":"Training set","score":0.421045184135437},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.417097806930542},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3872700035572052}],"concepts":[{"id":"https://openalex.org/C114466953","wikidata":"https://www.wikidata.org/wiki/Q6034165","display_name":"Initialization","level":2,"score":0.8687926530838013},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8227774500846863},{"id":"https://openalex.org/C2778712577","wikidata":"https://www.wikidata.org/wiki/Q3505966","display_name":"Retraining","level":2,"score":0.8078315258026123},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6013443470001221},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.524914562702179},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.5112063884735107},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.498826265335083},{"id":"https://openalex.org/C2779227376","wikidata":"https://www.wikidata.org/wiki/Q6505497","display_name":"Layer (electronics)","level":2,"score":0.4754871129989624},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4404739737510681},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.421045184135437},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.417097806930542},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3872700035572052},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C155202549","wikidata":"https://www.wikidata.org/wiki/Q178803","display_name":"International trade","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C153294291","wikidata":"https://www.wikidata.org/wiki/Q25261","display_name":"Meteorology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/sltu.2018-35","is_oa":false,"landing_page_url":"https://doi.org/10.21437/sltu.2018-35","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th Workshop on Spoken Language Technologies for Under-Resourced Languages (SLTU 2018)","raw_type":"proceedings-article"},{"id":"pmh:oai:tudelft.nl:uuid:fece6820-ab82-48d8-9cc2-e010a0f645a5","is_oa":false,"landing_page_url":"http://resolver.tudelft.nl/uuid:fece6820-ab82-48d8-9cc2-e010a0f645a5","pdf_url":null,"source":{"id":"https://openalex.org/S4306400906","display_name":"Research Repository (Delft University of Technology)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I98358874","host_organization_name":"Delft University of Technology","host_organization_lineage":["https://openalex.org/I98358874"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"conference paper"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8100000023841858,"id":"https://metadata.un.org/sdg/4"}],"awards":[{"id":"https://openalex.org/G5832103344","display_name":null,"funder_award_id":"276-89-003","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"},{"id":"https://openalex.org/G7875773839","display_name":null,"funder_award_id":"Vidi-grant","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"}],"funders":[{"id":"https://openalex.org/F4320321800","display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek","ror":"https://ror.org/04jsz6e67"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W1520968739","https://openalex.org/W1524333225","https://openalex.org/W2025482506","https://openalex.org/W2099621636","https://openalex.org/W2160003195","https://openalex.org/W2271840356","https://openalex.org/W2307960051","https://openalex.org/W2347098582","https://openalex.org/W2347145335","https://openalex.org/W2545319977","https://openalex.org/W2747287964","https://openalex.org/W2762715843","https://openalex.org/W2885643293","https://openalex.org/W2889500720","https://openalex.org/W2962862718","https://openalex.org/W4206864474"],"related_works":["https://openalex.org/W2081982437","https://openalex.org/W4394857231","https://openalex.org/W3204184292","https://openalex.org/W2027050655","https://openalex.org/W2900841314","https://openalex.org/W4394050964","https://openalex.org/W2551249631","https://openalex.org/W4287644835","https://openalex.org/W3092281475","https://openalex.org/W3098003361"],"abstract_inverted_index":{"For":[0],"many":[1],"languages":[2],"in":[3,65],"the":[4,41,62,66,86,91,113,117,125,134,144],"world,":[5],"not":[6],"enough":[7],"(annotated)":[8],"speech":[9],"data":[10],"is":[11],"available":[12],"to":[13,40,120],"train":[14],"an":[15,26,46],"ASR":[16,27,47],"system.":[17],"Recently,":[18],"we":[19,36],"proposed":[20],"a":[21,129,139],"cross-language":[22,59],"method":[23],"for":[24,133,143],"training":[25,79,136],"system":[28,48,72,100],"using":[29,58,75],"linguistic":[30],"knowledge":[31],"and":[32,89,110,121],"semi-supervised":[33],"training.":[34],"Here,":[35],"apply":[37],"this":[38,70],"approach":[39],"low-resource":[42],"language":[43],"Mboshi.":[44],"Using":[45],"trained":[49],"on":[50],"Dutch,":[51],"Mboshi":[52,76,99],"acoustic":[53],"units":[54],"were":[55,81],"first":[56],"created":[57],"initialization":[60],"of":[61,84,116],"phoneme":[63,106,108,141],"vectors":[64],"output":[67,87],"layer.":[68],"Subsequently,":[69],"adapted":[71],"was":[73,101],"retrained":[74,146],"self-labels.":[77,126],"Two":[78],"methods":[80,137],"investigated:":[82],"retraining":[83,90,123],"only":[85],"layer":[88],"full":[92],"deep":[93],"neural":[94],"network":[95],"(DNN).":[96],"The":[97],"resulting":[98],"analyzed":[102],"by":[103,111],"investigating":[104],"per":[105],"accuracies,":[107],"confusions,":[109],"visualizing":[112],"hidden":[114],"layers":[115],"DNNs":[118],"prior":[119],"following":[122],"with":[124],"Results":[127],"showed":[128],"fairly":[130],"similar":[131],"performance":[132],"two":[135],"but":[138],"better":[140],"representation":[142],"fully":[145],"DNN.":[147]},"counts_by_year":[{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
