{"id":"https://openalex.org/W7143475284","doi":"https://doi.org/10.48550/arxiv.2603.26248","title":"Automatic Speech Recognition for Documenting Endangered Languages: Case Study of Ikema Miyakoan","display_name":"Automatic Speech Recognition for Documenting Endangered Languages: Case Study of Ikema Miyakoan","publication_year":2026,"publication_date":"2026-03-27","ids":{"openalex":"https://openalex.org/W7143475284","doi":"https://doi.org/10.48550/arxiv.2603.26248"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.26248","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26248","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.26248","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130929254","display_name":"Chihiro Taguchi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taguchi, Chihiro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130952771","display_name":"Yukinori Takubo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Takubo, Yukinori","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5130924580","display_name":"David Chiang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chiang, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.44670000672340393,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.44670000672340393,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.0966000035405159,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.06840000301599503,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.6531000137329102},{"id":"https://openalex.org/keywords/documentation","display_name":"Documentation","score":0.6424000263214111},{"id":"https://openalex.org/keywords/endangered-species","display_name":"Endangered species","score":0.47429999709129333},{"id":"https://openalex.org/keywords/field","display_name":"Field (mathematics)","score":0.4629000127315521},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4237000048160553},{"id":"https://openalex.org/keywords/speech-technology","display_name":"Speech technology","score":0.375}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6782000064849854},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.6531000137329102},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.6424000263214111},{"id":"https://openalex.org/C179345059","wikidata":"https://www.wikidata.org/wiki/Q11394","display_name":"Endangered species","level":3,"score":0.47429999709129333},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.4629000127315521},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4300000071525574},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.42989999055862427},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4237000048160553},{"id":"https://openalex.org/C504749915","wikidata":"https://www.wikidata.org/wiki/Q9010971","display_name":"Speech technology","level":3,"score":0.375},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3531000018119812},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3386000096797943},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3294999897480011},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.3188999891281128},{"id":"https://openalex.org/C2781316041","wikidata":"https://www.wikidata.org/wiki/Q1230584","display_name":"Diversity (politics)","level":2,"score":0.30640000104904175},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.29490000009536743},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.25699999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.26248","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26248","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.26248","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.26248","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7647752165794373}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Language":[0],"endangerment":[1],"poses":[2],"a":[3,45,87,101,138],"major":[4],"challenge":[5],"to":[6,31,72],"linguistic":[7],"diversity":[8],"worldwide,":[9],"and":[10,19,109,134],"technological":[11],"advances":[12],"have":[13],"opened":[14],"new":[15],"avenues":[16],"for":[17,77],"documentation":[18,144],"revitalization.":[20],"Among":[21],"these,":[22],"automatic":[23],"speech":[24,89,121],"recognition":[25],"(ASR)":[26],"has":[27],"shown":[28],"increasing":[29],"potential":[30],"assist":[32],"in":[33,51],"the":[34,112,118],"transcription":[35,132],"of":[36,60,114,120,145],"endangered":[37,47,146],"language":[38,49],"data.":[39],"This":[40],"study":[41],"focuses":[42],"on":[43,80,117],"Ikema,":[44],"severely":[46],"Ryukyuan":[48],"spoken":[50],"Okinawa,":[52],"Japan,":[53],"with":[54],"approximately":[55],"1,300":[56],"remaining":[57],"speakers,":[58],"most":[59],"whom":[61],"are":[62],"over":[63],"60":[64],"years":[65],"old.":[66],"We":[67],"present":[68],"an":[69,74,96],"ongoing":[70],"effort":[71],"develop":[73],"ASR":[75,97,115,127],"system":[76],"Ikema":[78],"based":[79],"field":[81,92],"recordings.":[82],"Specifically,":[83],"we":[84],"(1)":[85],"construct":[86],"6.33-hour":[88],"corpus":[90],"from":[91],"recordings,":[93],"(2)":[94],"train":[95],"model":[98],"that":[99,126],"achieves":[100],"character":[102],"error":[103],"rate":[104],"as":[105,107],"low":[106],"15%,":[108],"(3)":[110],"evaluate":[111],"impact":[113],"assistance":[116],"efficiency":[119],"transcription.":[122],"Our":[123],"results":[124],"demonstrate":[125],"integration":[128],"can":[129],"substantially":[130],"reduce":[131],"time":[133],"cognitive":[135],"load,":[136],"offering":[137],"practical":[139],"pathway":[140],"toward":[141],"scalable,":[142],"technology-supported":[143],"languages.":[147]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-31T00:00:00"}
