{"id":"https://openalex.org/W4383068138","doi":"https://doi.org/10.3390/mti7070068","title":"Using Open-Source Automatic Speech Recognition Tools for the Annotation of Dutch Infant-Directed Speech","display_name":"Using Open-Source Automatic Speech Recognition Tools for the Annotation of Dutch Infant-Directed Speech","publication_year":2023,"publication_date":"2023-07-03","ids":{"openalex":"https://openalex.org/W4383068138","doi":"https://doi.org/10.3390/mti7070068"},"language":"en","primary_location":{"id":"doi:10.3390/mti7070068","is_oa":true,"landing_page_url":"https://doi.org/10.3390/mti7070068","pdf_url":"https://www.mdpi.com/2414-4088/7/7/68/pdf?version=1688367476","source":{"id":"https://openalex.org/S4210226272","display_name":"Multimodal Technologies and Interaction","issn_l":"2414-4088","issn":["2414-4088"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimodal Technologies and Interaction","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2414-4088/7/7/68/pdf?version=1688367476","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030984341","display_name":"Anika van der Klis","orcid":"https://orcid.org/0000-0001-5807-0667"},"institutions":[{"id":"https://openalex.org/I193662353","display_name":"Utrecht University","ror":"https://ror.org/04pp8hn57","country_code":"NL","type":"education","lineage":["https://openalex.org/I193662353"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Anika van der Klis","raw_affiliation_strings":["Institute for Language Sciences, Utrecht University, 3512 JK Utrecht, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0001-5807-0667","affiliations":[{"raw_affiliation_string":"Institute for Language Sciences, Utrecht University, 3512 JK Utrecht, The Netherlands","institution_ids":["https://openalex.org/I193662353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067849643","display_name":"Frans Adriaans","orcid":"https://orcid.org/0000-0003-4342-7947"},"institutions":[{"id":"https://openalex.org/I193662353","display_name":"Utrecht University","ror":"https://ror.org/04pp8hn57","country_code":"NL","type":"education","lineage":["https://openalex.org/I193662353"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Frans Adriaans","raw_affiliation_strings":["Institute for Language Sciences, Utrecht University, 3512 JK Utrecht, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0003-4342-7947","affiliations":[{"raw_affiliation_string":"Institute for Language Sciences, Utrecht University, 3512 JK Utrecht, The Netherlands","institution_ids":["https://openalex.org/I193662353"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041268881","display_name":"Mengru Han","orcid":"https://orcid.org/0000-0002-2231-5922"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mengru Han","raw_affiliation_strings":["Department of Chinese Language and Literature, East China Normal University, Shanghai 200241, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Chinese Language and Literature, East China Normal University, Shanghai 200241, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5009314121","display_name":"Ren\u00e9 Kager","orcid":"https://orcid.org/0000-0002-5811-839X"},"institutions":[{"id":"https://openalex.org/I193662353","display_name":"Utrecht University","ror":"https://ror.org/04pp8hn57","country_code":"NL","type":"education","lineage":["https://openalex.org/I193662353"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Ren\u00e9 Kager","raw_affiliation_strings":["Institute for Language Sciences, Utrecht University, 3512 JK Utrecht, The Netherlands"],"raw_orcid":"https://orcid.org/0000-0002-5811-839X","affiliations":[{"raw_affiliation_string":"Institute for Language Sciences, Utrecht University, 3512 JK Utrecht, The Netherlands","institution_ids":["https://openalex.org/I193662353"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5030984341","https://openalex.org/A5067849643"],"corresponding_institution_ids":["https://openalex.org/I193662353"],"apc_list":{"value":1600,"currency":"CHF","value_usd":1732},"apc_paid":{"value":1600,"currency":"CHF","value_usd":1732},"fwci":1.6169,"has_fulltext":true,"cited_by_count":4,"citation_normalized_percentile":{"value":0.84020632,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":97},"biblio":{"volume":"7","issue":"7","first_page":"68","last_page":"68"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10730","display_name":"Language Development and Disorders","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10730","display_name":"Language Development and Disorders","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/3204","display_name":"Developmental and Educational Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9951000213623047,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/annotation","display_name":"Annotation","score":0.8130944967269897},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7362831830978394},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6446326375007629},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5945330858230591},{"id":"https://openalex.org/keywords/reading","display_name":"Reading (process)","score":0.5487561225891113},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4437388479709625},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4315144717693329},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4290417730808258},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.1800154447555542}],"concepts":[{"id":"https://openalex.org/C2776321320","wikidata":"https://www.wikidata.org/wiki/Q857525","display_name":"Annotation","level":2,"score":0.8130944967269897},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7362831830978394},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6446326375007629},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5945330858230591},{"id":"https://openalex.org/C554936623","wikidata":"https://www.wikidata.org/wiki/Q199657","display_name":"Reading (process)","level":2,"score":0.5487561225891113},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4437388479709625},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4315144717693329},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4290417730808258},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.1800154447555542},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.3390/mti7070068","is_oa":true,"landing_page_url":"https://doi.org/10.3390/mti7070068","pdf_url":"https://www.mdpi.com/2414-4088/7/7/68/pdf?version=1688367476","source":{"id":"https://openalex.org/S4210226272","display_name":"Multimodal Technologies and Interaction","issn_l":"2414-4088","issn":["2414-4088"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimodal Technologies and Interaction","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:ea2ddf69cb564f179e004d4de5f91c32","is_oa":true,"landing_page_url":"https://doaj.org/article/ea2ddf69cb564f179e004d4de5f91c32","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Multimodal Technologies and Interaction, Vol 7, Iss 7, p 68 (2023)","raw_type":"article"},{"id":"pmh:oai:dspace.library.uu.nl:1874/434191","is_oa":true,"landing_page_url":"https://dspace.library.uu.nl/handle/1874/434191","pdf_url":null,"source":{"id":"https://openalex.org/S4306401649","display_name":"Utrecht University Repository (Utrecht University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I193662353","host_organization_name":"Utrecht University","host_organization_lineage":["https://openalex.org/I193662353"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"pmh:oai:mdpi.com:/2414-4088/7/7/68/","is_oa":true,"landing_page_url":"https://dx.doi.org/10.3390/mti7070068","pdf_url":null,"source":{"id":"https://openalex.org/S4306400947","display_name":"MDPI (MDPI AG)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I4210097602","host_organization_name":"Multidisciplinary Digital Publishing Institute (Switzerland)","host_organization_lineage":["https://openalex.org/I4210097602"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Multimodal Technologies and Interaction; Volume 7; Issue 7; Pages: 68","raw_type":"Text"}],"best_oa_location":{"id":"doi:10.3390/mti7070068","is_oa":true,"landing_page_url":"https://doi.org/10.3390/mti7070068","pdf_url":"https://www.mdpi.com/2414-4088/7/7/68/pdf?version=1688367476","source":{"id":"https://openalex.org/S4210226272","display_name":"Multimodal Technologies and Interaction","issn_l":"2414-4088","issn":["2414-4088"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Multimodal Technologies and Interaction","raw_type":"journal-article"},"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5099999904632568}],"awards":[{"id":"https://openalex.org/G2138816107","display_name":null,"funder_award_id":"024.001.003","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"}],"funders":[{"id":"https://openalex.org/F4320321800","display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek","ror":"https://ror.org/04jsz6e67"}],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4383068138.pdf"},"referenced_works_count":45,"referenced_works":["https://openalex.org/W87954838","https://openalex.org/W200479330","https://openalex.org/W1574649457","https://openalex.org/W1951724000","https://openalex.org/W1966536015","https://openalex.org/W1980096805","https://openalex.org/W1986498119","https://openalex.org/W2012575176","https://openalex.org/W2018913061","https://openalex.org/W2036502463","https://openalex.org/W2068529404","https://openalex.org/W2079226288","https://openalex.org/W2079408923","https://openalex.org/W2086880169","https://openalex.org/W2087508909","https://openalex.org/W2106597857","https://openalex.org/W2123292690","https://openalex.org/W2125979649","https://openalex.org/W2131694695","https://openalex.org/W2133514592","https://openalex.org/W2137564956","https://openalex.org/W2143562645","https://openalex.org/W2152711352","https://openalex.org/W2154600605","https://openalex.org/W2157846663","https://openalex.org/W2172097686","https://openalex.org/W2505877856","https://openalex.org/W2578159187","https://openalex.org/W2582743722","https://openalex.org/W2610616322","https://openalex.org/W2619115632","https://openalex.org/W2626106289","https://openalex.org/W2729190387","https://openalex.org/W2938610567","https://openalex.org/W2978863170","https://openalex.org/W2991832884","https://openalex.org/W3115995371","https://openalex.org/W3118559131","https://openalex.org/W3209383001","https://openalex.org/W4299401138","https://openalex.org/W4301056580","https://openalex.org/W4319656473","https://openalex.org/W4385822293","https://openalex.org/W6684361878","https://openalex.org/W6768605710"],"related_works":["https://openalex.org/W2361861616","https://openalex.org/W2263699433","https://openalex.org/W2377979023","https://openalex.org/W2218034408","https://openalex.org/W2392921965","https://openalex.org/W2358755282","https://openalex.org/W2625833328","https://openalex.org/W1533177136","https://openalex.org/W4380994516","https://openalex.org/W2556260348"],"abstract_inverted_index":{"There":[0],"is":[1,51,178],"a":[2,22,190,200],"large":[3,201],"interest":[4],"in":[5,109,123,130,141],"the":[6,42,91,100,139,154,183],"annotation":[7,43],"of":[8,120,159,203],"speech":[9,14,26,33,49,71,204],"addressed":[10],"to":[11,24,59,83,137,198],"infants.":[12,207],"Infant-directed":[13],"(IDS)":[15,89],"has":[16],"acoustic":[17],"properties":[18],"that":[19,115,169,186],"might":[20],"pose":[21],"challenge":[23],"automatic":[25,187],"recognition":[27],"(ASR)":[28],"tools":[29,37,64],"developed":[30],"for":[31,181,194],"adult-directed":[32],"(ADS).":[34,93],"While":[35,176],"ASR":[36,63,101,162],"could":[38],"potentially":[39],"speed":[40],"up":[41],"process,":[44],"their":[45,84],"effectiveness":[46],"on":[47],"this":[48,55],"register":[50],"currently":[52],"unknown.":[53],"In":[54,94,132],"study,":[56],"we":[57,97,135],"assessed":[58],"what":[60],"extent":[61],"open-source":[62],"can":[65],"successfully":[66],"transcribe":[67,199],"IDS.":[68],"We":[69,113,167],"used":[70],"data":[72],"from":[73],"21":[74],"Dutch":[75],"mothers":[76],"reading":[77],"picture":[78],"books":[79],"containing":[80],"target":[81,107,121],"words":[82,108,122],"18-":[85],"and":[86,90,152,165],"24-month-old":[87],"children":[88],"experimenter":[92],"Experiment":[95,133],"1,":[96],"examined":[98],"how":[99],"tool":[102],"Kaldi-NL":[103,116,164],"performs":[104,171],"at":[105,206],"annotating":[106,142],"IDS":[110,143,149],"vs.":[111],"ADS.":[112,131],"found":[114,118,168],"only":[117],"55.8%":[119],"IDS,":[124],"while":[125],"it":[126],"annotated":[127],"66.8%":[128],"correctly":[129],"2,":[134],"aimed":[136],"assess":[138],"difficulties":[140],"more":[144],"broadly":[145],"by":[146],"transcribing":[147],"all":[148],"utterances":[150],"manually":[151],"comparing":[153],"word":[155],"error":[156],"rates":[157],"(WERs)":[158],"two":[160],"different":[161],"systems:":[163],"WhisperX.":[166],"WhisperX":[170],"significantly":[172],"better":[173],"than":[174],"Kaldi-NL.":[175],"there":[177],"much":[179],"room":[180],"improvement,":[182],"results":[184],"show":[185],"transcriptions":[188],"provide":[189],"promising":[191],"starting":[192],"point":[193],"researchers":[195],"who":[196],"have":[197],"amount":[202],"directed":[205]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
