{"id":"https://openalex.org/W2111372986","doi":"https://doi.org/10.21437/interspeech.2004-675","title":"Investigating speech style specific pronunciation variation in large spoken language corpora","display_name":"Investigating speech style specific pronunciation variation in large spoken language corpora","publication_year":2004,"publication_date":"2004-10-04","ids":{"openalex":"https://openalex.org/W2111372986","doi":"https://doi.org/10.21437/interspeech.2004-675","mag":"2111372986"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2004-675","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-675","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"http://hdl.handle.net/2066/61950","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041743748","display_name":"Christophe Van Bael","orcid":null},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Christophe Van Bael","raw_affiliation_strings":["Radboud University Nijmegen#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Radboud University Nijmegen#TAB#","institution_ids":["https://openalex.org/I145872427"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042937911","display_name":"Henk van den Heuvel","orcid":"https://orcid.org/0000-0003-2064-0630"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Henk van den Heuvel","raw_affiliation_strings":["Radboud University Nijmegen#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Radboud University Nijmegen#TAB#","institution_ids":["https://openalex.org/I145872427"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019585114","display_name":"Helmer Strik","orcid":"https://orcid.org/0000-0003-1722-3465"},"institutions":[{"id":"https://openalex.org/I145872427","display_name":"Radboud University Nijmegen","ror":"https://ror.org/016xsfp80","country_code":"NL","type":"education","lineage":["https://openalex.org/I145872427"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Helmer Strik","raw_affiliation_strings":["Radboud University Nijmegen#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Radboud University Nijmegen#TAB#","institution_ids":["https://openalex.org/I145872427"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.313,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.89785876,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2793","last_page":"2796"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10403","display_name":"Phonetics and Phonology Research","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/3205","display_name":"Experimental and Cognitive Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8093425035476685},{"id":"https://openalex.org/keywords/pronunciation","display_name":"Pronunciation","score":0.7559812664985657},{"id":"https://openalex.org/keywords/spoken-language","display_name":"Spoken language","score":0.7525745630264282},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6666110157966614},{"id":"https://openalex.org/keywords/variation","display_name":"Variation (astronomy)","score":0.608547031879425},{"id":"https://openalex.org/keywords/style","display_name":"Style (visual arts)","score":0.5946813821792603},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.546353816986084},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5402289628982544},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.5142166614532471},{"id":"https://openalex.org/keywords/transcription","display_name":"Transcription (linguistics)","score":0.4992380142211914},{"id":"https://openalex.org/keywords/corpus-linguistics","display_name":"Corpus linguistics","score":0.4402981698513031},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3441472053527832},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.21764299273490906},{"id":"https://openalex.org/keywords/history","display_name":"History","score":0.08481615781784058}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8093425035476685},{"id":"https://openalex.org/C2780844864","wikidata":"https://www.wikidata.org/wiki/Q184377","display_name":"Pronunciation","level":2,"score":0.7559812664985657},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.7525745630264282},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6666110157966614},{"id":"https://openalex.org/C2778334786","wikidata":"https://www.wikidata.org/wiki/Q1586270","display_name":"Variation (astronomy)","level":2,"score":0.608547031879425},{"id":"https://openalex.org/C2776445246","wikidata":"https://www.wikidata.org/wiki/Q1792644","display_name":"Style (visual arts)","level":2,"score":0.5946813821792603},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.546353816986084},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5402289628982544},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.5142166614532471},{"id":"https://openalex.org/C179926584","wikidata":"https://www.wikidata.org/wiki/Q207714","display_name":"Transcription (linguistics)","level":2,"score":0.4992380142211914},{"id":"https://openalex.org/C532629269","wikidata":"https://www.wikidata.org/wiki/Q865083","display_name":"Corpus linguistics","level":2,"score":0.4402981698513031},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3441472053527832},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.21764299273490906},{"id":"https://openalex.org/C95457728","wikidata":"https://www.wikidata.org/wiki/Q309","display_name":"History","level":0,"score":0.08481615781784058},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C44870925","wikidata":"https://www.wikidata.org/wiki/Q37547","display_name":"Astrophysics","level":1,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.21437/interspeech.2004-675","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2004-675","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2004","raw_type":"proceedings-article"},{"id":"pmh:ru:oai:repository.ubn.ru.nl:2066/61950","is_oa":true,"landing_page_url":"http://hdl.handle.net/2066/61950","pdf_url":"http://hdl.handle.net/2066/61950","source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proceedings of Interspeech-ICSLP 2004, CD-ROM. Jeju, Korea : [S.n.]","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.5.4243","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.5.4243","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://lands.let.kun.nl/literature/vanbael.2004.2.pdf","raw_type":"text"}],"best_oa_location":{"id":"pmh:ru:oai:repository.ubn.ru.nl:2066/61950","is_oa":true,"landing_page_url":"http://hdl.handle.net/2066/61950","pdf_url":"http://hdl.handle.net/2066/61950","source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Proceedings of Interspeech-ICSLP 2004, CD-ROM. Jeju, Korea : [S.n.]","raw_type":"info:eu-repo/semantics/article"},"sustainable_development_goals":[{"display_name":"Quality Education","score":0.8199999928474426,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2111372986.pdf","grobid_xml":"https://content.openalex.org/works/W2111372986.grobid-xml"},"referenced_works_count":5,"referenced_works":["https://openalex.org/W29952999","https://openalex.org/W2096883086","https://openalex.org/W2105275276","https://openalex.org/W2116854048","https://openalex.org/W2132133133"],"related_works":["https://openalex.org/W2917843404","https://openalex.org/W3114261385","https://openalex.org/W1533950946","https://openalex.org/W2141266967","https://openalex.org/W113515668","https://openalex.org/W2155576284","https://openalex.org/W2068512280","https://openalex.org/W4366957107","https://openalex.org/W1587721369","https://openalex.org/W3096124370"],"abstract_inverted_index":{"In":[0],"the":[1,17,31,54,98,133],"past,":[2],"linguistic":[3,42,63,128],"research":[4,18,44],"was":[5,50,66,81],"typically":[6],"conducted":[7,51,82],"on":[8,46],"relatively":[9],"small":[10],"datasets":[11],"that":[12,102,118],"were":[13],"specifically":[14],"designed":[15],"for":[16,62,132],"at":[19],"hand.Whereas":[20],"to":[21,52,127],"date":[22],"many":[23],"large":[24,57,85,115,119],"spoken":[25,59,87,122],"language":[26,60,88,123],"corpora":[27,35,61,124],"have":[28],"become":[29],"available,":[30],"usefulness":[32],"of":[33,56,68,97,135],"these":[34],"is":[36],"still":[37],"not":[38],"fully":[39],"established":[40],"in":[41,47,72,112],"research.The":[43,64],"reported":[45],"this":[48,76],"paper":[49],"illustrate":[53],"potential":[55],"multi-purpose":[58,86],"possibility":[65],"investigated":[67],"identifying":[69],"phonetic":[70,95],"regularities":[71],"different":[73],"speech":[74,103],"styles.To":[75],"end,":[77],"a":[78,84,91,114],"datadriven":[79],"study":[80],"with":[83],"corpus":[89],"comprising":[90],"manually":[92],"corrected":[93],"broad":[94],"transcription":[96],"data.Our":[99],"results":[100],"show":[101],"style":[104],"specific":[105],"pronunciation":[106],"processes":[107],"can":[108,125],"indeed":[109],"be":[110],"found":[111],"such":[113],"corpus.This":[116],"indicates":[117],"multi":[120],"purpose":[121,134],"contribute":[126],"research,":[129],"if":[130],"only":[131],"hypothesis":[136],"generation":[137],"and":[138],"verification.":[139]},"counts_by_year":[{"year":2021,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
