{"id":"https://openalex.org/W2947006333","doi":"https://doi.org/10.1109/spcom.2018.8724478","title":"Exploring the Role of Speaking-Rate Adaptation on Children's Speech Recognition","display_name":"Exploring the Role of Speaking-Rate Adaptation on Children's Speech Recognition","publication_year":2018,"publication_date":"2018-07-01","ids":{"openalex":"https://openalex.org/W2947006333","doi":"https://doi.org/10.1109/spcom.2018.8724478","mag":"2947006333"},"language":"en","primary_location":{"id":"doi:10.1109/spcom.2018.8724478","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spcom.2018.8724478","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Conference on Signal Processing and Communications (SPCOM)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063682063","display_name":"S. Shahnawazuddin","orcid":"https://orcid.org/0000-0002-3916-9693"},"institutions":[{"id":"https://openalex.org/I11793825","display_name":"National Institute of Technology Patna","ror":"https://ror.org/056wyhh33","country_code":"IN","type":"education","lineage":["https://openalex.org/I11793825","https://openalex.org/I4210152752"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"S. Shahnawazuddin","raw_affiliation_strings":["Department of Electronics and Communication Engineering, NIT Patna, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Communication Engineering, NIT Patna, India","institution_ids":["https://openalex.org/I11793825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003438160","display_name":"Hemant Kumar Kathania","orcid":"https://orcid.org/0000-0002-6367-5203"},"institutions":[{"id":"https://openalex.org/I101326570","display_name":"National Institute of Technology Sikkim","ror":"https://ror.org/04pam3b03","country_code":"IN","type":"education","lineage":["https://openalex.org/I101326570"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Hemant K. Kathania","raw_affiliation_strings":["Department of Electronics and Communication Engineering, NIT Sikkim, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Communication Engineering, NIT Sikkim, India","institution_ids":["https://openalex.org/I101326570"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055274772","display_name":"Chaman Singh","orcid":null},"institutions":[{"id":"https://openalex.org/I11793825","display_name":"National Institute of Technology Patna","ror":"https://ror.org/056wyhh33","country_code":"IN","type":"education","lineage":["https://openalex.org/I11793825","https://openalex.org/I4210152752"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Chaman Singh","raw_affiliation_strings":["Department of Electronics and Communication Engineering, NIT Patna, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Communication Engineering, NIT Patna, India","institution_ids":["https://openalex.org/I11793825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070407855","display_name":"Waquar Ahmad","orcid":"https://orcid.org/0000-0001-7817-3313"},"institutions":[{"id":"https://openalex.org/I101326570","display_name":"National Institute of Technology Sikkim","ror":"https://ror.org/04pam3b03","country_code":"IN","type":"education","lineage":["https://openalex.org/I101326570"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Waquar Ahmad","raw_affiliation_strings":["Department of Electronics and Communication Engineering, NIT Sikkim, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Communication Engineering, NIT Sikkim, India","institution_ids":["https://openalex.org/I101326570"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038771729","display_name":"Gayadhar Pradhan","orcid":"https://orcid.org/0000-0001-7385-6684"},"institutions":[{"id":"https://openalex.org/I11793825","display_name":"National Institute of Technology Patna","ror":"https://ror.org/056wyhh33","country_code":"IN","type":"education","lineage":["https://openalex.org/I11793825","https://openalex.org/I4210152752"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Gayadhar Pradhan","raw_affiliation_strings":["Department of Electronics and Communication Engineering, NIT Patna, India"],"affiliations":[{"raw_affiliation_string":"Department of Electronics and Communication Engineering, NIT Patna, India","institution_ids":["https://openalex.org/I11793825"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5063682063"],"corresponding_institution_ids":["https://openalex.org/I11793825"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.21998662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"257","issue":null,"first_page":"21","last_page":"25"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9947999715805054,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.8006644248962402},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7144194841384888},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6124239563941956},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.5961211323738098},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5807874798774719},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5612835884094238},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.46213406324386597},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.4515279531478882},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4193337559700012},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.30947211384773254},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.13383066654205322},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06732973456382751}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.8006644248962402},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7144194841384888},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6124239563941956},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.5961211323738098},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5807874798774719},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5612835884094238},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.46213406324386597},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.4515279531478882},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4193337559700012},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30947211384773254},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.13383066654205322},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06732973456382751},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/spcom.2018.8724478","is_oa":false,"landing_page_url":"https://doi.org/10.1109/spcom.2018.8724478","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2018 International Conference on Signal Processing and Communications (SPCOM)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W93383444","https://openalex.org/W132121590","https://openalex.org/W160885690","https://openalex.org/W192280404","https://openalex.org/W1524333225","https://openalex.org/W1532531043","https://openalex.org/W1540779870","https://openalex.org/W1969176743","https://openalex.org/W1984446451","https://openalex.org/W1994888226","https://openalex.org/W2066159843","https://openalex.org/W2094954292","https://openalex.org/W2100118853","https://openalex.org/W2115008841","https://openalex.org/W2124243855","https://openalex.org/W2159300614","https://openalex.org/W2160815625","https://openalex.org/W2163089518","https://openalex.org/W2164931619","https://openalex.org/W2338914793","https://openalex.org/W2402172738","https://openalex.org/W2507923760","https://openalex.org/W2587488139","https://openalex.org/W2736786568","https://openalex.org/W2747399100","https://openalex.org/W2755431812","https://openalex.org/W2990489528","https://openalex.org/W4237620266","https://openalex.org/W6603725097","https://openalex.org/W6605448002","https://openalex.org/W6606647699","https://openalex.org/W6631362777","https://openalex.org/W6631949791","https://openalex.org/W6676284021","https://openalex.org/W6703681455","https://openalex.org/W6741240231","https://openalex.org/W6744394073"],"related_works":["https://openalex.org/W1491159402","https://openalex.org/W4297807400","https://openalex.org/W4313854686","https://openalex.org/W2249138175","https://openalex.org/W1197719229","https://openalex.org/W3162054169","https://openalex.org/W2381158726","https://openalex.org/W1516392727","https://openalex.org/W2499802997","https://openalex.org/W2112059504"],"abstract_inverted_index":{"Earlier":[0],"studies":[1],"have":[2,79],"shown":[3],"that,":[4,85],"both":[5],"intra-speaker":[6],"and":[7,135],"inter-speaker":[8],"variabilities":[9],"affect":[10],"the":[11,26,33,45,60,104,114,133,152,183,190],"recognition":[12,18],"performance":[13],"of":[14,47,62,87,106,116,161,185],"any":[15],"automatic":[16],"speech":[17,50,139],"(ASR)":[19],"system.":[20],"The":[21,159],"differences":[22],"in":[23,110,113,147,156,171,182,194,197],"speaking-rate":[24,40,72],"among":[25],"speakers":[27],"is":[28,44,108,129,168,176],"one":[29],"such":[30,63],"factor":[31],"affecting":[32],"system":[34,54],"performance.":[35],"An":[36],"extreme":[37],"example":[38],"where":[39],"variations":[41],"become":[42],"detrimental":[43],"task":[46],"recognizing":[48],"children's":[49,186],"on":[51,71,91],"an":[52],"ASR":[53,65,92,117],"trained":[55],"using":[56,95],"adults'":[57],"speech.":[58],"In":[59,82],"context":[61,115],"mismatched":[64,187],"tasks,":[66],"only":[67],"a":[68],"few":[69],"works":[70],"adaptation":[73,128],"(SRA)":[74],"through":[75],"time-scale":[76],"modification":[77,167,175],"(TSM)":[78],"been":[80],"reported.":[81],"addition":[83],"to":[84,144,178],"effect":[86,160],"TSM":[88],"was":[89],"explored":[90],"systems":[93,118],"developed":[94],"Gaussian":[96],"mixture":[97],"models":[98],"(GMM).":[99],"Motivated":[100],"by":[101,131,151],"these":[102],"facts,":[103],"role":[105],"SRA":[107,142,163],"studied":[109,170],"this":[111,157,172],"work":[112],"employing":[119],"deep":[120],"neural":[121],"networks":[122],"(DNN)":[123],"for":[124],"statistical":[125],"modeling.":[126],"Further,":[127],"done":[130],"changing":[132],"frame-length":[134],"overlap":[136],"during":[137],"front-end":[138],"parameterization":[140],"phase.":[141],"leads":[143],"significant":[145],"reductions":[146,196],"errors":[148],"as":[149],"demonstrated":[150],"experimental":[153],"evaluations":[154],"reported":[155,177],"work.":[158],"combining":[162],"with":[164],"explicit":[165],"pitch":[166],"also":[169],"paper.":[173],"Pitch":[174],"be":[179],"very":[180],"effective":[181],"case":[184],"ASR.":[188],"Combining":[189],"two":[191],"techniques":[192],"results":[193],"additive":[195],"errors.":[198]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
