{"id":"https://openalex.org/W3027727382","doi":"https://doi.org/10.1142/s2717554520500034","title":"A Study on the Robustness of Pitch-Range Estimation from Brief Speech Segments","display_name":"A Study on the Robustness of Pitch-Range Estimation from Brief Speech Segments","publication_year":2020,"publication_date":"2020-03-01","ids":{"openalex":"https://openalex.org/W3027727382","doi":"https://doi.org/10.1142/s2717554520500034","mag":"3027727382"},"language":"en","primary_location":{"id":"doi:10.1142/s2717554520500034","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s2717554520500034","pdf_url":null,"source":{"id":"https://openalex.org/S4210231678","display_name":"International Journal of Asian Language Processing","issn_l":"2424-791X","issn":["2424-791X","2717-5545"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Asian Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5044523094","display_name":"Wenjie Peng","orcid":"https://orcid.org/0009-0004-9891-9898"},"institutions":[{"id":"https://openalex.org/I115212828","display_name":"Beijing Language and Culture University","ror":"https://ror.org/03te2zs36","country_code":"CN","type":"education","lineage":["https://openalex.org/I115212828"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wenjie Peng","raw_affiliation_strings":["Research Institute of International Chinese Language Education, Beijing Language and Culture University, Beijing 100083, P. R. China","School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China"],"affiliations":[{"raw_affiliation_string":"Research Institute of International Chinese Language Education, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]},{"raw_affiliation_string":"School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074965408","display_name":"Kaiqi Fu","orcid":null},"institutions":[{"id":"https://openalex.org/I115212828","display_name":"Beijing Language and Culture University","ror":"https://ror.org/03te2zs36","country_code":"CN","type":"education","lineage":["https://openalex.org/I115212828"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaiqi Fu","raw_affiliation_strings":["Beijing Advanced Innovation Center for Language Resources, Beijing Language and Culture University, Beijing 100083, P. R. China","School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China"],"affiliations":[{"raw_affiliation_string":"Beijing Advanced Innovation Center for Language Resources, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]},{"raw_affiliation_string":"School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100666890","display_name":"Zhang Wei","orcid":"https://orcid.org/0000-0003-2705-9822"},"institutions":[{"id":"https://openalex.org/I115212828","display_name":"Beijing Language and Culture University","ror":"https://ror.org/03te2zs36","country_code":"CN","type":"education","lineage":["https://openalex.org/I115212828"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Zhang","raw_affiliation_strings":["School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China"],"affiliations":[{"raw_affiliation_string":"School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006684220","display_name":"Yanlu Xie","orcid":"https://orcid.org/0000-0001-6765-4808"},"institutions":[{"id":"https://openalex.org/I115212828","display_name":"Beijing Language and Culture University","ror":"https://ror.org/03te2zs36","country_code":"CN","type":"education","lineage":["https://openalex.org/I115212828"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanlu Xie","raw_affiliation_strings":["School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China"],"affiliations":[{"raw_affiliation_string":"School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052176517","display_name":"Jinsong Zhang","orcid":"https://orcid.org/0000-0002-1603-3136"},"institutions":[{"id":"https://openalex.org/I115212828","display_name":"Beijing Language and Culture University","ror":"https://ror.org/03te2zs36","country_code":"CN","type":"education","lineage":["https://openalex.org/I115212828"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jinsong Zhang","raw_affiliation_strings":["Beijing Advanced Innovation Center for Language Resources, Beijing Language and Culture University, Beijing 100083, P. R. China","Research Institute of International Chinese Language Education, Beijing Language and Culture University, Beijing 100083, P. R. China","School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China"],"affiliations":[{"raw_affiliation_string":"Beijing Advanced Innovation Center for Language Resources, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]},{"raw_affiliation_string":"Research Institute of International Chinese Language Education, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]},{"raw_affiliation_string":"School of Information Science, Beijing Language and Culture University, Beijing 100083, P. R. China","institution_ids":["https://openalex.org/I115212828"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5052176517"],"corresponding_institution_ids":["https://openalex.org/I115212828"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.05168538,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"30","issue":"01","first_page":"2050003","last_page":"2050003"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8364554643630981},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7035442590713501},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6904584169387817},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.6590186357498169},{"id":"https://openalex.org/keywords/word-error-rate","display_name":"Word error rate","score":0.5853074193000793},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.4818117022514343},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.37383902072906494},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.33469223976135254},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.06367290019989014}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8364554643630981},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7035442590713501},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6904584169387817},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.6590186357498169},{"id":"https://openalex.org/C40969351","wikidata":"https://www.wikidata.org/wiki/Q3516228","display_name":"Word error rate","level":2,"score":0.5853074193000793},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.4818117022514343},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.37383902072906494},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.33469223976135254},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.06367290019989014},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1142/s2717554520500034","is_oa":false,"landing_page_url":"https://doi.org/10.1142/s2717554520500034","pdf_url":null,"source":{"id":"https://openalex.org/S4210231678","display_name":"International Journal of Asian Language Processing","issn_l":"2424-791X","issn":["2424-791X","2717-5545"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319815","host_organization_name":"World Scientific","host_organization_lineage":["https://openalex.org/P4310319815"],"host_organization_lineage_names":["World Scientific"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"International Journal of Asian Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.7799999713897705,"display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W397522103","https://openalex.org/W2005708641","https://openalex.org/W2013645463","https://openalex.org/W2038289177","https://openalex.org/W2055517685","https://openalex.org/W2069826235","https://openalex.org/W2130994140","https://openalex.org/W2195693064","https://openalex.org/W2484174190","https://openalex.org/W2944329943","https://openalex.org/W4213127156"],"related_works":["https://openalex.org/W2309273277","https://openalex.org/W2061937230","https://openalex.org/W1769849273","https://openalex.org/W1574295218","https://openalex.org/W113247760","https://openalex.org/W2547793174","https://openalex.org/W2070212102","https://openalex.org/W2544241817","https://openalex.org/W2158882055","https://openalex.org/W2914603036"],"abstract_inverted_index":{"Pitch-range":[0],"estimation":[1,47,110,174],"from":[2,156],"brief":[3,55],"speech":[4,14,51],"segments":[5],"could":[6,43],"bring":[7],"benefits":[8],"to":[9,27,127,148],"many":[10],"tasks":[11],"like":[12],"automatic":[13],"recognition":[15],"and":[16,42,87],"speaker":[17],"recognition.":[18],"To":[19],"estimate":[20],"pitch":[21],"range,":[22],"previous":[23],"studies":[24],"have":[25],"proposed":[26],"utilize":[28],"deep-learning-based":[29],"models":[30],"with":[31,91],"spectrum":[32],"information":[33,136],"as":[34,54,56],"input.":[35],"They":[36],"demonstrated":[37],"that":[38,128],"such":[39],"method":[40,151],"works":[41],"still":[44],"achieve":[45],"reliable":[46],"results":[48,95,166],"when":[49],"the":[50,64,71,109,122,130,139,149,157,168,171],"segment":[52],"is":[53,125,145],"300":[57],"ms.":[58],"In":[59],"this":[60,67,143],"study,":[61],"we":[62],"evaluated":[63,120],"robustness":[65],"of":[66,80,101,105,159,170],"method.":[68,175],"We":[69],"take":[70],"following":[72],"scenarios":[73],"into":[74],"account:":[75],"(1)":[76,98],"a":[77,102],"large":[78,103],"number":[79,104],"training":[81,106],"speakers;":[82],"(2)":[83,112],"different":[84,92],"language":[85],"backgrounds;":[86],"(3)":[88,133],"monosyllabic":[89],"utterances":[90],"tones.":[93],"Experimental":[94],"showed":[96],"that:":[97],"The":[99,113],"use":[100],"speakers":[107,124],"improved":[108],"accuracies.":[111],"mean":[114],"absolute":[115],"percentage":[116],"error":[117],"(MAPE)":[118],"rate":[119],"on":[121,129],"L2":[123],"similar":[126],"native":[131],"speakers.":[132],"Different":[134],"tonal":[135],"will":[137],"affect":[138],"LSTM-based":[140,172],"model,":[141],"but":[142],"influence":[144],"limited":[146],"compared":[147],"baseline":[150],"which":[152],"calculates":[153],"pitch-range":[154,173],"targets":[155],"distribution":[158],"[Formula:":[160],"see":[161],"text]0":[162],"values.":[163],"These":[164],"experimental":[165],"verified":[167],"efficiency":[169]},"counts_by_year":[],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
