{"id":"https://openalex.org/W104734300","doi":"https://doi.org/10.21437/icslp.2000-417","title":"Robust fundamental frequency estimation using instantaneous frequencies of harmonic components","display_name":"Robust fundamental frequency estimation using instantaneous frequencies of harmonic components","publication_year":2000,"publication_date":"2000-10-16","ids":{"openalex":"https://openalex.org/W104734300","doi":"https://doi.org/10.21437/icslp.2000-417","mag":"104734300"},"language":"en","primary_location":{"id":"doi:10.21437/icslp.2000-417","is_oa":false,"landing_page_url":"https://doi.org/10.21437/icslp.2000-417","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th International Conference on Spoken Language Processing (ICSLP 2000)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://naist.repo.nii.ac.jp/records/4759","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055382586","display_name":"Yoshinori Atake","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yoshinori Atake","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078342732","display_name":"Toshio Irino","orcid":"https://orcid.org/0000-0002-7691-4189"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Toshio Irino","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072749858","display_name":"Hideki Kawahara","orcid":"https://orcid.org/0000-0001-9360-5700"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hideki Kawahara","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051000206","display_name":"Jinlin Lu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jinlin Lu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011428539","display_name":"Satoshi Nakamura","orcid":"https://orcid.org/0000-0001-7978-0705"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Satoshi Nakamura","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5021868389","display_name":"Kiyohiro Shikano","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kiyohiro Shikano","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.942,"has_fulltext":true,"cited_by_count":27,"citation_normalized_percentile":{"value":0.90671556,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"2","issue":null,"first_page":"vol. 2, 907","last_page":"910"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.8985999822616577,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.8985999822616577,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.828000009059906,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/beijing","display_name":"Beijing","score":0.7378431558609009},{"id":"https://openalex.org/keywords/harmonic","display_name":"Harmonic","score":0.6344776153564453},{"id":"https://openalex.org/keywords/fundamental-frequency","display_name":"Fundamental frequency","score":0.5778385400772095},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5749544501304626},{"id":"https://openalex.org/keywords/harmonic-analysis","display_name":"Harmonic analysis","score":0.5387654304504395},{"id":"https://openalex.org/keywords/estimation","display_name":"Estimation","score":0.44224268198013306},{"id":"https://openalex.org/keywords/time\u2013frequency-analysis","display_name":"Time\u2013frequency analysis","score":0.4324345886707306},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.40771588683128357},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.38557323813438416},{"id":"https://openalex.org/keywords/electronic-engineering","display_name":"Electronic engineering","score":0.368141233921051},{"id":"https://openalex.org/keywords/china","display_name":"China","score":0.28223907947540283},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.2114247977733612},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.18851983547210693},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.17051175236701965},{"id":"https://openalex.org/keywords/geography","display_name":"Geography","score":0.100617915391922}],"concepts":[{"id":"https://openalex.org/C2778304055","wikidata":"https://www.wikidata.org/wiki/Q657474","display_name":"Beijing","level":3,"score":0.7378431558609009},{"id":"https://openalex.org/C127934551","wikidata":"https://www.wikidata.org/wiki/Q1148098","display_name":"Harmonic","level":2,"score":0.6344776153564453},{"id":"https://openalex.org/C10513763","wikidata":"https://www.wikidata.org/wiki/Q1331774","display_name":"Fundamental frequency","level":2,"score":0.5778385400772095},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5749544501304626},{"id":"https://openalex.org/C131770355","wikidata":"https://www.wikidata.org/wiki/Q876215","display_name":"Harmonic analysis","level":2,"score":0.5387654304504395},{"id":"https://openalex.org/C96250715","wikidata":"https://www.wikidata.org/wiki/Q965330","display_name":"Estimation","level":2,"score":0.44224268198013306},{"id":"https://openalex.org/C142433447","wikidata":"https://www.wikidata.org/wiki/Q7806653","display_name":"Time\u2013frequency analysis","level":3,"score":0.4324345886707306},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.40771588683128357},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.38557323813438416},{"id":"https://openalex.org/C24326235","wikidata":"https://www.wikidata.org/wiki/Q126095","display_name":"Electronic engineering","level":1,"score":0.368141233921051},{"id":"https://openalex.org/C191935318","wikidata":"https://www.wikidata.org/wiki/Q148","display_name":"China","level":2,"score":0.28223907947540283},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.2114247977733612},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.18851983547210693},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.17051175236701965},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.100617915391922},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.0},{"id":"https://openalex.org/C166957645","wikidata":"https://www.wikidata.org/wiki/Q23498","display_name":"Archaeology","level":1,"score":0.0},{"id":"https://openalex.org/C201995342","wikidata":"https://www.wikidata.org/wiki/Q682496","display_name":"Systems engineering","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.21437/icslp.2000-417","is_oa":false,"landing_page_url":"https://doi.org/10.21437/icslp.2000-417","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"6th International Conference on Spoken Language Processing (ICSLP 2000)","raw_type":"proceedings-article"},{"id":"pmh:oai:irdb.nii.ac.jp:01146:0005783210","is_oa":true,"landing_page_url":"https://naist.repo.nii.ac.jp/records/4759","pdf_url":null,"source":{"id":"https://openalex.org/S7407056385","display_name":"Institutional Repositories DataBase (IRDB)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I184597095","host_organization_name":"National Institute of Informatics","host_organization_lineage":["https://openalex.org/I184597095"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":null,"raw_type":"conference paper"}],"best_oa_location":{"id":"pmh:oai:irdb.nii.ac.jp:01146:0005783210","is_oa":true,"landing_page_url":"https://naist.repo.nii.ac.jp/records/4759","pdf_url":null,"source":{"id":"https://openalex.org/S7407056385","display_name":"Institutional Repositories DataBase (IRDB)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I184597095","host_organization_name":"National Institute of Informatics","host_organization_lineage":["https://openalex.org/I184597095"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":null,"raw_type":"conference paper"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.5799999833106995}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2394544468","https://openalex.org/W2056455302","https://openalex.org/W2587667458","https://openalex.org/W2068237456","https://openalex.org/W1861882962","https://openalex.org/W2109998678","https://openalex.org/W2164070943","https://openalex.org/W2163128389","https://openalex.org/W2121926536","https://openalex.org/W1497667432"],"abstract_inverted_index":{"This":[0,11],"paper":[1],"proposes":[2],"a":[3,39,58,132,220],"noise-tolerant":[4],"method":[5,12,147,180,195,224],"for":[6,115,167,228,242],"fundamental":[7],"frequency":[8],"(F0)":[9],"extraction.":[10],"includes":[13],"several":[14],"new":[15],"ideas,":[16],"including":[17,102],"the":[18,21,25,30,44,48,53,96,121,124,145,154,158,174,178,182,192,198,206,214,222,226,239],"estimation":[19],"of":[20,24,32,62,65,76,95,106,153,177,205],"instantaneous":[22],"frequencies":[23],"higher":[26],"harmonic":[27,49],"components,":[28],"and":[29,68,83,131,181,188,197,202,232],"design":[31],"an":[33,127],"adaptive":[34],"weighting":[35],"function":[36,200],"based":[37],"on":[38],"bandwidth":[40],"equation":[41],"that":[42],"combines":[43],"F0":[45,134],"information":[46],"in":[47,91,137],"components.":[50],"To":[51],"evaluate":[52],"proposed":[54,122,146,179,223],"method,":[55,123,130],"we":[56],"constructed":[57],"relatively":[59],"large":[60],"database":[61,74],"simultaneous":[63],"recordings":[64],"speech":[66],"waveforms":[67],"EGG":[69],"(Electro":[70],"Glotto":[71],"Graphy).":[72],"The":[73,93,108,139],"consists":[75],"30":[77],"sentences":[78,90],"pronounced":[79],"by":[80],"14":[81,84],"male":[82],"female":[85],"normal":[86],"subjects,":[87],"i.e.,":[88,120],"840":[89],"total.":[92],"duration":[94],"sound":[97],"is":[98,148,160,216],"about":[99,103,163,186],"35":[100],"minutes":[101,105],"20":[104],"voicing.":[107],"experiments":[109],"were":[110,141],"performed":[111],"with":[112],"additive":[113],"noise":[114],"four":[116],"pitch":[117],"extraction":[118,135],"methods,":[119],"original":[125,183,240],"TEMPO,":[126],"improved":[128,193],"cepstrum":[129,194],"common":[133],"program":[136],"ESPS.":[138],"results":[140],"as":[142],"follows:":[143],"1)":[144],"always":[149],"better":[150,190],"than":[151,162,191,211],"any":[152],"other":[155],"methods":[156,207],"when":[157,213],"SNR":[159,169,215,230,244],"greater":[161],"2":[164],"dB;":[165],"2)":[166],"high":[168,235,243],"values":[170,231],"(>":[171],"15":[172],"dB),":[173],"correct":[175],"rates":[176],"TEMPO":[184,241],"are":[185],"95%":[187],"much":[189],"(92%)":[196],"ESPS":[199],"(89%);":[201],"3)":[203],"all":[204],"degrade":[208],"to":[209],"less":[210],"62%":[212],"0":[217],"dB.":[218],"As":[219],"result,":[221],"improves":[225],"performance":[227],"low":[229],"also":[233],"maintains":[234],"accuracy":[236],"inherent":[237],"from":[238],"values.":[245]},"counts_by_year":[{"year":2022,"cited_by_count":1},{"year":2017,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
