{"id":"https://openalex.org/W2408662956","doi":"https://doi.org/10.21437/interspeech.2010-350","title":"A corpus-based approach to speech enhancement from nonstationary noise","display_name":"A corpus-based approach to speech enhancement from nonstationary noise","publication_year":2010,"publication_date":"2010-09-26","ids":{"openalex":"https://openalex.org/W2408662956","doi":"https://doi.org/10.21437/interspeech.2010-350","mag":"2408662956"},"language":"en","primary_location":{"id":"doi:10.21437/interspeech.2010-350","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2010-350","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2010","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101838286","display_name":"Ji Ming","orcid":"https://orcid.org/0000-0001-6887-2591"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ji Ming","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111724942","display_name":"Ramji Srinivasan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramji Srinivasan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5000739686","display_name":"Danny Crookes","orcid":"https://orcid.org/0000-0002-3533-6095"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Danny Crookes","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101838286"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.6971,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.91226819,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1097","last_page":"1100"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9848999977111816,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9836999773979187,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7936064004898071},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.7694189548492432},{"id":"https://openalex.org/keywords/timit","display_name":"TIMIT","score":0.6929048299789429},{"id":"https://openalex.org/keywords/speech-corpus","display_name":"Speech corpus","score":0.6343575119972229},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.6002755165100098},{"id":"https://openalex.org/keywords/sentence","display_name":"Sentence","score":0.5676239132881165},{"id":"https://openalex.org/keywords/speech-enhancement","display_name":"Speech enhancement","score":0.5226523876190186},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.5110260248184204},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4735026955604553},{"id":"https://openalex.org/keywords/noise-measurement","display_name":"Noise measurement","score":0.4727034568786621},{"id":"https://openalex.org/keywords/background-noise","display_name":"Background noise","score":0.43755853176116943},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3550250828266144},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.25201117992401123},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.21714860200881958},{"id":"https://openalex.org/keywords/speech-synthesis","display_name":"Speech synthesis","score":0.20738255977630615}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7936064004898071},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.7694189548492432},{"id":"https://openalex.org/C2778724510","wikidata":"https://www.wikidata.org/wiki/Q7670405","display_name":"TIMIT","level":3,"score":0.6929048299789429},{"id":"https://openalex.org/C91863865","wikidata":"https://www.wikidata.org/wiki/Q4349497","display_name":"Speech corpus","level":3,"score":0.6343575119972229},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.6002755165100098},{"id":"https://openalex.org/C2777530160","wikidata":"https://www.wikidata.org/wiki/Q41796","display_name":"Sentence","level":2,"score":0.5676239132881165},{"id":"https://openalex.org/C2776182073","wikidata":"https://www.wikidata.org/wiki/Q7575395","display_name":"Speech enhancement","level":3,"score":0.5226523876190186},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.5110260248184204},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4735026955604553},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.4727034568786621},{"id":"https://openalex.org/C100675267","wikidata":"https://www.wikidata.org/wiki/Q1371624","display_name":"Background noise","level":2,"score":0.43755853176116943},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3550250828266144},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.25201117992401123},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.21714860200881958},{"id":"https://openalex.org/C14999030","wikidata":"https://www.wikidata.org/wiki/Q16346","display_name":"Speech synthesis","level":2,"score":0.20738255977630615},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.21437/interspeech.2010-350","is_oa":false,"landing_page_url":"https://doi.org/10.21437/interspeech.2010-350","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Interspeech 2010","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.8199999928474426}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2597829360","https://openalex.org/W4375869169","https://openalex.org/W3127686677","https://openalex.org/W2921661700","https://openalex.org/W2138406058","https://openalex.org/W2157102033","https://openalex.org/W2131486661","https://openalex.org/W2153897396","https://openalex.org/W4375869276","https://openalex.org/W1585241115"],"abstract_inverted_index":{"Temporal":[0],"dynamics":[1,128,176],"and":[2,100,129,133,157,181,194,237,254],"speaker":[3,131],"characteristics":[4],"are":[5,88,94],"two":[6,27],"important":[7],"features":[8,28],"of":[9,29,70,166,231],"speech":[10,13,30,32,65,73,81,86,120,143,226],"that":[11,36],"distinguish":[12],"from":[14,84,139,228],"noise.":[15,56],"In":[16,77],"this":[17,37],"paper,":[18],"we":[19],"propose":[20],"a":[21,85,167],"method":[22],"to":[23,52,170,173,184,204],"maximally":[24],"extract":[25],"these":[26],"for":[31,42,54,225],"enhancement.":[33],"We":[34],"demonstrate":[35],"can":[38,49,134],"reduce":[39],"the":[40,46,60,71,78,97,101,110,116,149,154,159,178,186,191,195,214,222],"requirement":[41],"prior":[43],"information":[44],"about":[45],"noise,":[47],"which":[48],"be":[50,135],"difficult":[51],"estimate":[53,105],"fast-varying":[55],"Given":[57],"noisy":[58,98,192],"speech,":[59,180],"new":[61,163,241],"approach":[62,164,242],"estimates":[63],"clean":[64,72,80],"by":[66,108,207],"recognizing":[67],"long":[68],"segments":[69,93,113,121,152,189],"as":[74,90,122],"whole":[75,123],"units.":[76],"recognition,":[79],"sentences,":[82],"taken":[83],"corpus,":[87],"used":[89],"examples.":[91],"Matching":[92],"identified":[95,136],"between":[96,190],"sentence":[99,193],"corpus":[102,117,179,196,215],"sentences.":[103,118,197,216],"The":[104,162,198,240],"is":[106,200],"formed":[107],"using":[109],"longest":[111,150,187],"matching":[112,188],"found":[114],"in":[115,177,251],"Longer":[119],"units":[124],"contain":[125],"more":[126,137,202],"distinct":[127],"richer":[130],"characteristics,":[132],"accurately":[138],"noise":[140,155,205,211,233],"than":[141],"shorter":[142],"segments.":[144],"Therefore,":[145],"estimation":[146,160],"based":[147,210],"on":[148,221],"recognized":[151],"increases":[153],"immunity":[156],"hence":[158],"accuracy.":[161],"consists":[165],"statistical":[168],"model":[169],"represent":[171],"up":[172],"sentence-long":[174],"temporal":[175],"an":[182],"algorithm":[183,199],"identify":[185],"made":[201],"robust":[203],"uncertainty":[206],"introducing":[208],"missing-feature":[209],"compensation":[212],"into":[213],"Experiments":[217],"have":[218],"been":[219],"conducted":[220],"TIMIT":[223],"database":[224],"enhancement":[227,249],"various":[229],"types":[230],"nonstationary":[232],"including":[234],"song,":[235],"music,":[236],"crosstalk":[238],"speech.":[239],"has":[243],"shown":[244],"improved":[245],"performance":[246],"over":[247],"conventional":[248],"algorithms":[250],"both":[252],"objective":[253],"subjective":[255],"evaluations.":[256]},"counts_by_year":[{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":2},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":2},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
