{"id":"https://openalex.org/W2107508685","doi":"https://doi.org/10.1109/asru.2009.5373230","title":"Robust speech recognition using a Small Power Boosting algorithm","display_name":"Robust speech recognition using a Small Power Boosting algorithm","publication_year":2009,"publication_date":"2009-12-01","ids":{"openalex":"https://openalex.org/W2107508685","doi":"https://doi.org/10.1109/asru.2009.5373230","mag":"2107508685"},"language":"en","primary_location":{"id":"doi:10.1109/asru.2009.5373230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2009.5373230","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100684423","display_name":"Chanwoo Kim","orcid":"https://orcid.org/0000-0003-2526-4371"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Chanwoo Kim","raw_affiliation_strings":["Language Technologies Institute, Carnegie Mellon University, Pittsburgh, PA, USA","Department of Electrical and Computer Engineering and Language Technologies Institute, Carnegie Mellon University, Pittsburgh PA 15213 USA#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Language Technologies Institute, Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering and Language Technologies Institute, Carnegie Mellon University, Pittsburgh PA 15213 USA#TAB#","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047826067","display_name":"Kshitiz Kumar","orcid":"https://orcid.org/0000-0003-2728-2493"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kshitiz Kumar","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Carnegie Mellon University, Pittsburgh, PA, USA","Department of Electrical and Computer Engineering and Language Technologies Institute, Carnegie Mellon University, Pittsburgh PA 15213 USA#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering and Language Technologies Institute, Carnegie Mellon University, Pittsburgh PA 15213 USA#TAB#","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069424860","display_name":"Richard M. Stern","orcid":"https://orcid.org/0000-0003-0557-7282"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Richard M. Stern","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Language Technologies Institute, Carnegie Mellon University, Pittsburgh, PA, USA","Department of Electrical and Computer Engineering and Language Technologies Institute, Carnegie Mellon University, Pittsburgh PA 15213 USA#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Language Technologies Institute, Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]},{"raw_affiliation_string":"Department of Electrical and Computer Engineering and Language Technologies Institute, Carnegie Mellon University, Pittsburgh PA 15213 USA#TAB#","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100684423"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":1.428,"has_fulltext":false,"cited_by_count":17,"citation_normalized_percentile":{"value":0.81109047,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":"82","issue":null,"first_page":"243","last_page":"248"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/boosting","display_name":"Boosting (machine learning)","score":0.7508231401443481},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7088314294815063},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5564565062522888},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4301599860191345},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.37564271688461304},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3475760221481323}],"concepts":[{"id":"https://openalex.org/C46686674","wikidata":"https://www.wikidata.org/wiki/Q466303","display_name":"Boosting (machine learning)","level":2,"score":0.7508231401443481},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7088314294815063},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5564565062522888},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4301599860191345},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.37564271688461304},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3475760221481323}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/asru.2009.5373230","is_oa":false,"landing_page_url":"https://doi.org/10.1109/asru.2009.5373230","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE Workshop on Automatic Speech Recognition &amp; Understanding","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.155.1430","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.155.1430","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www-2.cs.cmu.edu/afs/cs/user/robust/www/Papers/KimASRU09_SPB.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.368.9733","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.368.9733","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cs.cmu.edu/~chanwook/MyPapers/SPB_ASRU_ver13_PS2PDF.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.8199999928474426,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G1537112261","display_name":"Robust Automatic Speech Recognition Based on Auditory Processing and Sound Separation","funder_award_id":"0420866","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G786853897","display_name":null,"funder_award_id":"IIS-0420866","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W15113896","https://openalex.org/W177521823","https://openalex.org/W1489184006","https://openalex.org/W1545406001","https://openalex.org/W1586342741","https://openalex.org/W1607274768","https://openalex.org/W1840695391","https://openalex.org/W1990005915","https://openalex.org/W2090861223","https://openalex.org/W2103869314","https://openalex.org/W2113911479","https://openalex.org/W2126597753","https://openalex.org/W2128653836","https://openalex.org/W2137737117","https://openalex.org/W2143855671","https://openalex.org/W2146083413","https://openalex.org/W2158483598","https://openalex.org/W2163929346","https://openalex.org/W2164162335","https://openalex.org/W2528357689","https://openalex.org/W4232336823","https://openalex.org/W4244606868","https://openalex.org/W6600618273","https://openalex.org/W6607264330","https://openalex.org/W6632590417"],"related_works":["https://openalex.org/W2125652721","https://openalex.org/W1540371141","https://openalex.org/W1549363203","https://openalex.org/W4231274751","https://openalex.org/W2154063878","https://openalex.org/W2556012038","https://openalex.org/W1489772951","https://openalex.org/W1518215897","https://openalex.org/W2033914206","https://openalex.org/W2042327336"],"abstract_inverted_index":{"In":[0,52],"this":[1,37,85,133],"paper,":[2],"we":[3,57],"present":[4],"a":[5],"noise":[6,42],"robustness":[7],"algorithm":[8],"called":[9],"small":[10,66,79,103,117],"power":[11,25,61,80,86,104,118],"boosting":[12,105,119],"(SPB).":[13],"We":[14,113],"observe":[15,114],"that":[16,115,132],"in":[17,55],"the":[18,41,44,60,70,88,92],"spectral":[19,89],"domain,":[20],"time-frequency":[21,63,76],"bins":[22,64,77],"with":[23,65,78],"smaller":[24],"are":[26],"more":[27],"affected":[28],"by":[29,147],"additive":[30],"noise.":[31],"The":[32],"conventional":[33],"way":[34],"of":[35,62,102],"handling":[36],"problem":[38],"is":[39,106,120,136],"estimating":[40],"from":[43],"test":[45,96],"utterance":[46],"and":[47,72,94],"doing":[48],"normalization":[49],"or":[50],"subtraction.":[51],"our":[53],"work,":[54],"contrast,":[56],"intentionally":[58],"boost":[59],"energy":[67],"for":[68,139],"both":[69],"training":[71],"testing":[73],"datasets.":[74],"Since":[75],"no":[81],"longer":[82],"exist":[83],"after":[84],"boosting,":[87],"distortion":[90],"between":[91],"clean":[93],"corrupt":[95],"sets":[97],"becomes":[98,125],"reduced.":[99],"This":[100],"type":[101],"also":[107],"highly":[108,126],"related":[109],"to":[110],"physiological":[111],"nonlinearity.":[112],"when":[116],"done,":[121],"suitable":[122],"weighting":[123],"smoothing":[124],"important.":[127],"Our":[128],"experimental":[129],"results":[130],"indicate":[131],"simple":[134],"idea":[135],"very":[137,140],"helpful":[138],"difficult":[141],"noisy":[142],"environments":[143],"such":[144],"as":[145],"corruption":[146],"background":[148],"music.":[149]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":3},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2013,"cited_by_count":3},{"year":2012,"cited_by_count":2}],"updated_date":"2026-04-28T14:05:53.105641","created_date":"2025-10-10T00:00:00"}
