{"id":"https://openalex.org/W2122982914","doi":"https://doi.org/10.1109/tasl.2008.2010633","title":"A Supervised Learning Approach to Monaural Segregation of Reverberant Speech","display_name":"A Supervised Learning Approach to Monaural Segregation of Reverberant Speech","publication_year":2009,"publication_date":"2009-03-19","ids":{"openalex":"https://openalex.org/W2122982914","doi":"https://doi.org/10.1109/tasl.2008.2010633","mag":"2122982914"},"language":"en","primary_location":{"id":"doi:10.1109/tasl.2008.2010633","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2008.2010633","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5025797022","display_name":"Zhaozhang Jin","orcid":null},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zhaozhang Jin","raw_affiliation_strings":["Department of Computer Science and Engineering, Ohio State Uinversity, Columbus, OH, USA","Department of Computer Science and Engineering Ohio State University, Columbus OH"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Ohio State Uinversity, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]},{"raw_affiliation_string":"Department of Computer Science and Engineering Ohio State University, Columbus OH","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5051837453","display_name":"DeLiang Wang","orcid":"https://orcid.org/0000-0001-8195-6319"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"DeLiang Wang","raw_affiliation_strings":["Department of Computer Science and Engineering and the Center of Cognitive Science, Ohio State Uinversity, Columbus, OH, USA","Department of Computer Science and Engineering Ohio State University, Columbus OH"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering and the Center of Cognitive Science, Ohio State Uinversity, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]},{"raw_affiliation_string":"Department of Computer Science and Engineering Ohio State University, Columbus OH","institution_ids":["https://openalex.org/I52357470"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5025797022"],"corresponding_institution_ids":["https://openalex.org/I52357470"],"apc_list":null,"apc_paid":null,"fwci":8.8116,"has_fulltext":false,"cited_by_count":102,"citation_normalized_percentile":{"value":0.98416994,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":"17","issue":"4","first_page":"625","last_page":"638"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.946420431137085},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7698525190353394},{"id":"https://openalex.org/keywords/reverberation","display_name":"Reverberation","score":0.7546373605728149},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.712031364440918},{"id":"https://openalex.org/keywords/segmentation","display_name":"Segmentation","score":0.5185702443122864},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.46934378147125244},{"id":"https://openalex.org/keywords/speech-processing","display_name":"Speech processing","score":0.4527164399623871},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4375793933868408},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4082378149032593},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3749954104423523},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.2151464819908142},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.08294400572776794}],"concepts":[{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.946420431137085},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7698525190353394},{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.7546373605728149},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.712031364440918},{"id":"https://openalex.org/C89600930","wikidata":"https://www.wikidata.org/wiki/Q1423946","display_name":"Segmentation","level":2,"score":0.5185702443122864},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.46934378147125244},{"id":"https://openalex.org/C61328038","wikidata":"https://www.wikidata.org/wiki/Q3358061","display_name":"Speech processing","level":2,"score":0.4527164399623871},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4375793933868408},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4082378149032593},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3749954104423523},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.2151464819908142},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.08294400572776794},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tasl.2008.2010633","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2008.2010633","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320338279","display_name":"Air Force Office of Scientific Research","ror":"https://ror.org/011e9bt93"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W10765870","https://openalex.org/W116580109","https://openalex.org/W160800111","https://openalex.org/W1500551892","https://openalex.org/W1554663460","https://openalex.org/W1575829986","https://openalex.org/W1808196926","https://openalex.org/W1825077972","https://openalex.org/W1973045472","https://openalex.org/W1979099822","https://openalex.org/W1980501707","https://openalex.org/W1986515506","https://openalex.org/W1989320958","https://openalex.org/W1995536493","https://openalex.org/W2013312573","https://openalex.org/W2025127228","https://openalex.org/W2025719707","https://openalex.org/W2027804983","https://openalex.org/W2042577118","https://openalex.org/W2042750879","https://openalex.org/W2044222806","https://openalex.org/W2048967079","https://openalex.org/W2057662515","https://openalex.org/W2057889776","https://openalex.org/W2078210373","https://openalex.org/W2096554907","https://openalex.org/W2096779346","https://openalex.org/W2097191389","https://openalex.org/W2103453322","https://openalex.org/W2106525014","https://openalex.org/W2110322414","https://openalex.org/W2111070087","https://openalex.org/W2113131123","https://openalex.org/W2116879786","https://openalex.org/W2117428648","https://openalex.org/W2117678320","https://openalex.org/W2121973264","https://openalex.org/W2123157731","https://openalex.org/W2128334000","https://openalex.org/W2128653836","https://openalex.org/W2137617983","https://openalex.org/W2139393465","https://openalex.org/W2141253686","https://openalex.org/W2149425615","https://openalex.org/W2150924398","https://openalex.org/W2168793898","https://openalex.org/W2401269416","https://openalex.org/W2466833302","https://openalex.org/W2489547515","https://openalex.org/W2550493152","https://openalex.org/W2561557072","https://openalex.org/W2970850616","https://openalex.org/W2981666567","https://openalex.org/W3030884845","https://openalex.org/W3127686677","https://openalex.org/W3147539069","https://openalex.org/W3216401400","https://openalex.org/W4230946174","https://openalex.org/W4254118426","https://openalex.org/W4256399001","https://openalex.org/W4285719527","https://openalex.org/W4301624450","https://openalex.org/W4388297464","https://openalex.org/W6638450331","https://openalex.org/W6675378234","https://openalex.org/W6680690805","https://openalex.org/W6680919041","https://openalex.org/W6684458083","https://openalex.org/W6712692946","https://openalex.org/W6719743294"],"related_works":["https://openalex.org/W2621851636","https://openalex.org/W2401567014","https://openalex.org/W2981428355","https://openalex.org/W1834994814","https://openalex.org/W2041273198","https://openalex.org/W1599055764","https://openalex.org/W2131711534","https://openalex.org/W2149163000","https://openalex.org/W2962858469","https://openalex.org/W2289873871"],"abstract_inverted_index":{"A":[0,126],"major":[1],"source":[2],"of":[3,34,59,70,82,109],"signal":[4],"degradation":[5],"in":[6,15],"real":[7],"environments":[8,17],"is":[9,18,41,131],"room":[10,47],"reverberation.":[11],"Monaural":[12],"speech":[13,36],"segregation":[14,58],"reverberant":[16,35,60,138,157],"a":[19,52,68,75,83,95],"particularly":[20],"challenging":[21],"problem.":[22],"Although":[23],"inverse":[24],"filtering":[25],"has":[26],"been":[27],"proposed":[28],"to":[29,43,56,65,74,106,133,162],"partially":[30],"restore":[31],"the":[32,79,100,107],"harmonicity":[33],"before":[37],"segregation,":[38],"this":[39,117],"approach":[40,55,150],"sensitive":[42],"specific":[44],"source/receiver":[45],"and":[46,128,140,159,165],"configurations.":[48],"This":[49],"paper":[50],"proposes":[51],"supervised":[53],"learning":[54,101],"monaural":[57],"voiced":[61],"speech,":[62],"which":[63,103],"learns":[64],"map":[66],"from":[67],"set":[69],"pitch-based":[71],"auditory":[72],"features":[73],"grouping":[76,129],"cue":[77],"encoding":[78],"posterior":[80],"probability":[81],"time-frequency":[84],"(T-F)":[85],"unit":[86,124],"being":[87],"target":[88],"dominant":[89],"given":[90],"observed":[91],"features.":[92],"We":[93],"devise":[94],"novel":[96],"objective":[97,118],"function":[98,119],"for":[99],"process,":[102],"directly":[104],"relates":[105],"goal":[108],"maximizing":[110],"signal-to-noise":[111],"ratio.":[112],"The":[113],"models":[114],"trained":[115],"using":[116],"yield":[120],"significantly":[121],"better":[122],"T-F":[123],"labeling.":[125],"segmentation":[127],"framework":[130],"utilized":[132],"form":[134],"reliable":[135],"segments":[136],"under":[137,155],"conditions":[139,158],"organize":[141],"them":[142],"into":[143],"streams.":[144],"Systematic":[145],"evaluations":[146],"show":[147],"that":[148],"our":[149],"produces":[151],"very":[152],"promising":[153],"results":[154],"various":[156],"generalizes":[160],"well":[161],"new":[163,166],"utterances":[164],"speakers.":[167]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":3},{"year":2020,"cited_by_count":8},{"year":2019,"cited_by_count":10},{"year":2018,"cited_by_count":15},{"year":2017,"cited_by_count":8},{"year":2016,"cited_by_count":6},{"year":2015,"cited_by_count":9},{"year":2014,"cited_by_count":8},{"year":2013,"cited_by_count":5},{"year":2012,"cited_by_count":12}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
