{"id":"https://openalex.org/W2120838354","doi":"https://doi.org/10.1109/icassp.2011.5946377","title":"Integrating binaural cues and blind source separation method for separating reverberant speech mixtures","display_name":"Integrating binaural cues and blind source separation method for separating reverberant speech mixtures","publication_year":2011,"publication_date":"2011-05-01","ids":{"openalex":"https://openalex.org/W2120838354","doi":"https://doi.org/10.1109/icassp.2011.5946377","mag":"2120838354"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2011.5946377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2011.5946377","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5048056691","display_name":"Atiyeh Alinaghi","orcid":null},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Atiyeh Alinaghi","raw_affiliation_strings":["Centre of Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford, UK","Centre for Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford GU2 7XH, UK"],"affiliations":[{"raw_affiliation_string":"Centre of Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford, UK","institution_ids":["https://openalex.org/I28290843"]},{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford GU2 7XH, UK","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100676721","display_name":"Wenwu Wang","orcid":"https://orcid.org/0000-0002-8393-5703"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Wenwu Wang","raw_affiliation_strings":["Centre of Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford, UK","Centre for Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford GU2 7XH, UK"],"affiliations":[{"raw_affiliation_string":"Centre of Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford, UK","institution_ids":["https://openalex.org/I28290843"]},{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford GU2 7XH, UK","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5022165330","display_name":"Philip J. B. Jackson","orcid":"https://orcid.org/0000-0001-7933-5935"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Philip JB Jackson","raw_affiliation_strings":["Centre of Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford, UK","Centre for Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford GU2 7XH, UK"],"affiliations":[{"raw_affiliation_string":"Centre of Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford, UK","institution_ids":["https://openalex.org/I28290843"]},{"raw_affiliation_string":"Centre for Vision, Speech and Signal Processing (CVSSP), Department of Electronic Engineering (FEPS), University of Surrey, Guildford GU2 7XH, UK","institution_ids":["https://openalex.org/I28290843"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5048056691"],"corresponding_institution_ids":["https://openalex.org/I28290843"],"apc_list":null,"apc_paid":null,"fwci":4.0554,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.94697118,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"209","last_page":"212"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/binaural-recording","display_name":"Binaural recording","score":0.7394380569458008},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6536839008331299},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5978759527206421},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.5963078141212463},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.5529873967170715},{"id":"https://openalex.org/keywords/reverberation","display_name":"Reverberation","score":0.5121455192565918},{"id":"https://openalex.org/keywords/blind-signal-separation","display_name":"Blind signal separation","score":0.5073177218437195},{"id":"https://openalex.org/keywords/mixing","display_name":"Mixing (physics)","score":0.46678316593170166},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.4267657399177551},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.35220158100128174},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3259273171424866},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.303657203912735},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.2958974838256836},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2842068672180176},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.08005961775779724}],"concepts":[{"id":"https://openalex.org/C201247586","wikidata":"https://www.wikidata.org/wiki/Q5612967","display_name":"Binaural recording","level":2,"score":0.7394380569458008},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6536839008331299},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5978759527206421},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.5963078141212463},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.5529873967170715},{"id":"https://openalex.org/C95851461","wikidata":"https://www.wikidata.org/wiki/Q468809","display_name":"Reverberation","level":2,"score":0.5121455192565918},{"id":"https://openalex.org/C120317606","wikidata":"https://www.wikidata.org/wiki/Q17105967","display_name":"Blind signal separation","level":3,"score":0.5073177218437195},{"id":"https://openalex.org/C138777275","wikidata":"https://www.wikidata.org/wiki/Q6884054","display_name":"Mixing (physics)","level":2,"score":0.46678316593170166},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.4267657399177551},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.35220158100128174},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3259273171424866},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.303657203912735},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.2958974838256836},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2842068672180176},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.08005961775779724},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":5,"locations":[{"id":"doi:10.1109/icassp.2011.5946377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2011.5946377","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2011 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:alma.44SUR_INST:11138809670002346","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4210197018","display_name":"View","issn_l":"2688-268X","issn":["2688-268X","2688-3988"],"is_oa":false,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310320595","host_organization_name":"Wiley","host_organization_lineage":["https://openalex.org/P4310320595"],"host_organization_lineage_names":["Wiley"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"","raw_type":""},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.688.4774","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.688.4774","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://epubs.surrey.ac.uk/7722/2/AlinaghiWangJackson_ICASSP11.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.705.7577","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.705.7577","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://personal.ee.surrey.ac.uk/Personal/W.Wang/papers/AlinaghiWJ_ICASSP_2011.pdf","raw_type":"text"},{"id":"pmh:oai:epubs.surrey.ac.uk:7722","is_oa":false,"landing_page_url":"http://epubs.surrey.ac.uk/7722/2/AlinaghiWangJackson_ICASSP11.pdf","pdf_url":null,"source":{"id":"https://openalex.org/S4306400680","display_name":"Surrey Research Insight Open Access (The University of Surrey)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I28290843","host_organization_name":"University of Surrey","host_organization_lineage":["https://openalex.org/I28290843"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"Article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.41999998688697815,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W160190058","https://openalex.org/W2020946001","https://openalex.org/W2088399049","https://openalex.org/W2096855653","https://openalex.org/W2104257868","https://openalex.org/W2123649031","https://openalex.org/W2127851351","https://openalex.org/W2129171989","https://openalex.org/W2166458192","https://openalex.org/W2561557072","https://openalex.org/W4233392025"],"related_works":["https://openalex.org/W1982169876","https://openalex.org/W3094316140","https://openalex.org/W3133205200","https://openalex.org/W4289363934","https://openalex.org/W2898145319","https://openalex.org/W2098101267","https://openalex.org/W1509813908","https://openalex.org/W2898606530","https://openalex.org/W2059119686","https://openalex.org/W4289362680"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,125],"new":[4],"method":[5,96],"for":[6,22,57,112],"reverberant":[7],"speech":[8,33,147],"separation,":[9],"based":[10],"on":[11,146],"the":[12,23,27,32,71,83,90,99,103,109,128,138,162],"combination":[13],"of":[14,26,31,102,153],"binaural":[15,121,163],"cues":[16,122],"and":[17,48,60,69,82,123,136,149],"blind":[18],"source":[19,59],"separation":[20],"(BSS)":[21],"automatic":[24],"classification":[25],"time-frequency":[28],"(T-F)":[29],"units":[30,72],"mixture":[34,55],"spectrogram.":[35],"The":[36,79,94,116],"main":[37],"idea":[38],"is":[39,132],"to":[40,76,134],"model":[41,64,80,141],"interaural":[42,45],"phase":[43],"difference,":[44],"level":[46],"difference":[47],"frequency":[49,104,114],"bin-wise":[50],"mixing":[51,110,139],"vectors":[52,111],"by":[53,107],"Gaussian":[54],"models":[56],"each":[58,66,113],"then":[61],"evaluate":[62],"that":[63,77],"at":[65],"T-F":[67],"point":[68],"assign":[70],"with":[73,120],"high":[74],"probability":[75],"source.":[78],"parameters":[81],"assigned":[84],"regions":[85],"are":[86],"refined":[87],"iteratively":[88],"using":[89],"Expectation-Maximization":[91],"(EM)":[92],"algorithm.":[93],"proposed":[95],"also":[97],"addresses":[98],"permutation":[100],"problem":[101],"domain":[105],"BSS":[106],"initializing":[108],"channel.":[115],"EM":[117],"algorithm":[118],"starts":[119],"after":[124],"few":[126],"iterations":[127],"estimated":[129],"probabilistic":[130],"mask":[131],"used":[133],"initialize":[135],"re-estimate":[137],"vector":[140],"parameters.":[142],"We":[143],"performed":[144],"experiments":[145],"mixtures,":[148],"showed":[150],"an":[151],"average":[152],"about":[154],"0.8":[155],"dB":[156],"improvement":[157],"in":[158],"signal-to-distortion":[159],"(SDR)":[160],"over":[161],"only":[164],"baseline.":[165]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":2},{"year":2017,"cited_by_count":2},{"year":2015,"cited_by_count":3},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":9},{"year":2012,"cited_by_count":1}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
