{"id":"https://openalex.org/W4408355341","doi":"https://doi.org/10.1109/icassp49660.2025.10888962","title":"Smr-Awarenet: An Adaptive Smr-Aware Neural Network for EEG Auditory Attention Guided Target Speech Extraction","display_name":"Smr-Awarenet: An Adaptive Smr-Aware Neural Network for EEG Auditory Attention Guided Target Speech Extraction","publication_year":2025,"publication_date":"2025-03-12","ids":{"openalex":"https://openalex.org/W4408355341","doi":"https://doi.org/10.1109/icassp49660.2025.10888962"},"language":"en","primary_location":{"id":"doi:10.1109/icassp49660.2025.10888962","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10888962","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100696136","display_name":"Xuefei Wang","orcid":"https://orcid.org/0000-0002-5343-3788"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Xuefei Wang","raw_affiliation_strings":["Southern University of Science and Technology,Department of Electronic and Electrical Engineering,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology,Department of Electronic and Electrical Engineering,Shenzhen,China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005473933","display_name":"Yuting Ding","orcid":"https://orcid.org/0000-0001-5007-9288"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuting Ding","raw_affiliation_strings":["Southern University of Science and Technology,Department of Electronic and Electrical Engineering,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology,Department of Electronic and Electrical Engineering,Shenzhen,China","institution_ids":["https://openalex.org/I3045169105"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100436158","display_name":"Lei Wang","orcid":"https://orcid.org/0000-0003-4415-1268"},"institutions":[{"id":"https://openalex.org/I37987034","display_name":"Guangzhou University","ror":"https://ror.org/05ar8rn06","country_code":"CN","type":"education","lineage":["https://openalex.org/I37987034"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lei Wang","raw_affiliation_strings":["Guangzhou University,School of Electronics and Communication Engineering,Guangzhou,China"],"affiliations":[{"raw_affiliation_string":"Guangzhou University,School of Electronics and Communication Engineering,Guangzhou,China","institution_ids":["https://openalex.org/I37987034"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100405410","display_name":"Fei Chen","orcid":"https://orcid.org/0000-0002-6988-492X"},"institutions":[{"id":"https://openalex.org/I3045169105","display_name":"Southern University of Science and Technology","ror":"https://ror.org/049tv2d57","country_code":"CN","type":"education","lineage":["https://openalex.org/I3045169105"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Chen","raw_affiliation_strings":["Southern University of Science and Technology,Department of Electronic and Electrical Engineering,Shenzhen,China"],"affiliations":[{"raw_affiliation_string":"Southern University of Science and Technology,Department of Electronic and Electrical Engineering,Shenzhen,China","institution_ids":["https://openalex.org/I3045169105"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100696136"],"corresponding_institution_ids":["https://openalex.org/I3045169105"],"apc_list":null,"apc_paid":null,"fwci":3.8348,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.92224611,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9480000138282776,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9480000138282776,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9104999899864197,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/electroencephalography","display_name":"Electroencephalography","score":0.6878136992454529},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6845257878303528},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6542946100234985},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.6389521360397339},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.35084351897239685},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.1614765226840973},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.10994109511375427}],"concepts":[{"id":"https://openalex.org/C522805319","wikidata":"https://www.wikidata.org/wiki/Q179965","display_name":"Electroencephalography","level":2,"score":0.6878136992454529},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6845257878303528},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6542946100234985},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.6389521360397339},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35084351897239685},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.1614765226840973},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.10994109511375427}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp49660.2025.10888962","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp49660.2025.10888962","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2025 - 2025 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320337504","display_name":"Research and Development","ror":"https://ror.org/027s68j25"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W1852582171","https://openalex.org/W2000842688","https://openalex.org/W2089468765","https://openalex.org/W2106244103","https://openalex.org/W2128495200","https://openalex.org/W2144561273","https://openalex.org/W2160813409","https://openalex.org/W2172139273","https://openalex.org/W2345067732","https://openalex.org/W2939880928","https://openalex.org/W2952218014","https://openalex.org/W3003432884","https://openalex.org/W3015921042","https://openalex.org/W3126966983","https://openalex.org/W3159148248","https://openalex.org/W3168997536","https://openalex.org/W3191474079","https://openalex.org/W4312096632","https://openalex.org/W4405265913","https://openalex.org/W6633786245","https://openalex.org/W6852177738"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2922348724","https://openalex.org/W200322357","https://openalex.org/W2390279801","https://openalex.org/W2130428257","https://openalex.org/W4391913857","https://openalex.org/W4308951944","https://openalex.org/W2358668433"],"abstract_inverted_index":{"Target":[0],"speech":[1,8,21,27,40,52,104],"extraction":[2],"remains":[3,58],"a":[4,67],"significant":[5,114],"challenge":[6],"in":[7,37,55,116],"separation,":[9],"particularly":[10],"within":[11],"complex":[12,56],"multi-speaker":[13],"environments":[14],"where":[15],"accurate":[16],"isolation":[17],"of":[18,24,45],"the":[19,25,31,43,51,77,82,101,110],"target":[20,83,103],"and":[22,84,121],"suppression":[23],"interfering":[26,85],"are":[28],"crucial.":[29],"Despite":[30],"progress":[32],"driven":[33],"by":[34],"deep":[35],"learning":[36],"neural":[38,69],"network-based":[39],"separation":[41,53],"models,":[42],"integration":[44],"electroencephalography":[46],"(EEG)":[47],"signals":[48],"to":[49,99],"guide":[50,100],"process":[54],"scenes":[57],"an":[59],"open":[60],"problem.":[61],"In":[62],"this":[63],"study,":[64],"we":[65],"propose":[66],"novel":[68],"network":[70],"architecture":[71,75],"called":[72],"SMR-AwareNet.":[73],"This":[74],"utilizes":[76],"Signal-to-Masker":[78],"Ratio":[79,119],"(SMR)":[80],"between":[81],"speech,":[86],"along":[87],"with":[88],"attention":[89,95],"information":[90],"obtained":[91],"through":[92],"EEG":[93],"auditory":[94],"detection":[96],"(AAD)":[97],"module,":[98],"adaptive":[102],"extraction.":[105],"Experimental":[106],"results":[107],"show":[108],"that":[109],"SMR-AwareNet":[111],"model":[112],"achieves":[113],"improvements":[115],"Scale-Invariant":[117],"Signal-to-Noise":[118],"(SISNR)":[120],"consistently":[122],"outperforms":[123],"baseline":[124],"models":[125],"under":[126],"various":[127],"challenging":[128],"conditions.":[129]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-23T09:07:50.710637","created_date":"2025-10-10T00:00:00"}
