{"id":"https://openalex.org/W4416251260","doi":"https://doi.org/10.1109/waspaa66052.2025.11230927","title":"IS <sup>3</sup> : Generic Impulsive\u2013Stationary Sound Separation in Acoustic Scenes using Deep Filtering","display_name":"IS <sup>3</sup> : Generic Impulsive\u2013Stationary Sound Separation in Acoustic Scenes using Deep Filtering","publication_year":2025,"publication_date":"2025-10-12","ids":{"openalex":"https://openalex.org/W4416251260","doi":"https://doi.org/10.1109/waspaa66052.2025.11230927"},"language":null,"primary_location":{"id":"doi:10.1109/waspaa66052.2025.11230927","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa66052.2025.11230927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Cl\u00e9mentine Berger","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145102","display_name":"Institut Polytechnique de Paris","ror":"https://ror.org/042tfbd02","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":true,"raw_author_name":"Cl\u00e9mentine Berger","raw_affiliation_strings":["Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France"],"affiliations":[{"raw_affiliation_string":"Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France","institution_ids":["https://openalex.org/I4210165912","https://openalex.org/I4210145102"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107526624","display_name":"Paraskevas Stamatiadis","orcid":null},"institutions":[{"id":"https://openalex.org/I4210145102","display_name":"Institut Polytechnique de Paris","ror":"https://ror.org/042tfbd02","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Paraskevas Stamatiadis","raw_affiliation_strings":["Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France"],"affiliations":[{"raw_affiliation_string":"Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France","institution_ids":["https://openalex.org/I4210165912","https://openalex.org/I4210145102"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028865449","display_name":"Roland Badeau","orcid":"https://orcid.org/0000-0002-9630-6877"},"institutions":[{"id":"https://openalex.org/I4210145102","display_name":"Institut Polytechnique de Paris","ror":"https://ror.org/042tfbd02","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Roland Badeau","raw_affiliation_strings":["Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France"],"affiliations":[{"raw_affiliation_string":"Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France","institution_ids":["https://openalex.org/I4210165912","https://openalex.org/I4210145102"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060031161","display_name":"Slim Essid","orcid":"https://orcid.org/0000-0002-0028-327X"},"institutions":[{"id":"https://openalex.org/I4210145102","display_name":"Institut Polytechnique de Paris","ror":"https://ror.org/042tfbd02","country_code":"FR","type":"education","lineage":["https://openalex.org/I4210145102"]},{"id":"https://openalex.org/I4210165912","display_name":"Laboratoire Traitement et Communication de l\u2019Information","ror":"https://ror.org/057er4c39","country_code":"FR","type":"facility","lineage":["https://openalex.org/I12356871","https://openalex.org/I205703379","https://openalex.org/I4210145102","https://openalex.org/I4210165912"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Slim Essid","raw_affiliation_strings":["Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France"],"affiliations":[{"raw_affiliation_string":"Institut Polytechnique de Paris,LTCI, T&#x00E9;l&#x00E9;com Paris,France","institution_ids":["https://openalex.org/I4210165912","https://openalex.org/I4210145102"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210145102","https://openalex.org/I4210165912"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.41516966,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.5992000102996826,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.5992000102996826,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.11699999868869781,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.07519999891519547,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.5221999883651733},{"id":"https://openalex.org/keywords/signal-processing","display_name":"Signal processing","score":0.45260000228881836},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.44749999046325684},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4399000108242035},{"id":"https://openalex.org/keywords/audio-signal-processing","display_name":"Audio signal processing","score":0.43689998984336853},{"id":"https://openalex.org/keywords/deep-neural-networks","display_name":"Deep neural networks","score":0.42750000953674316},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.40709999203681946},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.4047999978065491},{"id":"https://openalex.org/keywords/adaptive-filter","display_name":"Adaptive filter","score":0.40380001068115234},{"id":"https://openalex.org/keywords/attenuation","display_name":"Attenuation","score":0.39149999618530273}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7139000296592712},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.5221999883651733},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5216000080108643},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5083000063896179},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.45260000228881836},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.44749999046325684},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4399000108242035},{"id":"https://openalex.org/C127220857","wikidata":"https://www.wikidata.org/wiki/Q2719318","display_name":"Audio signal processing","level":4,"score":0.43689998984336853},{"id":"https://openalex.org/C2984842247","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep neural networks","level":3,"score":0.42750000953674316},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.40709999203681946},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.4047999978065491},{"id":"https://openalex.org/C102248274","wikidata":"https://www.wikidata.org/wiki/Q168388","display_name":"Adaptive filter","level":2,"score":0.40380001068115234},{"id":"https://openalex.org/C184652730","wikidata":"https://www.wikidata.org/wiki/Q2357982","display_name":"Attenuation","level":2,"score":0.39149999618530273},{"id":"https://openalex.org/C100675267","wikidata":"https://www.wikidata.org/wiki/Q1371624","display_name":"Background noise","level":2,"score":0.3880999982357025},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.37860000133514404},{"id":"https://openalex.org/C47432892","wikidata":"https://www.wikidata.org/wiki/Q831390","display_name":"Wavelet","level":2,"score":0.3573000133037567},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.34360000491142273},{"id":"https://openalex.org/C30684385","wikidata":"https://www.wikidata.org/wiki/Q176509","display_name":"Ringing","level":3,"score":0.3271999955177307},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.32710000872612},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3197000026702881},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.31349998712539673},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.313400000333786},{"id":"https://openalex.org/C29265498","wikidata":"https://www.wikidata.org/wiki/Q7047719","display_name":"Noise measurement","level":3,"score":0.29179999232292175},{"id":"https://openalex.org/C64922751","wikidata":"https://www.wikidata.org/wiki/Q4650799","display_name":"Audio signal","level":3,"score":0.29100000858306885},{"id":"https://openalex.org/C196216189","wikidata":"https://www.wikidata.org/wiki/Q2867","display_name":"Wavelet transform","level":3,"score":0.2881999909877777},{"id":"https://openalex.org/C76198728","wikidata":"https://www.wikidata.org/wiki/Q3629144","display_name":"Acoustic attenuation","level":3,"score":0.2842000126838684},{"id":"https://openalex.org/C73208851","wikidata":"https://www.wikidata.org/wiki/Q5157303","display_name":"Computational auditory scene analysis","level":2,"score":0.28290000557899475},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.25679999589920044},{"id":"https://openalex.org/C34951282","wikidata":"https://www.wikidata.org/wiki/Q864191","display_name":"Bioacoustics","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C38129911","wikidata":"https://www.wikidata.org/wiki/Q4820038","display_name":"Auditory scene analysis","level":3,"score":0.2549999952316284},{"id":"https://openalex.org/C142433447","wikidata":"https://www.wikidata.org/wiki/Q7806653","display_name":"Time\u2013frequency analysis","level":3,"score":0.25189998745918274}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/waspaa66052.2025.11230927","is_oa":false,"landing_page_url":"https://doi.org/10.1109/waspaa66052.2025.11230927","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE Workshop on Applications of Signal Processing to Audio and Acoustics (WASPAA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320307804","display_name":"BP","ror":"https://ror.org/051659894"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W1571508021","https://openalex.org/W1976985008","https://openalex.org/W2022532970","https://openalex.org/W2052666245","https://openalex.org/W2095147901","https://openalex.org/W2124320125","https://openalex.org/W2129229049","https://openalex.org/W2133409090","https://openalex.org/W2136757062","https://openalex.org/W2144498192","https://openalex.org/W2191779130","https://openalex.org/W2621033351","https://openalex.org/W2920829070","https://openalex.org/W2952218014","https://openalex.org/W2961183107","https://openalex.org/W2964058413","https://openalex.org/W2974407961","https://openalex.org/W3015287975","https://openalex.org/W3095717210","https://openalex.org/W3162348042","https://openalex.org/W3175803234","https://openalex.org/W3205770165","https://openalex.org/W4225299287","https://openalex.org/W4281877746","https://openalex.org/W4293363567","https://openalex.org/W4312097006","https://openalex.org/W4312570973","https://openalex.org/W4381249885"],"related_works":[],"abstract_inverted_index":{"We":[0,136],"are":[1],"interested":[2],"in":[3,46,61,158],"audio":[4,52],"systems":[5,43,54],"capable":[6],"of":[7,12],"performing":[8],"a":[9,83,101,109,122,139,144],"differentiated":[10],"processing":[11,27,174],"stationary":[13,98],"backgrounds":[14],"and":[15,129,149,153,176],"isolated":[16],"acoustic":[17,21,69,94],"events":[18,95],"within":[19],"an":[20],"scene,":[22],"whether":[23],"for":[24,33,87,112,133],"applying":[25],"specific":[26],"methods":[28],"to":[29],"each":[30],"part":[31],"or":[32,57,66,72],"focusing":[34],"solely":[35],"on":[36,143,179],"one":[37],"while":[38],"ignoring":[39],"the":[40,97,113,164],"other.":[41],"Such":[42],"have":[44],"applications":[45],"real-world":[47],"scenarios,":[48],"including":[49],"robust":[50,68],"adaptive":[51],"rendering":[53],"(e.g.,":[55],"EQ":[56],"compression),":[58],"plosive":[59],"attenuation":[60],"voice":[62],"mixing,":[63],"noise":[64],"suppression":[65],"reduction,":[67],"event":[70],"classification":[71],"even":[73],"bioacoustics.":[74],"To":[75,116],"this":[76,134,159],"end,":[77],"we":[78,120],"introduce":[79],"IS<sup":[80],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[81],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">3</sup>,":[82],"neural":[84,147],"network":[85],"designed":[86],"Impulsive\u2013Stationary":[88],"Sound":[89,166],"Separation,":[90],"that":[91,105,127,138],"isolates":[92],"impulsive":[93],"from":[96,171],"background":[99],"using":[100],"deep":[102],"filtering":[103,178],"approach,":[104,141],"can":[106],"act":[107],"as":[108],"pre-processing":[110],"stage":[111],"above-mentioned":[114],"tasks.":[115],"ensure":[117],"optimal":[118],"training,":[119],"propose":[121],"sophisticated":[123],"data":[124],"generation":[125],"pipeline":[126],"curates":[128],"adapts":[130],"existing":[131],"datasets":[132],"task.":[135],"demonstrate":[137],"learning-based":[140],"build":[142],"relatively":[145],"lightweight":[146],"architecture":[148],"trained":[150],"with":[151],"well-designed":[152],"varied":[154],"data,":[155],"is":[156],"successful":[157],"previously":[160],"unaddressed":[161],"task,":[162],"outperforming":[163],"Harmonic\u2013Percussive":[165],"Separation":[167],"masking":[168],"method,":[169],"adapted":[170],"music":[172],"signal":[173],"research,":[175],"wavelet":[177],"objective":[180],"separation":[181],"metrics.":[182]},"counts_by_year":[],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-11-14T00:00:00"}
