{"id":"https://openalex.org/W3162564204","doi":"https://doi.org/10.1109/icassp39728.2021.9414884","title":"SepNet: A Deep Separation Matrix Prediction Network for Multichannel Audio Source Separation","display_name":"SepNet: A Deep Separation Matrix Prediction Network for Multichannel Audio Source Separation","publication_year":2021,"publication_date":"2021-05-13","ids":{"openalex":"https://openalex.org/W3162564204","doi":"https://doi.org/10.1109/icassp39728.2021.9414884","mag":"3162564204"},"language":"en","primary_location":{"id":"doi:10.1109/icassp39728.2021.9414884","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp39728.2021.9414884","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5051093194","display_name":"Shota Inoue","orcid":"https://orcid.org/0000-0002-8754-0397"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Shota Inoue","raw_affiliation_strings":["University of Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"University of Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001243214","display_name":"Hirokazu Kameoka","orcid":"https://orcid.org/0000-0003-3102-0162"},"institutions":[{"id":"https://openalex.org/I2251713219","display_name":"NTT (Japan)","ror":"https://ror.org/00berct97","country_code":"JP","type":"company","lineage":["https://openalex.org/I2251713219"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hirokazu Kameoka","raw_affiliation_strings":["NTT Communication Science Laboratories, NTT Corporation, Japan"],"affiliations":[{"raw_affiliation_string":"NTT Communication Science Laboratories, NTT Corporation, Japan","institution_ids":["https://openalex.org/I2251713219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100361128","display_name":"Li Li","orcid":"https://orcid.org/0000-0002-2587-843X"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Li Li","raw_affiliation_strings":["University of Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"University of Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5075702573","display_name":"Shoji Makino","orcid":"https://orcid.org/0000-0003-1934-640X"},"institutions":[{"id":"https://openalex.org/I146399215","display_name":"University of Tsukuba","ror":"https://ror.org/02956yf07","country_code":"JP","type":"education","lineage":["https://openalex.org/I146399215"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Shoji Makino","raw_affiliation_strings":["University of Tsukuba, Japan"],"affiliations":[{"raw_affiliation_string":"University of Tsukuba, Japan","institution_ids":["https://openalex.org/I146399215"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5051093194"],"corresponding_institution_ids":["https://openalex.org/I146399215"],"apc_list":null,"apc_paid":null,"fwci":0.6094,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.65591616,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"14","issue":null,"first_page":"191","last_page":"195"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7106292843818665},{"id":"https://openalex.org/keywords/blind-signal-separation","display_name":"Blind signal separation","score":0.6508129835128784},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.5565598607063293},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5257509350776672},{"id":"https://openalex.org/keywords/matrix","display_name":"Matrix (chemical analysis)","score":0.5127602219581604},{"id":"https://openalex.org/keywords/independent-component-analysis","display_name":"Independent component analysis","score":0.5104809999465942},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.4956105947494507},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.42165088653564453},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.332422137260437},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.13892099261283875}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7106292843818665},{"id":"https://openalex.org/C120317606","wikidata":"https://www.wikidata.org/wiki/Q17105967","display_name":"Blind signal separation","level":3,"score":0.6508129835128784},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.5565598607063293},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5257509350776672},{"id":"https://openalex.org/C106487976","wikidata":"https://www.wikidata.org/wiki/Q685816","display_name":"Matrix (chemical analysis)","level":2,"score":0.5127602219581604},{"id":"https://openalex.org/C51432778","wikidata":"https://www.wikidata.org/wiki/Q1259145","display_name":"Independent component analysis","level":2,"score":0.5104809999465942},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.4956105947494507},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.42165088653564453},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.332422137260437},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.13892099261283875},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp39728.2021.9414884","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp39728.2021.9414884","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2021 - 2021 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":37,"referenced_works":["https://openalex.org/W95152782","https://openalex.org/W1512388774","https://openalex.org/W1543386260","https://openalex.org/W1831449718","https://openalex.org/W1845880232","https://openalex.org/W1887941968","https://openalex.org/W2072548008","https://openalex.org/W2113990625","https://openalex.org/W2117678320","https://openalex.org/W2123649031","https://openalex.org/W2127851351","https://openalex.org/W2139302694","https://openalex.org/W2168273590","https://openalex.org/W2408744528","https://openalex.org/W2412956798","https://openalex.org/W2460742184","https://openalex.org/W2567070169","https://openalex.org/W2792498316","https://openalex.org/W2886577208","https://openalex.org/W2901552243","https://openalex.org/W2905196628","https://openalex.org/W2922004249","https://openalex.org/W2936446744","https://openalex.org/W2963035245","https://openalex.org/W2963375116","https://openalex.org/W2963969588","https://openalex.org/W2963970792","https://openalex.org/W3015678657","https://openalex.org/W4297801963","https://openalex.org/W6603838645","https://openalex.org/W6632571750","https://openalex.org/W6638670064","https://openalex.org/W6638690007","https://openalex.org/W6678799340","https://openalex.org/W6713966589","https://openalex.org/W6731370813","https://openalex.org/W6754172774"],"related_works":["https://openalex.org/W2390344110","https://openalex.org/W2364896863","https://openalex.org/W2046761971","https://openalex.org/W2107364365","https://openalex.org/W2118307209","https://openalex.org/W1785857632","https://openalex.org/W4281722104","https://openalex.org/W2187523794","https://openalex.org/W2553224454","https://openalex.org/W1503525627"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,145,190,209],"propose":[4,146,192],"SepNet,":[5],"a":[6,112,130,148,154,162,169,194,205],"deep":[7],"neural":[8],"network":[9,213],"(DNN)":[10],"designed":[11,64,138],"to":[12,22,65,71,152,175,183,199,231],"predict":[13],"separation":[14,25,54,68,99,164,233,239],"matrices":[15,55,234],"from":[16],"multichannel":[17,170],"observations.":[18],"One":[19],"well-known":[20],"approach":[21],"blind":[23],"source":[24,188],"(BSS)":[26],"involves":[27],"independent":[28,37],"component":[29],"analysis":[30,40],"(ICA).":[31],"A":[32],"recently":[33],"developed":[34],"method":[35],"called":[36],"low-rank":[38],"matrix":[39,69,165],"(ILRMA)":[41],"is":[42,63,90],"one":[43,119,177],"of":[44,53,97,111,120,124,178,186,245],"its":[45],"powerful":[46],"variants.":[47],"These":[48],"methods":[49],"allow":[50],"the":[51,67,78,121,125,179,187,201,212,216],"estimation":[52],"based":[56,76],"on":[57,77],"deterministic":[58,113],"iterative":[59,114],"algorithms.":[60],"Specifically,":[61],"ILRMA":[62,82,242],"update":[66,73],"according":[70],"an":[72,158],"rule":[74],"derived":[75],"majorization-minimization":[79],"principle.":[80],"Although":[81],"performs":[83],"reasonably":[84],"well":[85],"under":[86],"some":[87],"conditions,":[88],"there":[89],"still":[91],"room":[92],"for":[93,105,243],"improvement":[94],"in":[95,166],"terms":[96],"both":[98],"accuracy":[100,240],"and":[101,139,236],"computation":[102],"time,":[103],"especially":[104],"large-scale":[106],"microphone":[107],"arrays.":[108],"The":[109,223],"existence":[110],"algorithm":[115],"that":[116,129,135,150,215,227],"can":[117,132,210,219],"find":[118,176,232],"stationary":[122],"points":[123],"BSS":[126],"problem":[127],"implies":[128],"DNN":[131,149],"also":[133],"play":[134],"role":[136],"if":[137],"trained":[140],"properly.":[141],"Motivated":[142],"by":[143],"this,":[144],"introducing":[147],"learns":[151],"convert":[153],"predefined":[155],"input":[156],"(e.g.,":[157],"identity":[159],"matrix)":[160],"into":[161],"true":[163],"accordance":[167],"with":[168,237],"observation.":[171],"To":[172],"enable":[173],"it":[174],"multiple":[180],"solutions":[181],"corresponding":[182],"different":[184],"permutations":[185],"indices,":[189],"further":[191],"adopting":[193],"permutation":[195],"invariant":[196],"training":[197],"strategy":[198],"train":[200],"network.":[202],"By":[203],"using":[204],"fully":[206],"convolutional":[207],"architecture,":[208],"design":[211],"so":[214],"forward":[217],"propagation":[218],"be":[220],"computed":[221],"efficiently.":[222],"experimental":[224],"results":[225],"revealed":[226],"SepNet":[228],"was":[229],"able":[230],"faster":[235],"better":[238],"than":[241],"mixtures":[244],"two":[246],"sources.":[247]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
