{"id":"https://openalex.org/W4392909836","doi":"https://doi.org/10.1109/icassp48485.2024.10446651","title":"SCNet: Sparse Compression Network for Music Source Separation","display_name":"SCNet: Sparse Compression Network for Music Source Separation","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392909836","doi":"https://doi.org/10.1109/icassp48485.2024.10446651"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10446651","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10446651","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101319297","display_name":"Weinan Tong","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weinan Tong","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","Skywork AI PTE. LTD"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]},{"raw_affiliation_string":"Skywork AI PTE. LTD","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114121757","display_name":"Jiaxu Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiaxu Zhu","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100450139","display_name":"Jun Chen","orcid":"https://orcid.org/0000-0001-7201-1989"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Chen","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083463839","display_name":"Shiyin Kang","orcid":"https://orcid.org/0000-0001-8304-5260"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shiyin Kang","raw_affiliation_strings":["Skywork AI PTE. LTD"],"affiliations":[{"raw_affiliation_string":"Skywork AI PTE. LTD","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100744501","display_name":"Tao Jiang","orcid":"https://orcid.org/0000-0001-9116-2635"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tao Jiang","raw_affiliation_strings":["Skywork AI PTE. LTD"],"affiliations":[{"raw_affiliation_string":"Skywork AI PTE. LTD","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100421770","display_name":"Yang Li","orcid":"https://orcid.org/0000-0003-2845-5739"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang Li","raw_affiliation_strings":["Skywork AI PTE. LTD"],"affiliations":[{"raw_affiliation_string":"Skywork AI PTE. LTD","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100667025","display_name":"Zhiyong Wu","orcid":"https://orcid.org/0000-0002-6527-5502"},"institutions":[{"id":"https://openalex.org/I3131625388","display_name":"University Town of Shenzhen","ror":"https://ror.org/05f5j6225","country_code":"CN","type":"education","lineage":["https://openalex.org/I3131625388"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]},{"id":"https://openalex.org/I4210136793","display_name":"Peng Cheng Laboratory","ror":"https://ror.org/03qdqbt06","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210136793"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiyong Wu","raw_affiliation_strings":["Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","Peng Cheng Lab, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University,Shenzhen International Graduate School,Shenzhen,China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"Shenzhen International Graduate School, Tsinghua University, Shenzhen, China","institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"]},{"raw_affiliation_string":"Peng Cheng Lab, Shenzhen, China","institution_ids":["https://openalex.org/I4210136793"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5102225156","display_name":"Helen Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I177725633","display_name":"Chinese University of Hong Kong","ror":"https://ror.org/00t33hh48","country_code":"CN","type":"education","lineage":["https://openalex.org/I177725633"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Helen Meng","raw_affiliation_strings":["The Chinese University of Hong Kong,Hong Kong SAR,China","The Chinese University of Hong Kong, Hong Kong SAR, China"],"affiliations":[{"raw_affiliation_string":"The Chinese University of Hong Kong,Hong Kong SAR,China","institution_ids":["https://openalex.org/I177725633"]},{"raw_affiliation_string":"The Chinese University of Hong Kong, Hong Kong SAR, China","institution_ids":["https://openalex.org/I177725633"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5101319297"],"corresponding_institution_ids":["https://openalex.org/I3131625388","https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":3.3198,"has_fulltext":false,"cited_by_count":9,"citation_normalized_percentile":{"value":0.9276121,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1276","last_page":"1280"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9933000206947327,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6780432462692261},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.5928701162338257},{"id":"https://openalex.org/keywords/compression","display_name":"Compression (physics)","score":0.5073170065879822},{"id":"https://openalex.org/keywords/data-compression","display_name":"Data compression","score":0.44335585832595825},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.209125816822052},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.16181322932243347},{"id":"https://openalex.org/keywords/materials-science","display_name":"Materials science","score":0.07838630676269531}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6780432462692261},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.5928701162338257},{"id":"https://openalex.org/C180016635","wikidata":"https://www.wikidata.org/wiki/Q2712821","display_name":"Compression (physics)","level":2,"score":0.5073170065879822},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.44335585832595825},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.209125816822052},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16181322932243347},{"id":"https://openalex.org/C192562407","wikidata":"https://www.wikidata.org/wiki/Q228736","display_name":"Materials science","level":0,"score":0.07838630676269531},{"id":"https://openalex.org/C159985019","wikidata":"https://www.wikidata.org/wiki/Q181790","display_name":"Composite material","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10446651","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp48485.2024.10446651","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W398859631","https://openalex.org/W569478347","https://openalex.org/W1522301498","https://openalex.org/W2127851351","https://openalex.org/W2587994092","https://openalex.org/W2669032454","https://openalex.org/W2899663614","https://openalex.org/W2952218014","https://openalex.org/W2963452667","https://openalex.org/W2963992487","https://openalex.org/W2971458685","https://openalex.org/W3001377302","https://openalex.org/W3015199127","https://openalex.org/W3037149862","https://openalex.org/W3090496396","https://openalex.org/W3097777922","https://openalex.org/W3099330747","https://openalex.org/W3213726885","https://openalex.org/W3216004336","https://openalex.org/W4226221107","https://openalex.org/W4286980120","https://openalex.org/W4295312788","https://openalex.org/W4372260250","https://openalex.org/W4372267621","https://openalex.org/W4375928773","https://openalex.org/W4385473570","https://openalex.org/W4386065588","https://openalex.org/W6631190155","https://openalex.org/W6731370813","https://openalex.org/W6751512325","https://openalex.org/W6755977528","https://openalex.org/W6766978945","https://openalex.org/W6767502687","https://openalex.org/W6773772901","https://openalex.org/W6783557883","https://openalex.org/W6801426729","https://openalex.org/W6804608017","https://openalex.org/W6810984764","https://openalex.org/W6844662008","https://openalex.org/W6855434424"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2612632602","https://openalex.org/W2321805087"],"abstract_inverted_index":{"Deep":[0],"learning-based":[1],"methods":[2],"have":[3],"made":[4],"significant":[5],"achievements":[6],"in":[7,23,35],"music":[8,26],"source":[9,27],"separation.":[10,28],"However,":[11],"obtaining":[12],"good":[13],"results":[14,119],"while":[15],"maintaining":[16],"a":[17,55,72,82,126],"low":[18],"model":[19,76,124],"complexity":[20],"remains":[21],"challenging":[22],"super":[24],"wide-band":[25],"Previous":[29],"works":[30],"either":[31],"overlook":[32],"the":[33,40,62,65,93,107,122,136,160],"differences":[34],"subbands":[36,69,87,100],"or":[37],"inadequately":[38],"address":[39],"problem":[41],"of":[42,64,132,155,159],"information":[43,90,94],"loss":[44],"when":[45],"generating":[46],"subband":[47],"features.":[48],"In":[49,104],"this":[50,105],"paper,":[51],"we":[52],"propose":[53],"SCNet,":[54],"novel":[56],"frequency-domain":[57],"network":[58],"to":[59,75,91,128],"explicitly":[60],"split":[61],"spectrogram":[63],"mixture":[66],"into":[67],"several":[68],"and":[70,96],"introduce":[71],"sparsity-based":[73],"encoder":[74],"different":[77],"frequency":[78],"bands.":[79],"We":[80],"use":[81],"higher":[83],"compression":[84],"ratio":[85,130],"on":[86,98,135],"with":[88,101],"less":[89],"improve":[92],"density":[95],"focus":[97],"modeling":[99],"more":[102],"information.":[103],"way,":[106],"separation":[108],"performance":[109],"can":[110],"be":[111],"significantly":[112],"improved":[113],"using":[114,140],"lower":[115],"computational":[116],"consumption.":[117],"Experiment":[118],"show":[120],"that":[121],"proposed":[123],"achieves":[125],"signal":[127],"distortion":[129],"(SDR)":[131],"9.0":[133],"dB":[134],"MUSDB18-HQ":[137],"dataset":[138],"without":[139],"extra":[141],"data,":[142],"which":[143],"outperforms":[144],"state-of-the-art":[145,162],"methods.":[146],"Specifically,":[147],"SCNet\u2019s":[148],"CPU":[149],"inference":[150],"time":[151],"is":[152],"only":[153],"48%":[154],"HT":[156],"Demucs,":[157],"one":[158],"previous":[161],"models.":[163]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":8}],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
