{"id":"https://openalex.org/W4295781833","doi":"https://doi.org/10.1007/s00034-022-02166-5","title":"High-Resolution Representation Learning and Recurrent Neural Network for Singing Voice Separation","display_name":"High-Resolution Representation Learning and Recurrent Neural Network for Singing Voice Separation","publication_year":2022,"publication_date":"2022-09-14","ids":{"openalex":"https://openalex.org/W4295781833","doi":"https://doi.org/10.1007/s00034-022-02166-5"},"language":"en","primary_location":{"id":"doi:10.1007/s00034-022-02166-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00034-022-02166-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00034-022-02166-5.pdf","source":{"id":"https://openalex.org/S20109229","display_name":"Circuits Systems and Signal Processing","issn_l":"0278-081X","issn":["0278-081X","1531-5878"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320186","host_organization_name":"Birkh\u00e4user","host_organization_lineage":["https://openalex.org/P4310320186","https://openalex.org/P4310319900"],"host_organization_lineage_names":["Birkh\u00e4user","Springer Science+Business Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Circuits, Systems, and Signal Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s00034-022-02166-5.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030180662","display_name":"Bhuwan Bhattarai","orcid":"https://orcid.org/0000-0001-7014-4868"},"institutions":[{"id":"https://openalex.org/I80611190","display_name":"Jeonbuk National University","ror":"https://ror.org/05q92br09","country_code":"KR","type":"education","lineage":["https://openalex.org/I80611190"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Bhuwan Bhattarai","raw_affiliation_strings":["Department of Computer Science and Engineering, Jeonbuk National University, Jeonju, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Jeonbuk National University, Jeonju, South Korea","institution_ids":["https://openalex.org/I80611190"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064192572","display_name":"Yagya Raj Pandeya","orcid":"https://orcid.org/0000-0002-9842-8704"},"institutions":[{"id":"https://openalex.org/I47881588","display_name":"Kathmandu University","ror":"https://ror.org/036xnae80","country_code":"NP","type":"education","lineage":["https://openalex.org/I47881588"]},{"id":"https://openalex.org/I5268612","display_name":"Nepal Academy of Science and Technology","ror":"https://ror.org/00863x694","country_code":"NP","type":"education","lineage":["https://openalex.org/I5268612"]}],"countries":["NP"],"is_corresponding":false,"raw_author_name":"Yagya Raj Pandeya","raw_affiliation_strings":["Deep AI Nepal under Guru Technology, Kathmandu, Nepal","Department of Computer Science and Engineering, Kathmandu University, Dhulikhel, Nepal"],"affiliations":[{"raw_affiliation_string":"Deep AI Nepal under Guru Technology, Kathmandu, Nepal","institution_ids":["https://openalex.org/I5268612"]},{"raw_affiliation_string":"Department of Computer Science and Engineering, Kathmandu University, Dhulikhel, Nepal","institution_ids":["https://openalex.org/I47881588"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107118691","display_name":"You Jie","orcid":null},"institutions":[{"id":"https://openalex.org/I80611190","display_name":"Jeonbuk National University","ror":"https://ror.org/05q92br09","country_code":"KR","type":"education","lineage":["https://openalex.org/I80611190"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"You Jie","raw_affiliation_strings":["Department of Computer Science and Engineering, Jeonbuk National University, Jeonju, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Jeonbuk National University, Jeonju, South Korea","institution_ids":["https://openalex.org/I80611190"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026374972","display_name":"Arjun Kumar Lamichhane","orcid":null},"institutions":[{"id":"https://openalex.org/I155028946","display_name":"Tribhuvan University","ror":"https://ror.org/02rg1r889","country_code":"NP","type":"education","lineage":["https://openalex.org/I155028946"]}],"countries":["NP"],"is_corresponding":false,"raw_author_name":"Arjun Kumar Lamichhane","raw_affiliation_strings":["Central Department of Computer Science and Information Technology, Tribhuvan University, Kirtipur, Nepal"],"affiliations":[{"raw_affiliation_string":"Central Department of Computer Science and Information Technology, Tribhuvan University, Kirtipur, Nepal","institution_ids":["https://openalex.org/I155028946"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044837622","display_name":"Joonwhoan Lee","orcid":"https://orcid.org/0000-0003-1854-9643"},"institutions":[{"id":"https://openalex.org/I80611190","display_name":"Jeonbuk National University","ror":"https://ror.org/05q92br09","country_code":"KR","type":"education","lineage":["https://openalex.org/I80611190"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Joonwhoan Lee","raw_affiliation_strings":["Department of Computer Science and Engineering, Jeonbuk National University, Jeonju, South Korea"],"affiliations":[{"raw_affiliation_string":"Department of Computer Science and Engineering, Jeonbuk National University, Jeonju, South Korea","institution_ids":["https://openalex.org/I80611190"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5030180662"],"corresponding_institution_ids":["https://openalex.org/I80611190"],"apc_list":null,"apc_paid":null,"fwci":1.34,"has_fulltext":true,"cited_by_count":9,"citation_normalized_percentile":{"value":0.79944963,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":98},"biblio":{"volume":"42","issue":"2","first_page":"1083","last_page":"1104"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.8877370357513428},{"id":"https://openalex.org/keywords/singing","display_name":"Singing","score":0.7720140814781189},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7381103038787842},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5934284329414368},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5868324637413025},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.5835542678833008},{"id":"https://openalex.org/keywords/recurrent-neural-network","display_name":"Recurrent neural network","score":0.5319718718528748},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.5311065316200256},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5064889192581177},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4973492920398712},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4830658733844757},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.46511486172676086},{"id":"https://openalex.org/keywords/separation","display_name":"Separation (statistics)","score":0.458721399307251},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.44782012701034546},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.20871204137802124},{"id":"https://openalex.org/keywords/acoustics","display_name":"Acoustics","score":0.1170651912689209}],"concepts":[{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.8877370357513428},{"id":"https://openalex.org/C44819458","wikidata":"https://www.wikidata.org/wiki/Q27939","display_name":"Singing","level":2,"score":0.7720140814781189},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7381103038787842},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5934284329414368},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5868324637413025},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.5835542678833008},{"id":"https://openalex.org/C147168706","wikidata":"https://www.wikidata.org/wiki/Q1457734","display_name":"Recurrent neural network","level":3,"score":0.5319718718528748},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.5311065316200256},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5064889192581177},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4973492920398712},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4830658733844757},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.46511486172676086},{"id":"https://openalex.org/C2776061190","wikidata":"https://www.wikidata.org/wiki/Q7451805","display_name":"Separation (statistics)","level":2,"score":0.458721399307251},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.44782012701034546},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.20871204137802124},{"id":"https://openalex.org/C24890656","wikidata":"https://www.wikidata.org/wiki/Q82811","display_name":"Acoustics","level":1,"score":0.1170651912689209},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1007/s00034-022-02166-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00034-022-02166-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00034-022-02166-5.pdf","source":{"id":"https://openalex.org/S20109229","display_name":"Circuits Systems and Signal Processing","issn_l":"0278-081X","issn":["0278-081X","1531-5878"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320186","host_organization_name":"Birkh\u00e4user","host_organization_lineage":["https://openalex.org/P4310320186","https://openalex.org/P4310319900"],"host_organization_lineage_names":["Birkh\u00e4user","Springer Science+Business Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Circuits, Systems, and Signal Processing","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1007/s00034-022-02166-5","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s00034-022-02166-5","pdf_url":"https://link.springer.com/content/pdf/10.1007/s00034-022-02166-5.pdf","source":{"id":"https://openalex.org/S20109229","display_name":"Circuits Systems and Signal Processing","issn_l":"0278-081X","issn":["0278-081X","1531-5878"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320186","host_organization_name":"Birkh\u00e4user","host_organization_lineage":["https://openalex.org/P4310320186","https://openalex.org/P4310319900"],"host_organization_lineage_names":["Birkh\u00e4user","Springer Science+Business Media"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Circuits, Systems, and Signal Processing","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.4399999976158142}],"awards":[{"id":"https://openalex.org/G1225283220","display_name":null,"funder_award_id":"NRF-2021R","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G3071639259","display_name":null,"funder_award_id":"2021R1","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G7112868416","display_name":null,"funder_award_id":"NRF-2021R1A2C2006895","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G982292920","display_name":null,"funder_award_id":"NRF-20","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"}],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"},{"id":"https://openalex.org/F4320328992","display_name":"Jeonbuk National University","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4295781833.pdf","grobid_xml":"https://content.openalex.org/works/W4295781833.grobid-xml"},"referenced_works_count":43,"referenced_works":["https://openalex.org/W1554094125","https://openalex.org/W1555814299","https://openalex.org/W1594771616","https://openalex.org/W1964531215","https://openalex.org/W1973693401","https://openalex.org/W2022668263","https://openalex.org/W2029878753","https://openalex.org/W2046869671","https://openalex.org/W2059793040","https://openalex.org/W2099904336","https://openalex.org/W2108089013","https://openalex.org/W2123649031","https://openalex.org/W2124539664","https://openalex.org/W2127851351","https://openalex.org/W2151186643","https://openalex.org/W2164336224","https://openalex.org/W2364134690","https://openalex.org/W2408744528","https://openalex.org/W2516392987","https://openalex.org/W2536529409","https://openalex.org/W2552058035","https://openalex.org/W2563534197","https://openalex.org/W2605138598","https://openalex.org/W2669032454","https://openalex.org/W2916583660","https://openalex.org/W2949650786","https://openalex.org/W2962935966","https://openalex.org/W2963103134","https://openalex.org/W2963519193","https://openalex.org/W2963750251","https://openalex.org/W2963751183","https://openalex.org/W3010461307","https://openalex.org/W3014641072","https://openalex.org/W3101923269","https://openalex.org/W3198780369","https://openalex.org/W3211333361","https://openalex.org/W4235128394","https://openalex.org/W4297797352","https://openalex.org/W4297817572","https://openalex.org/W4302765731","https://openalex.org/W6600045627","https://openalex.org/W6600135713","https://openalex.org/W6600168311"],"related_works":["https://openalex.org/W3094316140","https://openalex.org/W3133205200","https://openalex.org/W2898145319","https://openalex.org/W4289363934","https://openalex.org/W2898606530","https://openalex.org/W2098101267","https://openalex.org/W2059119686","https://openalex.org/W4289362680","https://openalex.org/W2403380333","https://openalex.org/W2761596192"],"abstract_inverted_index":{"Abstract":[0],"Music":[1],"source":[2],"separation":[3,51,149],"has":[4],"traditionally":[5],"followed":[6],"the":[7,35,40,74,78,140,151,162,169,176],"encoder-decoder":[8],"paradigm":[9],"(e.g.,":[10],"hourglass,":[11],"U-Net,":[12],"DeconvNet,":[13],"SegNet)":[14],"to":[15,67,101,112,158,185],"isolate":[16],"individual":[17],"music":[18,107],"components":[19,173],"from":[20],"mixtures.":[21],"Such":[22],"networks,":[23],"however,":[24],"result":[25],"in":[26],"a":[27,53,61],"loss":[28],"of":[29,77,86],"location-sensitivity,":[30],"as":[31,90],"low-resolution":[32],"representation":[33,55],"drops":[34],"useful":[36],"harmonic":[37],"patterns":[38],"over":[39],"temporal":[41,75],"dimension.":[42],"We":[43,81],"overcame":[44],"this":[45,83,97],"problem":[46],"by":[47,96,115],"performing":[48],"singing":[49,134,147],"voice":[50,148,170],"using":[52,123],"high-resolution":[54,69],"learning":[56],"(HRNet)":[57],"system":[58,98],"coupled":[59],"with":[60],"long":[62],"short-term":[63],"memory":[64],"(LSTM)":[65],"module":[66],"retain":[68],"feature":[70],"map":[71],"and":[72,88,104,131,167,171,178,187,194],"capture":[73],"behavior":[76],"acoustic":[79],"signal.":[80],"called":[82],"joint":[84],"combination":[85],"HRNet":[87],"LSTM":[89],"HR-LSTM.":[91],"The":[92,118],"predicted":[93],"spectrograms":[94],"produced":[95],"are":[99,181],"close":[100],"ground":[102],"truth":[103],"successfully":[105],"separate":[106],"sources,":[108],"achieving":[109],"results":[110],"superior":[111],"those":[113],"realized":[114],"past":[116],"methods.":[117],"proposed":[119,141],"network":[120],"was":[121],"tested":[122],"four":[124],"datasets":[125,180],"(DSD100,":[126],"MIR-1K,":[127],"Korean":[128],"Pansori":[129,177],",":[130],"Nepal":[132,197],"Idol":[133,198],"voice).":[135],"Our":[136],"experiments":[137],"confirmed":[138],"that":[139],"HR-LSTM":[142],"outperforms":[143],"state-of-the-art":[144],"networks":[145],"at":[146],"when":[150,161,175],"DSD100":[152],"dataset":[153,164],"is":[154,165],"used,":[155,166],"performs":[156],"comparably":[157],"alternative":[159],"methods":[160],"MIR-1K":[163],"separates":[168],"accompaniment":[172],"well":[174],"NISVS":[179],"used.":[182],"In":[183],"addition":[184],"proposing":[186],"validating":[188],"our":[189,196],"network,":[190],"we":[191],"also":[192],"developed":[193],"shared":[195],"dataset.":[199]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
