{"id":"https://openalex.org/W2961034873","doi":"https://doi.org/10.1145/3309772.3309780","title":"Separating musical sources with convolutional sparse coding","display_name":"Separating musical sources with convolutional sparse coding","publication_year":2019,"publication_date":"2019-01-07","ids":{"openalex":"https://openalex.org/W2961034873","doi":"https://doi.org/10.1145/3309772.3309780","mag":"2961034873"},"language":"en","primary_location":{"id":"doi:10.1145/3309772.3309780","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3309772.3309780","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Conference on Applications of Intelligent Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011246176","display_name":"Mohit L. Dubey","orcid":"https://orcid.org/0000-0002-8575-8827"},"institutions":[{"id":"https://openalex.org/I70571728","display_name":"Oberlin College","ror":"https://ror.org/05ac26z88","country_code":"US","type":"education","lineage":["https://openalex.org/I70571728"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mohit Dubey","raw_affiliation_strings":["Oberlin College and Conservatory, Oberlin, Ohio"],"affiliations":[{"raw_affiliation_string":"Oberlin College and Conservatory, Oberlin, Ohio","institution_ids":["https://openalex.org/I70571728"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076756533","display_name":"Haydn Jones","orcid":null},"institutions":[{"id":"https://openalex.org/I207123951","display_name":"New Mexico Institute of Mining and Technology","ror":"https://ror.org/005p9kw61","country_code":"US","type":"education","lineage":["https://openalex.org/I207123951"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haydn Jones","raw_affiliation_strings":["New Mexico Institute of Mining and Technology, Socorro, New Mexico"],"affiliations":[{"raw_affiliation_string":"New Mexico Institute of Mining and Technology, Socorro, New Mexico","institution_ids":["https://openalex.org/I207123951"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023392501","display_name":"Austin Thresher","orcid":null},"institutions":[{"id":"https://openalex.org/I4210110743","display_name":"New Mexico Consortium","ror":"https://ror.org/01qnpp968","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210110743"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Austin Thresher","raw_affiliation_strings":["New Mexico Consortium, Los Alamos, New Mexico"],"affiliations":[{"raw_affiliation_string":"New Mexico Consortium, Los Alamos, New Mexico","institution_ids":["https://openalex.org/I4210110743"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086534835","display_name":"Garrett T. Kenyon","orcid":"https://orcid.org/0000-0003-4836-3938"},"institutions":[{"id":"https://openalex.org/I1343871089","display_name":"Los Alamos National Laboratory","ror":"https://ror.org/01e41cf67","country_code":"US","type":"facility","lineage":["https://openalex.org/I1330989302","https://openalex.org/I1343871089","https://openalex.org/I198811213","https://openalex.org/I4210120050"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Garrett Kenyon","raw_affiliation_strings":["Los Alamos National Laboratory, Los Alamos, New Mexico"],"affiliations":[{"raw_affiliation_string":"Los Alamos National Laboratory, Los Alamos, New Mexico","institution_ids":["https://openalex.org/I1343871089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5011246176"],"corresponding_institution_ids":["https://openalex.org/I70571728"],"apc_list":null,"apc_paid":null,"fwci":0.1659,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.43347244,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":93},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11447","display_name":"Blind Source Separation Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10283","display_name":"Hearing Loss and Rehabilitation","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2805","display_name":"Cognitive Neuroscience"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.7660016417503357},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6647069454193115},{"id":"https://openalex.org/keywords/neural-coding","display_name":"Neural coding","score":0.5769940614700317},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.561489999294281},{"id":"https://openalex.org/keywords/fourier-transform","display_name":"Fourier transform","score":0.53608238697052},{"id":"https://openalex.org/keywords/waveform","display_name":"Waveform","score":0.5031866431236267},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.4875578284263611},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4628564119338989},{"id":"https://openalex.org/keywords/auditory-cortex","display_name":"Auditory cortex","score":0.43922722339630127},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3963885009288788},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3517867624759674},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1894983947277069},{"id":"https://openalex.org/keywords/neuroscience","display_name":"Neuroscience","score":0.10744971036911011},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.10675749182701111},{"id":"https://openalex.org/keywords/radar","display_name":"Radar","score":0.07647603750228882}],"concepts":[{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.7660016417503357},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6647069454193115},{"id":"https://openalex.org/C77637269","wikidata":"https://www.wikidata.org/wiki/Q7002051","display_name":"Neural coding","level":2,"score":0.5769940614700317},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.561489999294281},{"id":"https://openalex.org/C102519508","wikidata":"https://www.wikidata.org/wiki/Q6520159","display_name":"Fourier transform","level":2,"score":0.53608238697052},{"id":"https://openalex.org/C197424946","wikidata":"https://www.wikidata.org/wiki/Q1165717","display_name":"Waveform","level":3,"score":0.5031866431236267},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.4875578284263611},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4628564119338989},{"id":"https://openalex.org/C2780297895","wikidata":"https://www.wikidata.org/wiki/Q18676","display_name":"Auditory cortex","level":2,"score":0.43922722339630127},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3963885009288788},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3517867624759674},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1894983947277069},{"id":"https://openalex.org/C169760540","wikidata":"https://www.wikidata.org/wiki/Q207011","display_name":"Neuroscience","level":1,"score":0.10744971036911011},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.10675749182701111},{"id":"https://openalex.org/C554190296","wikidata":"https://www.wikidata.org/wiki/Q47528","display_name":"Radar","level":2,"score":0.07647603750228882},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3309772.3309780","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3309772.3309780","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2nd International Conference on Applications of Intelligent Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.4300000071525574}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W635496727","https://openalex.org/W1790748249","https://openalex.org/W1838323663","https://openalex.org/W1965192788","https://openalex.org/W1972168487","https://openalex.org/W2060085436","https://openalex.org/W2070857950","https://openalex.org/W2093290760","https://openalex.org/W2100543212","https://openalex.org/W2108089013","https://openalex.org/W2124134481","https://openalex.org/W2127851351","https://openalex.org/W2145889472","https://openalex.org/W2151116952","https://openalex.org/W2154805298","https://openalex.org/W2164098335","https://openalex.org/W2344054597","https://openalex.org/W2398350456","https://openalex.org/W2515071189","https://openalex.org/W2641889749","https://openalex.org/W2766926913","https://openalex.org/W3124794156"],"related_works":["https://openalex.org/W3094316140","https://openalex.org/W3133205200","https://openalex.org/W2898145319","https://openalex.org/W4289363934","https://openalex.org/W2098101267","https://openalex.org/W2059119686","https://openalex.org/W2898606530","https://openalex.org/W4289362680","https://openalex.org/W2403380333","https://openalex.org/W2761596192"],"abstract_inverted_index":{"The":[0],"solution":[1],"to":[2,28,41,78,102],"the":[3,21,79,103,115],"problem":[4],"of":[5,52,58,82,105,117],"separating":[6,42],"multiple":[7],"vocal":[8],"and":[9,46,55,74],"instrumental":[10],"tracks":[11],"from":[12,49,67,90],"a":[13,38],"single":[14],"audio":[15],"waveform":[16],"is":[17,108],"solved":[18],"naturally":[19],"by":[20],"human":[22,83],"auditory":[23,84],"cortex":[24],"but":[25],"has":[26],"yet":[27],"be":[29],"effectively":[30],"implemented":[31],"computationally.":[32],"In":[33],"this":[34],"paper,":[35],"we":[36],"demonstrate":[37],"neurally-inspired":[39],"approach":[40],"bass,":[43],"drums,":[44],"vocals":[45],"other":[47],"instruments":[48],"sparse":[50,63],"encodings":[51,64],"phase-rich":[53],"Fourier":[54,99],"Constant-Q":[56,93],"representations":[57,94],"stereo":[59],"musical":[60],"data.":[61],"Our":[62],"are":[65,71],"generated":[66],"learned":[68],"features":[69],"that":[70,88,107,112],"both":[72],"spectrally":[73],"temporally":[75],"convolutional,":[76],"similar":[77],"hemispheric":[80],"lateralization":[81],"cortex.":[85],"We":[86],"find":[87],"learning":[89],"neurally":[91],"inspired":[92],"provides":[95],"better":[96],"separation":[97],"over":[98],"spectrograms":[100],"due":[101],"presence":[104],"structure":[106],"convolutional":[109],"in":[110,114],"log-frequency":[111],"aids":[113],"differentiation":[116],"instruments.":[118]},"counts_by_year":[{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
