{"id":"https://openalex.org/W2605138598","doi":"https://doi.org/10.1109/globalsip.2017.8309164","title":"Single channel audio source separation using convolutional denoising autoencoders","display_name":"Single channel audio source separation using convolutional denoising autoencoders","publication_year":2017,"publication_date":"2017-11-01","ids":{"openalex":"https://openalex.org/W2605138598","doi":"https://doi.org/10.1109/globalsip.2017.8309164","mag":"2605138598"},"language":"en","primary_location":{"id":"doi:10.1109/globalsip.2017.8309164","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globalsip.2017.8309164","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Global Conference on Signal and Information Processing (GlobalSIP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013467271","display_name":"Emad M. Grais","orcid":"https://orcid.org/0000-0002-6387-0981"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Emad M. Grais","raw_affiliation_strings":["Speech and Signal Processing, University of Surrey, Guildford, UK"],"affiliations":[{"raw_affiliation_string":"Speech and Signal Processing, University of Surrey, Guildford, UK","institution_ids":["https://openalex.org/I28290843"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066967599","display_name":"Mark D. Plumbley","orcid":"https://orcid.org/0000-0002-9708-1075"},"institutions":[{"id":"https://openalex.org/I28290843","display_name":"University of Surrey","ror":"https://ror.org/00ks66431","country_code":"GB","type":"education","lineage":["https://openalex.org/I28290843"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Mark D. Plumbley","raw_affiliation_strings":["Speech and Signal Processing, University of Surrey, Guildford, UK"],"affiliations":[{"raw_affiliation_string":"Speech and Signal Processing, University of Surrey, Guildford, UK","institution_ids":["https://openalex.org/I28290843"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5013467271"],"corresponding_institution_ids":["https://openalex.org/I28290843"],"apc_list":null,"apc_paid":null,"fwci":9.2462,"has_fulltext":false,"cited_by_count":105,"citation_normalized_percentile":{"value":0.98564824,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":91,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1265","last_page":"1269"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.8737082481384277},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8063902854919434},{"id":"https://openalex.org/keywords/monaural","display_name":"Monaural","score":0.7316379547119141},{"id":"https://openalex.org/keywords/noise-reduction","display_name":"Noise reduction","score":0.6915854215621948},{"id":"https://openalex.org/keywords/convolutional-neural-network","display_name":"Convolutional neural network","score":0.6015812158584595},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.596174418926239},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.5746882557868958},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.5319348573684692},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5007162094116211},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.498732328414917},{"id":"https://openalex.org/keywords/blind-signal-separation","display_name":"Blind signal separation","score":0.48724380135536194},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.39541298151016235},{"id":"https://openalex.org/keywords/telecommunications","display_name":"Telecommunications","score":0.05870059132575989}],"concepts":[{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.8737082481384277},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8063902854919434},{"id":"https://openalex.org/C102894143","wikidata":"https://www.wikidata.org/wiki/Q1323979","display_name":"Monaural","level":2,"score":0.7316379547119141},{"id":"https://openalex.org/C163294075","wikidata":"https://www.wikidata.org/wiki/Q581861","display_name":"Noise reduction","level":2,"score":0.6915854215621948},{"id":"https://openalex.org/C81363708","wikidata":"https://www.wikidata.org/wiki/Q17084460","display_name":"Convolutional neural network","level":2,"score":0.6015812158584595},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.596174418926239},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.5746882557868958},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.5319348573684692},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5007162094116211},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.498732328414917},{"id":"https://openalex.org/C120317606","wikidata":"https://www.wikidata.org/wiki/Q17105967","display_name":"Blind signal separation","level":3,"score":0.48724380135536194},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.39541298151016235},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.05870059132575989},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/globalsip.2017.8309164","is_oa":false,"landing_page_url":"https://doi.org/10.1109/globalsip.2017.8309164","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE Global Conference on Signal and Information Processing (GlobalSIP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6513227722","display_name":null,"funder_award_id":"EP/L027119/2","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G740539323","display_name":null,"funder_award_id":"EP/L027119/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W104184427","https://openalex.org/W1523493493","https://openalex.org/W1564690189","https://openalex.org/W1604717235","https://openalex.org/W1606347560","https://openalex.org/W2025768430","https://openalex.org/W2042419400","https://openalex.org/W2045402776","https://openalex.org/W2049113157","https://openalex.org/W2099904336","https://openalex.org/W2100495367","https://openalex.org/W2107789863","https://openalex.org/W2127851351","https://openalex.org/W2136655611","https://openalex.org/W2145094598","https://openalex.org/W2146337213","https://openalex.org/W2292405593","https://openalex.org/W2321627895","https://openalex.org/W2398306137","https://openalex.org/W2405258286","https://openalex.org/W2408744528","https://openalex.org/W2410860376","https://openalex.org/W2508884455","https://openalex.org/W2509006290","https://openalex.org/W2515753980","https://openalex.org/W2516342150","https://openalex.org/W2519994964","https://openalex.org/W2552400013","https://openalex.org/W2587994092","https://openalex.org/W2592944988","https://openalex.org/W2669032454","https://openalex.org/W2917831833","https://openalex.org/W2963451564","https://openalex.org/W2963453742","https://openalex.org/W2997574889","https://openalex.org/W3098670224","https://openalex.org/W3099271704","https://openalex.org/W6604254268","https://openalex.org/W6633740391","https://openalex.org/W6636358008","https://openalex.org/W6676071220","https://openalex.org/W6681096077","https://openalex.org/W6681686951","https://openalex.org/W6696765674","https://openalex.org/W6712656540","https://openalex.org/W6713676406"],"related_works":["https://openalex.org/W4312417841","https://openalex.org/W4321369474","https://openalex.org/W2731899572","https://openalex.org/W3133861977","https://openalex.org/W4200173597","https://openalex.org/W3116150086","https://openalex.org/W2999805992","https://openalex.org/W2952367144","https://openalex.org/W4300806340","https://openalex.org/W2605138598"],"abstract_inverted_index":{"Deep":[0],"learning":[1],"techniques":[2],"have":[3],"been":[4],"used":[5],"recently":[6],"to":[7,19,42,53,69,73,80],"tackle":[8],"the":[9,38,46,59,96],"audio":[10,29],"source":[11,30,56,91],"separation":[12,92],"problem.":[13],"In":[14],"this":[15],"work,":[16],"we":[17],"propose":[18],"use":[20,33],"deep":[21,97],"fully":[22],"convolutional":[23],"denoising":[24],"autoencoders":[25],"(CDAEs)":[26],"for":[27],"monaural":[28],"separation.":[31],"We":[32],"as":[34,37,62],"many":[35],"CDAEs":[36,89],"number":[39],"of":[40],"sources":[41,61],"be":[43],"separated":[44],"from":[45],"mixed":[47],"signal.":[48],"Each":[49],"CDAE":[50,72],"is":[51,68],"trained":[52],"separate":[54],"one":[55],"and":[57,78],"treats":[58],"other":[60],"background":[63],"noise.":[64],"The":[65],"main":[66],"idea":[67],"allow":[70],"each":[71],"learn":[74],"suitable":[75],"spectral-temporal":[76],"filters":[77],"features":[79],"its":[81],"corresponding":[82],"source.":[83],"Our":[84],"experimental":[85],"results":[86],"show":[87],"that":[88],"perform":[90],"slightly":[93],"better":[94],"than":[95,106],"feedforward":[98],"neural":[99],"networks":[100],"(FNNs)":[101],"even":[102],"with":[103],"fewer":[104],"parameters":[105],"FNNs.":[107]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":10},{"year":2023,"cited_by_count":16},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":19},{"year":2020,"cited_by_count":17},{"year":2019,"cited_by_count":16},{"year":2018,"cited_by_count":14},{"year":2017,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
