{"id":"https://openalex.org/W2399556727","doi":"https://doi.org/10.1109/icassp.2016.7471723","title":"Shifted and convolutive source-filter non-negative matrix factorization for monaural audio source separation","display_name":"Shifted and convolutive source-filter non-negative matrix factorization for monaural audio source separation","publication_year":2016,"publication_date":"2016-03-01","ids":{"openalex":"https://openalex.org/W2399556727","doi":"https://doi.org/10.1109/icassp.2016.7471723","mag":"2399556727"},"language":"en","primary_location":{"id":"doi:10.1109/icassp.2016.7471723","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7471723","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102941659","display_name":"Tomohiko Nakamura","orcid":"https://orcid.org/0000-0003-4385-7170"},"institutions":[{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tomohiko Nakamura","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo.,7-3-1, Hongo, Bunkyo-ku, Tokyo, 113-8656, Japan","Graduate School of Information Science and Technology, The University of Tokyo, Bunkyo-ku, Tokyo, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo.,7-3-1, Hongo, Bunkyo-ku, Tokyo, 113-8656, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo, Bunkyo-ku, Tokyo, Japan","institution_ids":["https://openalex.org/I74801974"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001243214","display_name":"Hirokazu Kameoka","orcid":"https://orcid.org/0000-0003-3102-0162"},"institutions":[{"id":"https://openalex.org/I2251713219","display_name":"NTT (Japan)","ror":"https://ror.org/00berct97","country_code":"JP","type":"company","lineage":["https://openalex.org/I2251713219"]},{"id":"https://openalex.org/I74801974","display_name":"The University of Tokyo","ror":"https://ror.org/057zh3y96","country_code":"JP","type":"education","lineage":["https://openalex.org/I74801974"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Hirokazu Kameoka","raw_affiliation_strings":["Graduate School of Information Science and Technology, The University of Tokyo.,7-3-1, Hongo, Bunkyo-ku, Tokyo, 113-8656, Japan","NTT Communication Science Laboratories, Nippon Telegraph and Telephone Corporation, Atsugi, Kanagawa, Japan"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Graduate School of Information Science and Technology, The University of Tokyo.,7-3-1, Hongo, Bunkyo-ku, Tokyo, 113-8656, Japan","institution_ids":["https://openalex.org/I74801974"]},{"raw_affiliation_string":"NTT Communication Science Laboratories, Nippon Telegraph and Telephone Corporation, Atsugi, Kanagawa, Japan","institution_ids":["https://openalex.org/I2251713219"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.5105,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.62949282,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"489","last_page":"493"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11233","display_name":"Advanced Adaptive Filtering Techniques","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/2206","display_name":"Computational Mechanics"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.8051356077194214},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.7458106279373169},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.6978104710578918},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5847818851470947},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5638951659202576},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5239555835723877},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.5020730495452881},{"id":"https://openalex.org/keywords/deconvolution","display_name":"Deconvolution","score":0.47558653354644775},{"id":"https://openalex.org/keywords/blind-signal-separation","display_name":"Blind signal separation","score":0.4300042986869812},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.38454824686050415},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.3740919828414917},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.13879305124282837},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.12101170420646667}],"concepts":[{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.8051356077194214},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.7458106279373169},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.6978104710578918},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5847818851470947},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5638951659202576},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5239555835723877},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.5020730495452881},{"id":"https://openalex.org/C174576160","wikidata":"https://www.wikidata.org/wiki/Q1183700","display_name":"Deconvolution","level":2,"score":0.47558653354644775},{"id":"https://openalex.org/C120317606","wikidata":"https://www.wikidata.org/wiki/Q17105967","display_name":"Blind signal separation","level":3,"score":0.4300042986869812},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.38454824686050415},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.3740919828414917},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.13879305124282837},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.12101170420646667},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp.2016.7471723","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icassp.2016.7471723","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W178436704","https://openalex.org/W1580974668","https://openalex.org/W1626927927","https://openalex.org/W1987133051","https://openalex.org/W2017578549","https://openalex.org/W2039844283","https://openalex.org/W2080815483","https://openalex.org/W2090963365","https://openalex.org/W2098101267","https://openalex.org/W2102780911","https://openalex.org/W2104298926","https://openalex.org/W2106582496","https://openalex.org/W2113217465","https://openalex.org/W2120340098","https://openalex.org/W2127851351","https://openalex.org/W2139122061","https://openalex.org/W2139318943","https://openalex.org/W2156662892","https://openalex.org/W2157313348","https://openalex.org/W2170989203","https://openalex.org/W2293043088","https://openalex.org/W2293293689","https://openalex.org/W2311880653","https://openalex.org/W2395437797","https://openalex.org/W2397931447","https://openalex.org/W2400942170","https://openalex.org/W3139660364","https://openalex.org/W4256715062","https://openalex.org/W4299512035","https://openalex.org/W6636678576","https://openalex.org/W6697066685"],"related_works":["https://openalex.org/W2123043102","https://openalex.org/W2577807713","https://openalex.org/W2098101267","https://openalex.org/W2037504162","https://openalex.org/W2774154397","https://openalex.org/W2146544734","https://openalex.org/W2921513691","https://openalex.org/W2156699640","https://openalex.org/W2081322759","https://openalex.org/W1979654135"],"abstract_inverted_index":{"This":[0],"paper":[1],"proposes":[2],"an":[3,183],"extension":[4],"of":[5,47,52,64,72,109,119,140,147,154,166,172,182,219,241],"non-negative":[6,191],"matrix":[7,192],"factorization":[8],"(NMF),":[9],"which":[10,38,175],"combines":[11],"the":[12,17,48,70,81,92,107,125,130,138,145,148,151,163,170,173,180,190,198,203,216,220,225,233,242],"shifted":[13,62,117,152,237],"NMF":[14,21,238],"model":[15,196,200,222],"with":[16],"source-filter":[18,82],"model.":[19],"Shifted":[20],"was":[22],"proposed":[23,234],"as":[24,124,144],"a":[25,53,61,65,110,116,120,141,208],"powerful":[26],"approach":[27],"for":[28,76,178,214],"monaural":[29],"source":[30,243],"separation":[31,244],"and":[32,59,128,158,211],"multiple":[33],"fundamental":[34],"frequency":[35],"(F0)":[36],"estimation,":[37],"is":[39,113,176],"particularly":[40],"unique":[41],"in":[42,56,89,239],"that":[43,79,232],"it":[44],"takes":[45],"account":[46],"constant":[49],"inter-harmonic":[50],"spacings":[51],"harmonic":[54,121],"structure":[55,122],"log-frequency":[57],"representations":[58],"uses":[60],"copy":[63,118],"spectrum":[66,108,127,132,156,160],"template":[67,123],"to":[68,105,114,201],"represent":[69,106],"spectra":[71,94,168],"different":[73,111],"F0s.":[74],"However,":[75],"those":[77],"sounds":[78],"follow":[80],"model,":[83],"this":[84],"assumption":[85],"does":[86],"not":[87],"hold":[88],"reality,":[90],"since":[91],"filter":[93,131,159,167,204],"are":[95],"usually":[96],"invariant":[97],"under":[98],"F0":[99,112],"changes.":[100],"A":[101],"more":[102],"reasonable":[103],"way":[104],"use":[115],"excitation":[126,155],"keep":[129],"fixed.":[133],"Thus,":[134,186],"we":[135,187],"can":[136],"describe":[137,202],"spectrogram":[139],"mixture":[142],"signal":[143],"sum":[146],"products":[149],"between":[150],"copies":[153],"templates":[157],"templates.":[161],"Furthermore,":[162],"time":[164],"course":[165],"represents":[169],"dynamics":[171],"timbre,":[174],"important":[177],"characterizing":[179],"feature":[181],"instrument":[184],"sound.":[185],"further":[188],"incorporate":[189],"factor":[193],"deconvolution":[194],"(NMFD)":[195],"into":[197],"above":[199],"spectrogram.":[205],"We":[206],"derive":[207],"computationally":[209],"efficient":[210],"convergence-guaranteed":[212],"algorithm":[213],"estimating":[215],"unknown":[217],"parameters":[218],"constructed":[221],"based":[223],"on":[224],"auxiliary":[226],"function":[227],"approach.":[228],"Experimental":[229],"results":[230],"revealed":[231],"method":[235],"outperformed":[236],"terms":[240],"accuracy.":[245]},"counts_by_year":[{"year":2020,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
