{"id":"https://openalex.org/W2064649926","doi":"https://doi.org/10.1109/tasl.2012.2231072","title":"Single-Channel Speech-Music Separation for Robust ASR With Mixture Models","display_name":"Single-Channel Speech-Music Separation for Robust ASR With Mixture Models","publication_year":2012,"publication_date":"2012-11-30","ids":{"openalex":"https://openalex.org/W2064649926","doi":"https://doi.org/10.1109/tasl.2012.2231072","mag":"2064649926"},"language":"en","primary_location":{"id":"doi:10.1109/tasl.2012.2231072","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2012.2231072","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006515267","display_name":"Cemil Demir","orcid":"https://orcid.org/0000-0002-6365-0196"},"institutions":[{"id":"https://openalex.org/I4405392","display_name":"Bo\u011fazi\u00e7i University","ror":"https://ror.org/03z9tma90","country_code":"TR","type":"education","lineage":["https://openalex.org/I4405392"]},{"id":"https://openalex.org/I198068145","display_name":"Scientific and Technological Research Council of Turkey","ror":"https://ror.org/04w9kkr77","country_code":"TR","type":"government","lineage":["https://openalex.org/I198068145"]}],"countries":["TR"],"is_corresponding":true,"raw_author_name":"C. Demir","raw_affiliation_strings":["Department of Electrical Engineering, Bogazici University, Istanbul, Turkey","Speech & Language Technol. Lab, TUBITAK-BILGEM, Kocaeli, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Bogazici University, Istanbul, Turkey","institution_ids":["https://openalex.org/I4405392"]},{"raw_affiliation_string":"Speech & Language Technol. Lab, TUBITAK-BILGEM, Kocaeli, Turkey","institution_ids":["https://openalex.org/I198068145"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055086464","display_name":"Murat Sara\u00e7lar","orcid":"https://orcid.org/0000-0002-7435-8510"},"institutions":[{"id":"https://openalex.org/I4405392","display_name":"Bo\u011fazi\u00e7i University","ror":"https://ror.org/03z9tma90","country_code":"TR","type":"education","lineage":["https://openalex.org/I4405392"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"M. Saraclar","raw_affiliation_strings":["Department of Electrical Engineering, Bogazici University, Istanbul, Turkey","Dept. of Electr. Eng., Bogazici Univ., Istanbul, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Bogazici University, Istanbul, Turkey","institution_ids":["https://openalex.org/I4405392"]},{"raw_affiliation_string":"Dept. of Electr. Eng., Bogazici Univ., Istanbul, Turkey","institution_ids":["https://openalex.org/I4405392"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5064633247","display_name":"Ali Taylan Cemgil","orcid":"https://orcid.org/0000-0003-4463-8455"},"institutions":[{"id":"https://openalex.org/I4405392","display_name":"Bo\u011fazi\u00e7i University","ror":"https://ror.org/03z9tma90","country_code":"TR","type":"education","lineage":["https://openalex.org/I4405392"]}],"countries":["TR"],"is_corresponding":false,"raw_author_name":"A. T. Cemgil","raw_affiliation_strings":["Department of Electrical Engineering, Bogazici University, Istanbul, Turkey","Dept. of Electr. Eng., Bogazici Univ., Istanbul, Turkey"],"affiliations":[{"raw_affiliation_string":"Department of Electrical Engineering, Bogazici University, Istanbul, Turkey","institution_ids":["https://openalex.org/I4405392"]},{"raw_affiliation_string":"Dept. of Electr. Eng., Bogazici Univ., Istanbul, Turkey","institution_ids":["https://openalex.org/I4405392"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5006515267"],"corresponding_institution_ids":["https://openalex.org/I198068145","https://openalex.org/I4405392"],"apc_list":null,"apc_paid":null,"fwci":1.7139,"has_fulltext":false,"cited_by_count":23,"citation_normalized_percentile":{"value":0.87477501,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"21","issue":"4","first_page":"725","last_page":"736"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6779776811599731},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6627165079116821},{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.6257936954498291},{"id":"https://openalex.org/keywords/spectrogram","display_name":"Spectrogram","score":0.6241055727005005},{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.5988589525222778},{"id":"https://openalex.org/keywords/hidden-markov-model","display_name":"Hidden Markov model","score":0.5670852661132812},{"id":"https://openalex.org/keywords/source-separation","display_name":"Source separation","score":0.5204456448554993},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.4872232973575592},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.4840106666088104},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48013922572135925},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.43041715025901794},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.4114535450935364},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.2555990219116211},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.11128881573677063}],"concepts":[{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6779776811599731},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6627165079116821},{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.6257936954498291},{"id":"https://openalex.org/C45273575","wikidata":"https://www.wikidata.org/wiki/Q578970","display_name":"Spectrogram","level":2,"score":0.6241055727005005},{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.5988589525222778},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.5670852661132812},{"id":"https://openalex.org/C2776864781","wikidata":"https://www.wikidata.org/wiki/Q52617913","display_name":"Source separation","level":2,"score":0.5204456448554993},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.4872232973575592},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.4840106666088104},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48013922572135925},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.43041715025901794},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.4114535450935364},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.2555990219116211},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.11128881573677063},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.0},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tasl.2012.2231072","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tasl.2012.2231072","pdf_url":null,"source":{"id":"https://openalex.org/S199497470","display_name":"IEEE Transactions on Audio Speech and Language Processing","issn_l":"1558-7916","issn":["1558-7916","1558-7924"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Audio, Speech, and Language Processing","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.4000000059604645,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W146976060","https://openalex.org/W185399533","https://openalex.org/W196049401","https://openalex.org/W1485161427","https://openalex.org/W1488912948","https://openalex.org/W1528056001","https://openalex.org/W1543025785","https://openalex.org/W1544503773","https://openalex.org/W1574263887","https://openalex.org/W1801637500","https://openalex.org/W1963835294","https://openalex.org/W2008900415","https://openalex.org/W2031696998","https://openalex.org/W2039844283","https://openalex.org/W2107288886","https://openalex.org/W2115283881","https://openalex.org/W2117042571","https://openalex.org/W2117150818","https://openalex.org/W2118522520","https://openalex.org/W2121894251","https://openalex.org/W2121973264","https://openalex.org/W2127851351","https://openalex.org/W2128402994","https://openalex.org/W2130789253","https://openalex.org/W2134807719","https://openalex.org/W2149648698","https://openalex.org/W2150415460","https://openalex.org/W2150574373","https://openalex.org/W2152457943","https://openalex.org/W2152753389","https://openalex.org/W2155355606","https://openalex.org/W2155531311","https://openalex.org/W2157342986","https://openalex.org/W2157885315","https://openalex.org/W2164162335","https://openalex.org/W2168793898","https://openalex.org/W2395107641","https://openalex.org/W2403025337","https://openalex.org/W4285719527","https://openalex.org/W6607486085","https://openalex.org/W6629347297","https://openalex.org/W6632614696","https://openalex.org/W6677513291","https://openalex.org/W6682181234","https://openalex.org/W6684458083"],"related_works":["https://openalex.org/W2098101267","https://openalex.org/W2403380333","https://openalex.org/W2558565288","https://openalex.org/W1488912948","https://openalex.org/W2152457943","https://openalex.org/W2008565517","https://openalex.org/W2611465255","https://openalex.org/W2155531311","https://openalex.org/W2774675727","https://openalex.org/W1965243342"],"abstract_inverted_index":{"In":[0],"this":[1],"study,":[2],"we":[3,20],"describe":[4],"a":[5,14,22,42,54,68,93,131],"mixture":[6,57,128],"model":[7,24,58,89,129],"based":[8],"single-channel":[9],"speech-music":[10,137],"separation":[11,138],"method.":[12],"Given":[13],"catalog":[15],"of":[16,78,86],"background":[17,33,48],"music":[18,30,34,49],"material,":[19],"propose":[21],"generative":[23],"for":[25,154],"the":[26,45,60,75,87,97,126,158,172],"superposed":[27],"speech":[28,63,88,141,173],"and":[29,106,117,139],"spectrograms.":[31],"The":[32,47,62,84,100],"signal":[35,64],"is":[36,51,65,72,90,102],"assumed":[37],"to":[38,74,114],"be":[39],"generated":[40],"by":[41,53,67],"jingle":[43,159],"in":[44,92,136],"catalog.":[46],"component":[50],"modeled":[52,66],"scaled":[55],"conditional":[56],"representing":[59],"jingle.":[61],"probabilistic":[69,76],"model,":[70],"which":[71],"similar":[73],"interpretation":[77],"Non-negative":[79],"Matrix":[80],"Factorization":[81],"(NMF)":[82],"model.":[83],"parameters":[85],"estimated":[91],"semi-supervised":[94],"manner":[95],"from":[96],"mixed":[98],"signal.":[99],"approach":[101],"tested":[103],"with":[104,164],"Poisson":[105],"complex":[107],"Gaussian":[108],"observation":[109],"models":[110],"that":[111,125,168],"correspond":[112],"respectively":[113],"Kullback-Leibler":[115],"(KL)":[116],"Itakura-Saito":[118],"(IS)":[119],"divergence":[120],"measures.":[121],"Our":[122,161],"experiments":[123],"show":[124,167],"proposed":[127],"outperforms":[130],"standard":[132],"NMF":[133],"method":[134,170],"both":[135],"automatic":[140],"recognition":[142,174],"(ASR)":[143],"tasks.":[144],"These":[145],"results":[146,163],"are":[147],"further":[148],"improved":[149],"using":[150],"Markovian":[151],"prior":[152],"structures":[153],"temporal":[155],"continuity":[156],"between":[157],"frames.":[160],"test":[162],"real":[165],"data":[166],"our":[169],"increases":[171],"performance.":[175]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":5},{"year":2013,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
