{"id":"https://openalex.org/W2088304067","doi":"https://doi.org/10.1109/mlsp.2013.6661902","title":"Blocked Gibbs sampling based multi-scale mixture model for speaker clustering on noisy data","display_name":"Blocked Gibbs sampling based multi-scale mixture model for speaker clustering on noisy data","publication_year":2013,"publication_date":"2013-09-01","ids":{"openalex":"https://openalex.org/W2088304067","doi":"https://doi.org/10.1109/mlsp.2013.6661902","mag":"2088304067"},"language":"en","primary_location":{"id":"doi:10.1109/mlsp.2013.6661902","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp.2013.6661902","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5073111123","display_name":"Naohiro Tawara","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Naohiro Tawara","raw_affiliation_strings":["Waseda University, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Waseda University, Tokyo, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087632404","display_name":"Tetsuji Ogawa","orcid":"https://orcid.org/0000-0002-7316-2073"},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tetsuji Ogawa","raw_affiliation_strings":["Waseda University, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Waseda University, Tokyo, Japan","institution_ids":["https://openalex.org/I150744194"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001291873","display_name":"Shinji Watanabe","orcid":"https://orcid.org/0000-0002-5970-8631"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]},{"id":"https://openalex.org/I1306287861","display_name":"Mitsubishi Group (Japan)","ror":"https://ror.org/0234cd281","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861"]}],"countries":["JP","US"],"is_corresponding":false,"raw_author_name":"Shinji Watanabe","raw_affiliation_strings":["Mitsubishi Electric Research, Laboratories (MERL), MA, USA","Labs. (MERL), Mitsubishi Electr. Res., Cambridge, MA, USA"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research, Laboratories (MERL), MA, USA","institution_ids":["https://openalex.org/I4210159266"]},{"raw_affiliation_string":"Labs. (MERL), Mitsubishi Electr. Res., Cambridge, MA, USA","institution_ids":["https://openalex.org/I1306287861"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018620798","display_name":"Atsushi Nakamura","orcid":"https://orcid.org/0000-0003-0788-2221"},"institutions":[{"id":"https://openalex.org/I2251713219","display_name":"NTT (Japan)","ror":"https://ror.org/00berct97","country_code":"JP","type":"company","lineage":["https://openalex.org/I2251713219"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Atsushi Nakamura","raw_affiliation_strings":["NTT Communication Science Laboratories, NTT Corporation, Kyoto, Japan","NTT Commun. Sci. Lab., NTT Corp., Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"NTT Communication Science Laboratories, NTT Corporation, Kyoto, Japan","institution_ids":["https://openalex.org/I2251713219"]},{"raw_affiliation_string":"NTT Commun. Sci. Lab., NTT Corp., Kyoto, Japan","institution_ids":["https://openalex.org/I2251713219"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101188700","display_name":"Tetsunori Kobayashi","orcid":null},"institutions":[{"id":"https://openalex.org/I150744194","display_name":"Waseda University","ror":"https://ror.org/00ntfnx83","country_code":"JP","type":"education","lineage":["https://openalex.org/I150744194"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Tetsunori Kobayashi","raw_affiliation_strings":["Waseda University, Tokyo, Japan"],"affiliations":[{"raw_affiliation_string":"Waseda University, Tokyo, Japan","institution_ids":["https://openalex.org/I150744194"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5073111123"],"corresponding_institution_ids":["https://openalex.org/I150744194"],"apc_list":null,"apc_paid":null,"fwci":0.4809,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.76609749,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9991000294685364,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.8940230011940002},{"id":"https://openalex.org/keywords/gibbs-sampling","display_name":"Gibbs sampling","score":0.808454155921936},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.701213002204895},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5814502239227295},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.5797784924507141},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.540353536605835},{"id":"https://openalex.org/keywords/hierarchical-clustering","display_name":"Hierarchical clustering","score":0.470790296792984},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.46819835901260376},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4646807014942169},{"id":"https://openalex.org/keywords/slice-sampling","display_name":"Slice sampling","score":0.4628187119960785},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4241056740283966},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.41062474250793457},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.35318613052368164},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3369009494781494},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.1994008719921112},{"id":"https://openalex.org/keywords/markov-chain-monte-carlo","display_name":"Markov chain Monte Carlo","score":0.17372938990592957}],"concepts":[{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.8940230011940002},{"id":"https://openalex.org/C158424031","wikidata":"https://www.wikidata.org/wiki/Q1191905","display_name":"Gibbs sampling","level":3,"score":0.808454155921936},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.701213002204895},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5814502239227295},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.5797784924507141},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.540353536605835},{"id":"https://openalex.org/C92835128","wikidata":"https://www.wikidata.org/wiki/Q1277447","display_name":"Hierarchical clustering","level":3,"score":0.470790296792984},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.46819835901260376},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4646807014942169},{"id":"https://openalex.org/C170593435","wikidata":"https://www.wikidata.org/wiki/Q4128565","display_name":"Slice sampling","level":4,"score":0.4628187119960785},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4241056740283966},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.41062474250793457},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.35318613052368164},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3369009494781494},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.1994008719921112},{"id":"https://openalex.org/C111350023","wikidata":"https://www.wikidata.org/wiki/Q1191869","display_name":"Markov chain Monte Carlo","level":3,"score":0.17372938990592957},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/mlsp.2013.6661902","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mlsp.2013.6661902","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE International Workshop on Machine Learning for Signal Processing (MLSP)","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.403.3440","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.403.3440","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1989879829","https://openalex.org/W1994683528","https://openalex.org/W2041823554","https://openalex.org/W2069739265","https://openalex.org/W2090361527","https://openalex.org/W2100969003","https://openalex.org/W2135624821","https://openalex.org/W2141262306","https://openalex.org/W2148348093","https://openalex.org/W2159598197","https://openalex.org/W2167270514","https://openalex.org/W2168025753","https://openalex.org/W2406103520","https://openalex.org/W4212863985","https://openalex.org/W4233135949","https://openalex.org/W4237791300","https://openalex.org/W6680230631","https://openalex.org/W6681819875"],"related_works":["https://openalex.org/W2517377710","https://openalex.org/W1197719229","https://openalex.org/W2381158726","https://openalex.org/W1992796048","https://openalex.org/W2129090883","https://openalex.org/W1516392727","https://openalex.org/W2379906719","https://openalex.org/W2045761178","https://openalex.org/W2412815366","https://openalex.org/W2088304067"],"abstract_inverted_index":{"A":[0],"novel":[1],"sampling":[2,81,122,129],"method":[3,123],"is":[4,30,82,135],"proposed":[5,136,161],"for":[6,140],"estimating":[7],"a":[8,20,33,83,117,142],"continuous":[9],"multi-scale":[10,14],"mixture":[11,15,29,35,67],"model.":[12],"The":[13],"models":[16,91],"we":[17],"assume":[18],"have":[19],"hierarchical":[21],"structure":[22],"in":[23,52,78,111,146],"which":[24],"each":[25],"component":[26],"of":[27,62,68],"the":[28,50,53,60,66,76,96,106,126,147,160,166,175],"represented":[31],"by":[32,169],"Gaussian":[34],"model":[36,148,163],"(GMM).":[37],"In":[38,153],"speaker":[39,154],"modeling":[40],"from":[41,49,75],"speech,":[42],"this":[43,115],"GMM":[44],"represents":[45,71],"intra-speaker":[46],"dynamics":[47,73],"derived":[48,74],"difference":[51,77],"attributes":[54],"such":[55,88],"as":[56],"phoneme":[57],"contexts":[58],"and":[59,65,120,130,137],"existence":[61],"non-stationary":[63,158],"noise":[64],"GMMs":[69,108],"(MoGMMs)":[70],"inter-speaker":[72],"speakers.":[79],"Gibbs":[80,128],"powerful":[84],"technique":[85],"to":[86,174],"estimate":[87],"hierarchically":[89],"structured":[90],"but":[92],"can":[93],"easily":[94],"induce":[95],"local":[97],"optima":[98],"problem":[99],"depending":[100],"on":[101,125,171],"its":[102],"use":[103],"especially":[104],"when":[105],"elemental":[107],"are":[109],"complex":[110,150],"structure.":[112],"To":[113],"solve":[114],"problem,":[116],"highly":[118],"accurate":[119],"robust":[121],"based":[124],"blocked":[127],"iterative":[131],"conditional":[132],"modes":[133],"(ICM)":[134],"effectively":[138],"applied":[139],"reducing":[141],"singularity":[143],"solution":[144],"given":[145],"with":[149],"multi-modal":[151],"distributions.":[152],"clustering":[155,167],"experiments":[156],"under":[157],"noise,":[159],"sampling-based":[162,177],"estimation":[164],"improved":[165],"performance":[168],"17%":[170],"average":[172],"compared":[173],"conventional":[176],"methods.":[178]},"counts_by_year":[{"year":2015,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
