{"id":"https://openalex.org/W2747754462","doi":"https://doi.org/10.1145/3095713.3095721","title":"Speaker Clustering Based on Non-Negative Matrix Factorization Using Gaussian Mixture Model in Complementary Subspace","display_name":"Speaker Clustering Based on Non-Negative Matrix Factorization Using Gaussian Mixture Model in Complementary Subspace","publication_year":2017,"publication_date":"2017-06-19","ids":{"openalex":"https://openalex.org/W2747754462","doi":"https://doi.org/10.1145/3095713.3095721","mag":"2747754462"},"language":"en","primary_location":{"id":"doi:10.1145/3095713.3095721","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3095713.3095721","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 15th International Workshop on Content-Based Multimedia Indexing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109009818","display_name":"Masafumi Nishida","orcid":null},"institutions":[{"id":"https://openalex.org/I1298590031","display_name":"Shizuoka University","ror":"https://ror.org/01w6wtk13","country_code":"JP","type":"education","lineage":["https://openalex.org/I1298590031"]}],"countries":["JP"],"is_corresponding":true,"raw_author_name":"Masafumi Nishida","raw_affiliation_strings":["Department of Informatics, Shizuoka University, Shizuoka, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Informatics, Shizuoka University, Shizuoka, Japan","institution_ids":["https://openalex.org/I1298590031"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086759974","display_name":"Seiichi Yamamoto","orcid":"https://orcid.org/0000-0002-1280-0043"},"institutions":[{"id":"https://openalex.org/I133984924","display_name":"Doshisha University","ror":"https://ror.org/01fxdkm29","country_code":"JP","type":"education","lineage":["https://openalex.org/I133984924"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Seiichi Yamamoto","raw_affiliation_strings":["Department of Information and Computer Science, Doshisha University, Kyoto, Japan"],"affiliations":[{"raw_affiliation_string":"Department of Information and Computer Science, Doshisha University, Kyoto, Japan","institution_ids":["https://openalex.org/I133984924"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5109009818"],"corresponding_institution_ids":["https://openalex.org/I1298590031"],"apc_list":null,"apc_paid":null,"fwci":0.195,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.61848355,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"5"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10860","display_name":"Speech and Audio Processing","score":0.9957000017166138,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11309","display_name":"Music and Audio Processing","score":0.9866999983787537,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.7046796083450317},{"id":"https://openalex.org/keywords/subspace-topology","display_name":"Subspace topology","score":0.6847509145736694},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.6804279685020447},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.6229063272476196},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.6193201541900635},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6097052693367004},{"id":"https://openalex.org/keywords/non-negative-matrix-factorization","display_name":"Non-negative matrix factorization","score":0.6062676310539246},{"id":"https://openalex.org/keywords/principal-component-analysis","display_name":"Principal component analysis","score":0.6025826334953308},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5568881630897522},{"id":"https://openalex.org/keywords/speaker-recognition","display_name":"Speaker recognition","score":0.5440700054168701},{"id":"https://openalex.org/keywords/gaussian-process","display_name":"Gaussian process","score":0.4337359666824341},{"id":"https://openalex.org/keywords/transformation","display_name":"Transformation (genetics)","score":0.4220195412635803},{"id":"https://openalex.org/keywords/gaussian","display_name":"Gaussian","score":0.41499146819114685},{"id":"https://openalex.org/keywords/matrix-decomposition","display_name":"Matrix decomposition","score":0.3934769630432129},{"id":"https://openalex.org/keywords/eigenvalues-and-eigenvectors","display_name":"Eigenvalues and eigenvectors","score":0.13446524739265442}],"concepts":[{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.7046796083450317},{"id":"https://openalex.org/C32834561","wikidata":"https://www.wikidata.org/wiki/Q660730","display_name":"Subspace topology","level":2,"score":0.6847509145736694},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.6804279685020447},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.6229063272476196},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.6193201541900635},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6097052693367004},{"id":"https://openalex.org/C152671427","wikidata":"https://www.wikidata.org/wiki/Q10843505","display_name":"Non-negative matrix factorization","level":4,"score":0.6062676310539246},{"id":"https://openalex.org/C27438332","wikidata":"https://www.wikidata.org/wiki/Q2873","display_name":"Principal component analysis","level":2,"score":0.6025826334953308},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5568881630897522},{"id":"https://openalex.org/C133892786","wikidata":"https://www.wikidata.org/wiki/Q1145189","display_name":"Speaker recognition","level":2,"score":0.5440700054168701},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.4337359666824341},{"id":"https://openalex.org/C204241405","wikidata":"https://www.wikidata.org/wiki/Q461499","display_name":"Transformation (genetics)","level":3,"score":0.4220195412635803},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.41499146819114685},{"id":"https://openalex.org/C42355184","wikidata":"https://www.wikidata.org/wiki/Q1361088","display_name":"Matrix decomposition","level":3,"score":0.3934769630432129},{"id":"https://openalex.org/C158693339","wikidata":"https://www.wikidata.org/wiki/Q190524","display_name":"Eigenvalues and eigenvectors","level":2,"score":0.13446524739265442},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3095713.3095721","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3095713.3095721","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 15th International Workshop on Content-Based Multimedia Indexing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6100000143051147,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W11080984","https://openalex.org/W76945434","https://openalex.org/W1482605500","https://openalex.org/W1578701839","https://openalex.org/W2034181906","https://openalex.org/W2137319143","https://openalex.org/W2144125830","https://openalex.org/W2159591770","https://openalex.org/W2162627003","https://openalex.org/W2401611834","https://openalex.org/W3034729383"],"related_works":["https://openalex.org/W4390394189","https://openalex.org/W2037504162","https://openalex.org/W2539013788","https://openalex.org/W2792706544","https://openalex.org/W1568451138","https://openalex.org/W2156699640","https://openalex.org/W2045265907","https://openalex.org/W2972997031","https://openalex.org/W34555840","https://openalex.org/W2146544734"],"abstract_inverted_index":{"Speech":[0],"feature":[1],"variations":[2,7],"are":[3,23],"mainly":[4],"attributed":[5],"to":[6],"in":[8,14,86,111],"phonetic":[9,44],"and":[10,60,107],"speaker":[11,30,41,72,88],"information":[12,22,42,105],"included":[13],"speech":[15],"data.":[16],"If":[17],"these":[18],"two":[19],"types":[20],"of":[21,95],"separated":[24],"from":[25,43],"each":[26],"other,":[27],"more":[28],"robust":[29],"clustering":[31,73,126],"can":[32,39,123],"be":[33],"achieved.":[34],"Principal":[35],"component":[36],"analysis":[37],"transformation":[38],"separate":[40],"information,":[45],"under":[46],"the":[47,87,96,120],"assumption":[48],"that":[49,119],"a":[50,57,61,66,71,81],"space":[51,62],"with":[52,99],"large":[53],"within-speaker":[54,63],"variance":[55,64],"is":[56,65],"\"phonetic":[58,67],"subspace\"":[59],"sub-space\".":[68],"We":[69,90],"propose":[70],"method":[74,98,122],"based":[75,102],"on":[76,103],"non-negative":[77],"matrix":[78],"factorization":[79],"using":[80],"Gaussian":[82,108],"mixture":[83,109],"model":[84,110],"trained":[85],"subspace.":[89],"carried":[91],"out":[92],"comparative":[93],"experiments":[94],"proposed":[97,121],"conventional":[100,129],"methods":[101],"Bayesian":[104],"criterion":[106],"an":[112],"observation":[113],"space.":[114],"The":[115],"experimental":[116],"results":[117],"showed":[118],"achieve":[124],"higher":[125],"accuracy":[127],"than":[128],"methods.":[130]},"counts_by_year":[{"year":2019,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
