{"id":"https://openalex.org/W2061292150","doi":"https://doi.org/10.1145/1324172.1324175","title":"Learning correlations using the mixture-of-subsets model","display_name":"Learning correlations using the mixture-of-subsets model","publication_year":2008,"publication_date":"2008-01-01","ids":{"openalex":"https://openalex.org/W2061292150","doi":"https://doi.org/10.1145/1324172.1324175","mag":"2061292150"},"language":"en","primary_location":{"id":"doi:10.1145/1324172.1324175","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1324172.1324175","pdf_url":null,"source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055224128","display_name":"Manas Somaiya","orcid":null},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Manas Somaiya","raw_affiliation_strings":["University of Florida, Gainesville, FL"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Florida, Gainesville, FL","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109437922","display_name":"Christopher Jermaine","orcid":null},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Jermaine","raw_affiliation_strings":["University of Florida, Gainesville, FL"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Florida, Gainesville, FL","institution_ids":["https://openalex.org/I33213144"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077570468","display_name":"Sanjay Ranka","orcid":"https://orcid.org/0000-0003-4886-1988"},"institutions":[{"id":"https://openalex.org/I33213144","display_name":"University of Florida","ror":"https://ror.org/02y3ad647","country_code":"US","type":"education","lineage":["https://openalex.org/I33213144"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sanjay Ranka","raw_affiliation_strings":["University of Florida, Gainesville, FL"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Florida, Gainesville, FL","institution_ids":["https://openalex.org/I33213144"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I33213144"],"apc_list":null,"apc_paid":null,"fwci":1.1756,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.84299891,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":"1","issue":"4","first_page":"1","last_page":"42"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mixture-model","display_name":"Mixture model","score":0.7731112837791443},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6854812502861023},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.6739846467971802},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5662588477134705},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5189811587333679},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.49992942810058594},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.4904422461986542},{"id":"https://openalex.org/keywords/data-point","display_name":"Data point","score":0.48128288984298706},{"id":"https://openalex.org/keywords/statistical-model","display_name":"Statistical model","score":0.4806469976902008},{"id":"https://openalex.org/keywords/data-set","display_name":"Data set","score":0.4728287160396576},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4700887203216553},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.45836883783340454},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3569129705429077},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.22794294357299805}],"concepts":[{"id":"https://openalex.org/C61224824","wikidata":"https://www.wikidata.org/wiki/Q2260434","display_name":"Mixture model","level":2,"score":0.7731112837791443},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6854812502861023},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.6739846467971802},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5662588477134705},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5189811587333679},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.49992942810058594},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.4904422461986542},{"id":"https://openalex.org/C21080849","wikidata":"https://www.wikidata.org/wiki/Q13611879","display_name":"Data point","level":2,"score":0.48128288984298706},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.4806469976902008},{"id":"https://openalex.org/C58489278","wikidata":"https://www.wikidata.org/wiki/Q1172284","display_name":"Data set","level":2,"score":0.4728287160396576},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4700887203216553},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.45836883783340454},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3569129705429077},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.22794294357299805},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/1324172.1324175","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1324172.1324175","pdf_url":null,"source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.330.763","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.330.763","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.cise.ufl.edu/~cjermain/Manas.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G5435763505","display_name":null,"funder_award_id":"CCF-0325459IIS-0347408IIS-0612170","funder_id":"https://openalex.org/F4320337389","funder_display_name":"Division of Information and Intelligent Systems"},{"id":"https://openalex.org/G8655500934","display_name":null,"funder_award_id":"CCF-0325459IIS-0347408IIS-0612170","funder_id":"https://openalex.org/F4320337387","funder_display_name":"Division of Computing and Communication Foundations"}],"funders":[{"id":"https://openalex.org/F4320337387","display_name":"Division of Computing and Communication Foundations","ror":"https://ror.org/01mng8331"},{"id":"https://openalex.org/F4320337389","display_name":"Division of Information and Intelligent Systems","ror":"https://ror.org/053a2cp42"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W263845233","https://openalex.org/W1486632395","https://openalex.org/W1506285740","https://openalex.org/W1551893515","https://openalex.org/W1579271636","https://openalex.org/W1974708480","https://openalex.org/W1977496278","https://openalex.org/W1992402718","https://openalex.org/W1995433152","https://openalex.org/W1995639191","https://openalex.org/W2036632921","https://openalex.org/W2042035594","https://openalex.org/W2049633694","https://openalex.org/W2065811242","https://openalex.org/W2072343647","https://openalex.org/W2072974396","https://openalex.org/W2080816440","https://openalex.org/W2094909687","https://openalex.org/W2107551505","https://openalex.org/W2112210867","https://openalex.org/W2115875363","https://openalex.org/W2117848638","https://openalex.org/W2127097022","https://openalex.org/W2128002512","https://openalex.org/W2138072998","https://openalex.org/W2152012752","https://openalex.org/W2434205482","https://openalex.org/W2488678869","https://openalex.org/W2977466517","https://openalex.org/W4244268470","https://openalex.org/W4254311734"],"related_works":["https://openalex.org/W2545529375","https://openalex.org/W2924917467","https://openalex.org/W2073891040","https://openalex.org/W2745792676","https://openalex.org/W3128438030","https://openalex.org/W1510133244","https://openalex.org/W1968042686","https://openalex.org/W2009059033","https://openalex.org/W2333793080","https://openalex.org/W4206278474"],"abstract_inverted_index":{"Using":[0],"a":[1,10,47,53,78,99,106,113,141],"mixture":[2,23,43,94],"of":[3,61,108,121,166],"random":[4],"variables":[5],"to":[6,29,67,91,102,135],"model":[7,31,44,84,139,157],"data":[8,15,35,48,100,122,161,168],"is":[9,26,50],"tried-and-tested":[11],"method":[12],"common":[13],"in":[14,56],"mining,":[16],"machine":[17],"learning,":[18],"and":[19,143],"statistics.":[20],"By":[21],"using":[22],"modeling":[24],"it":[25,146],"often":[27],"possible":[28],"accurately":[30],"even":[32],"complex,":[33],"multimodal":[34],"via":[36],"very":[37],"simple":[38],"components.":[39],"However,":[40],"the":[41,57,68,81,92,119,137,155,160,163,167],"classical":[42,93],"assumes":[45],"that":[46,124,154],"point":[49,101],"generated":[51,104],"by":[52,86,105],"single":[54,114],"component":[55,126],"model.":[58,95],"A":[59],"lot":[60],"datasets":[62],"can":[63,127],"be":[64,103],"modeled":[65],"closer":[66],"underlying":[69,164],"reality":[70],"if":[71],"we":[72,97,117],"drop":[73],"this":[74],"restriction.":[75],"We":[76,129],"propose":[77,131],"probabilistic":[79],"framework,":[80],"mixture-of-subsets":[82],"(MOS)":[83],",":[85],"making":[87],"two":[88],"fundamental":[89],"changes":[90],"First,":[96],"allow":[98],"set":[107],"components,":[109],"rather":[110],"than":[111],"just":[112],"component.":[115],"Next,":[116],"limit":[118],"number":[120],"attributes":[123],"each":[125],"influence.":[128],"also":[130],"an":[132],"EM":[133],"framework":[134],"learn":[136],"MOS":[138,156],"from":[140,159],"dataset,":[142],"experimentally":[144],"evaluate":[145],"on":[147],"real,":[148],"high-dimensional":[149],"datasets.":[150],"Our":[151],"results":[152],"show":[153],"learned":[158],"represents":[162],"nature":[165],"accurately.":[169]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2012,"cited_by_count":3}],"updated_date":"2026-06-26T08:34:08.712188","created_date":"2025-10-10T00:00:00"}
