{"id":"https://openalex.org/W2567439001","doi":"https://doi.org/10.1109/uemcon.2016.7777818","title":"Expectation-maximization algorithm for topic modeling on big data streams","display_name":"Expectation-maximization algorithm for topic modeling on big data streams","publication_year":2016,"publication_date":"2016-10-01","ids":{"openalex":"https://openalex.org/W2567439001","doi":"https://doi.org/10.1109/uemcon.2016.7777818","mag":"2567439001"},"language":"en","primary_location":{"id":"doi:10.1109/uemcon.2016.7777818","is_oa":false,"landing_page_url":"https://doi.org/10.1109/uemcon.2016.7777818","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE 7th Annual Ubiquitous Computing, Electronics &amp; Mobile Communication Conference (UEMCON)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091290189","display_name":"Walisa Romsaiyud","orcid":"https://orcid.org/0000-0002-4529-8715"},"institutions":[{"id":"https://openalex.org/I60697786","display_name":"Sukhothai Thammathirat Open University","ror":"https://ror.org/00epajq42","country_code":"TH","type":"education","lineage":["https://openalex.org/I60697786"]}],"countries":["TH"],"is_corresponding":true,"raw_author_name":"Walisa Romsaiyud","raw_affiliation_strings":["School of Science and Technology, Sukhothai Thammathirat Open University, Pakkret, Nonthaburi, Thailand"],"affiliations":[{"raw_affiliation_string":"School of Science and Technology, Sukhothai Thammathirat Open University, Pakkret, Nonthaburi, Thailand","institution_ids":["https://openalex.org/I60697786"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5091290189"],"corresponding_institution_ids":["https://openalex.org/I60697786"],"apc_list":null,"apc_paid":null,"fwci":4.1305,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.93484995,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"105","issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.982699990272522,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13398","display_name":"Data Analysis with R","score":0.9815000295639038,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9750999808311462,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7981712818145752},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.703637957572937},{"id":"https://openalex.org/keywords/expectation\u2013maximization-algorithm","display_name":"Expectation\u2013maximization algorithm","score":0.6370294690132141},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5985136032104492},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.5850605964660645},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.4730609655380249},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.44608747959136963},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.44160598516464233},{"id":"https://openalex.org/keywords/centroid","display_name":"Centroid","score":0.4338746666908264},{"id":"https://openalex.org/keywords/maximization","display_name":"Maximization","score":0.4219844341278076},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.38676774501800537},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.35364484786987305},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.32404381036758423},{"id":"https://openalex.org/keywords/maximum-likelihood","display_name":"Maximum likelihood","score":0.2519261837005615},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.11008471250534058},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.10851892828941345},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.10010647773742676}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7981712818145752},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.703637957572937},{"id":"https://openalex.org/C182081679","wikidata":"https://www.wikidata.org/wiki/Q1275153","display_name":"Expectation\u2013maximization algorithm","level":3,"score":0.6370294690132141},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5985136032104492},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.5850605964660645},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.4730609655380249},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.44608747959136963},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.44160598516464233},{"id":"https://openalex.org/C146599234","wikidata":"https://www.wikidata.org/wiki/Q511093","display_name":"Centroid","level":2,"score":0.4338746666908264},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.4219844341278076},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.38676774501800537},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.35364484786987305},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.32404381036758423},{"id":"https://openalex.org/C49781872","wikidata":"https://www.wikidata.org/wiki/Q1045555","display_name":"Maximum likelihood","level":2,"score":0.2519261837005615},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.11008471250534058},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.10851892828941345},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.10010647773742676},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/uemcon.2016.7777818","is_oa":false,"landing_page_url":"https://doi.org/10.1109/uemcon.2016.7777818","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2016 IEEE 7th Annual Ubiquitous Computing, Electronics &amp; Mobile Communication Conference (UEMCON)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W1753361524","https://openalex.org/W1880262756","https://openalex.org/W1964082888","https://openalex.org/W1965614296","https://openalex.org/W1991255919","https://openalex.org/W1992196410","https://openalex.org/W2001932471","https://openalex.org/W2008225289","https://openalex.org/W2045631398","https://openalex.org/W2049449085","https://openalex.org/W2054052884","https://openalex.org/W2072644219","https://openalex.org/W2140190241","https://openalex.org/W2175075972","https://openalex.org/W2255966421","https://openalex.org/W2324749769","https://openalex.org/W2399067544","https://openalex.org/W4231510805","https://openalex.org/W4232159537","https://openalex.org/W4302990361","https://openalex.org/W6639619044","https://openalex.org/W6680704940"],"related_works":["https://openalex.org/W2381926679","https://openalex.org/W2611300636","https://openalex.org/W2082644203","https://openalex.org/W3165040664","https://openalex.org/W2007009951","https://openalex.org/W2350539780","https://openalex.org/W1976188970","https://openalex.org/W2990541822","https://openalex.org/W1588885902","https://openalex.org/W1965352811"],"abstract_inverted_index":{"Expectation-Maximization":[0],"(EM)":[1],"is":[2],"typically":[3],"used":[4],"to":[5,146,159],"compute":[6],"maximum":[7],"likelihood":[8],"estimates":[9],"given":[10],"incomplete":[11],"samples":[12],"and":[13,33,122,155,163,176],"estimated":[14],"the":[15,36,60,70,96,107,111,115,119,161,166],"parameters.":[16],"We":[17],"proposed":[18,44],"a":[19,30,80,124,128,133],"new":[20],"algorithm":[21,45,71],"for":[22,55,98,117],"generating":[23],"an":[24],"extension":[25],"Dynamic":[26],"Topic":[27],"Model":[28],"(exDTM)-in":[29],"time-based":[31],"manner":[32],"based":[34],"on":[35,41,170],"distribution":[37,109],"of":[38,59,110,114,152],"documents":[39,51,116],"topics":[40],"Spark.":[42],"The":[43,76,103],"can":[46],"be":[47],"applied":[48,169],"in":[49,84],"clustering":[50,81],"from":[52,89,142],"data":[53,91],"streams":[54],"threat":[56],"cyberbullying":[57,174],"detection":[58],"collected":[61,88,141],"datasets":[62,140],"that":[63],"continuously":[64],"change":[65],"over":[66,132],"time.":[67,135],"In":[68,136,157],"particular,":[69],"includes":[72],"two":[73],"main":[74],"methods.":[75],"first":[77],"method":[78,82,94,105],"introduces":[79],"rooted":[83],"content-based":[85],"coded":[86],"dialogues":[87],"several":[90],"sources.":[92],"This":[93],"measures":[95],"centroid":[97],"each":[99],"cluster":[100],"with":[101],"EM.":[102],"second":[104],"calculates":[106],"joint":[108],"latent":[112],"variables":[113],"finding":[118],"posterior":[120],"distribution,":[121],"generates":[123],"final":[125],"model":[126],"using":[127,149],"variational":[129],"Bayesian":[130],"inference":[131],"sequential":[134],"this":[137],"experiment,":[138],"authentic":[139],"year":[143],"-":[144,148],"2010":[145],"2011":[147],"corpus-wide":[150],"patterns":[151],"words-were":[153],"analyzed":[154],"studied.":[156],"order":[158],"enhance":[160],"reliability":[162],"computation":[164],"time,":[165],"methods":[167],"were":[168],"real-life":[171],"settings":[172],"where":[173],"features":[175,178],"user-based":[177],"had":[179],"experienced.":[180]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2017,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
