{"id":"https://openalex.org/W2810633914","doi":"https://doi.org/10.1145/3209978.3210189","title":"A Tutorial on Probabilistic Topic Models for Text Data Retrieval and Analysis","display_name":"A Tutorial on Probabilistic Topic Models for Text Data Retrieval and Analysis","publication_year":2018,"publication_date":"2018-06-27","ids":{"openalex":"https://openalex.org/W2810633914","doi":"https://doi.org/10.1145/3209978.3210189","mag":"2810633914"},"language":"en","primary_location":{"id":"doi:10.1145/3209978.3210189","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3209978.3210189","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 41st International ACM SIGIR Conference on Research &amp; Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028518494","display_name":"ChengXiang Zhai","orcid":"https://orcid.org/0000-0002-6434-3702"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"ChengXiang Zhai","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, Urbana, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, Urbana, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090089591","display_name":"Chase Geigle","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chase Geigle","raw_affiliation_strings":["University of Illinois at Urbana-Champaign, Urbana, IL, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign, Urbana, IL, USA","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5028518494"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":0.4887,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.72415352,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1395","last_page":"1398"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9979000091552734,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9871000051498413,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.77137291431427},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.5817878842353821},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5331028699874878},{"id":"https://openalex.org/keywords/divergence-from-randomness-model","display_name":"Divergence-from-randomness model","score":0.42015600204467773},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3395116925239563},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.29601970314979553}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.77137291431427},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.5817878842353821},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5331028699874878},{"id":"https://openalex.org/C149189445","wikidata":"https://www.wikidata.org/wiki/Q5283894","display_name":"Divergence-from-randomness model","level":3,"score":0.42015600204467773},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3395116925239563},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29601970314979553}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3209978.3210189","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3209978.3210189","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"The 41st International ACM SIGIR Conference on Research &amp; Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.7200000286102295}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W1880262756","https://openalex.org/W2107743791","https://openalex.org/W2511683478","https://openalex.org/W4233135949"],"related_works":["https://openalex.org/W4290792893","https://openalex.org/W2384888906","https://openalex.org/W2144190808","https://openalex.org/W1525335456","https://openalex.org/W1982975012","https://openalex.org/W2041706320","https://openalex.org/W2079379504","https://openalex.org/W2155482025","https://openalex.org/W2167619257","https://openalex.org/W2116496008"],"abstract_inverted_index":{"As":[0,31],"text":[1,26,29,40,85,98,108,121,148,151],"data":[2,27,41,122,221],"continues":[3],"to":[4,11,15,39,120,183,197,202,205],"grow":[5],"quickly,":[6],"it":[7],"is":[8],"increasingly":[9],"important":[10],"develop":[12],"intelligent":[13],"systems":[14],"help":[16],"people":[17],"manage":[18],"and":[19,43,57,79,92,107,114,127,143,150,166,174,186,217,239,246],"make":[20],"use":[21,206],"of":[22,25,35,97,160,227,243],"vast":[23],"amounts":[24],"(\"big":[28],"data'').":[30],"a":[32,90,194,224,241],"new":[33],"family":[34],"effective":[36],"general":[37,91,113],"approaches":[38],"retrieval":[42,106,149],"analysis,":[44],"probabilistic":[45,140],"topic":[46,72,141,170,191,208,232],"models---notably":[47],"Probabilistic":[48],"Latent":[49,53],"Semantic":[50],"Analysis":[51],"(PLSA),":[52],"Dirichlet":[54],"Allocations":[55],"(LDA),":[56],"their":[58,145],"many":[59,102],"extensions---have":[60],"been":[61],"studied":[62],"actively":[63],"in":[64,84,104,123,139,147,211],"the":[65,135,161,167,199,207,212,229],"past":[66],"decade":[67],"with":[68,219],"widespread":[69,178],"applications.":[70],"These":[71],"models":[73,142,171,209,233],"are":[74,112],"powerful":[75],"tools":[76],"for":[77,190],"extracting":[78],"analyzing":[80],"latent":[81,94],"topics":[82],"contained":[83],"data;":[86],"they":[87,111,116],"also":[88],"provide":[89],"robust":[93],"semantic":[95],"representation":[96],"data,":[99],"thus":[100],"improving":[101],"applications":[103,146],"information":[105],"mining.":[109,152],"Since":[110],"robust,":[115],"can":[117],"be":[118],"applied":[119],"any":[124,129],"natural":[125],"language":[126],"about":[128],"topics.":[130],"This":[131],"tutorial":[132,154,200],"systematically":[133],"reviews":[134],"major":[136,230,244],"research":[137,248],"progress":[138],"discuss":[144],"The":[153],"provides":[155],"(1)":[156],"an":[157,181],"in-depth":[158],"explanation":[159],"basic":[162,169],"concepts,":[163],"underlying":[164],"principles,":[165],"two":[168],"(i.e.,":[172],"PLSA":[173,236],"LDA)":[175],"that":[176,234],"have":[177],"applications,":[179],"(2)":[180],"introduction":[182],"EM":[184],"algorithms":[185,189],"Bayesian":[187],"inference":[188],"models,":[192],"(3)":[193],"hands-on":[195],"exercise":[196],"allow":[198],"attendants":[201],"learn":[203],"how":[204],"implemented":[210],"MeTA":[213],"Open":[214],"Source":[215],"Toolkit":[216],"experiment":[218],"provided":[220],"sets,":[222],"(4)":[223],"broad":[225],"overview":[226],"all":[228],"representative":[231],"extend":[235],"or":[237],"LDA,":[238],"(5)":[240],"discussion":[242],"challenges":[245],"future":[247],"directions.":[249]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
