{"id":"https://openalex.org/W3009379225","doi":"https://doi.org/10.1145/3369873","title":"Probabilistic Topic Modeling for Comparative Analysis of Document Collections","display_name":"Probabilistic Topic Modeling for Comparative Analysis of Document Collections","publication_year":2020,"publication_date":"2020-03-04","ids":{"openalex":"https://openalex.org/W3009379225","doi":"https://doi.org/10.1145/3369873","mag":"3009379225"},"language":"en","primary_location":{"id":"doi:10.1145/3369873","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3369873","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3369873","source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3369873","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5103489156","display_name":"Ting Hua","orcid":null},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ting Hua","raw_affiliation_strings":["Virginia Tech"],"affiliations":[{"raw_affiliation_string":"Virginia Tech","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038002204","display_name":"Chang\u2010Tien Lu","orcid":"https://orcid.org/0000-0003-3675-0199"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chang-Tien Lu","raw_affiliation_strings":["Virginia Tech"],"affiliations":[{"raw_affiliation_string":"Virginia Tech","institution_ids":["https://openalex.org/I859038795"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047912015","display_name":"Jaegul Choo","orcid":"https://orcid.org/0000-0003-1071-4835"},"institutions":[{"id":"https://openalex.org/I197347611","display_name":"Korea University","ror":"https://ror.org/047dqcg40","country_code":"KR","type":"education","lineage":["https://openalex.org/I197347611"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jaegul Choo","raw_affiliation_strings":["Korea University, South Korea"],"affiliations":[{"raw_affiliation_string":"Korea University, South Korea","institution_ids":["https://openalex.org/I197347611"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001022750","display_name":"Chandan K. Reddy","orcid":"https://orcid.org/0000-0003-2839-3662"},"institutions":[{"id":"https://openalex.org/I859038795","display_name":"Virginia Tech","ror":"https://ror.org/02smfhw86","country_code":"US","type":"education","lineage":["https://openalex.org/I859038795"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chandan K. Reddy","raw_affiliation_strings":["Virginia Tech"],"affiliations":[{"raw_affiliation_string":"Virginia Tech","institution_ids":["https://openalex.org/I859038795"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5103489156"],"corresponding_institution_ids":["https://openalex.org/I859038795"],"apc_list":null,"apc_paid":null,"fwci":2.7428,"has_fulltext":true,"cited_by_count":28,"citation_normalized_percentile":{"value":0.91976508,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"14","issue":"2","first_page":"1","last_page":"27"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9991999864578247,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13910","display_name":"Computational and Text Analysis Methods","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/3300","display_name":"General Social Sciences"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7750802040100098},{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7269951105117798},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.7253382802009583},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.6242364645004272},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5148352980613708},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.4710155725479126},{"id":"https://openalex.org/keywords/document-classification","display_name":"Document classification","score":0.4184829294681549},{"id":"https://openalex.org/keywords/statistical-model","display_name":"Statistical model","score":0.41084030270576477},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3715527653694153},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3653795123100281},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.36315691471099854},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.35350292921066284}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7750802040100098},{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7269951105117798},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.7253382802009583},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.6242364645004272},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5148352980613708},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.4710155725479126},{"id":"https://openalex.org/C2780479914","wikidata":"https://www.wikidata.org/wiki/Q302088","display_name":"Document classification","level":2,"score":0.4184829294681549},{"id":"https://openalex.org/C114289077","wikidata":"https://www.wikidata.org/wiki/Q3284399","display_name":"Statistical model","level":2,"score":0.41084030270576477},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3715527653694153},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3653795123100281},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36315691471099854},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.35350292921066284}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3369873","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3369873","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3369873","source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1145/3369873","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3369873","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3369873","source":{"id":"https://openalex.org/S41523882","display_name":"ACM Transactions on Knowledge Discovery from Data","issn_l":"1556-4681","issn":["1556-4681","1556-472X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Knowledge Discovery from Data","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7900000214576721}],"awards":[{"id":"https://openalex.org/G2037717774","display_name":"III: Small: Collaborative Research: Global Event and Trend Archive Research (GETAR)","funder_award_id":"1619028","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2690932125","display_name":null,"funder_award_id":"IIS-1707498","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3034753964","display_name":null,"funder_award_id":"grant","funder_id":"https://openalex.org/F4320320671","funder_display_name":"National Research Foundation"},{"id":"https://openalex.org/G3223590597","display_name":null,"funder_award_id":"IIS-1619028","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3343279563","display_name":"III: Small: New Machine Learning Approaches for Modeling Time-to-Event Data","funder_award_id":"1707498","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G342704958","display_name":null,"funder_award_id":"funded","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G3942910960","display_name":null,"funder_award_id":"(NRF) grant","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G4782360968","display_name":null,"funder_award_id":"1838730","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6686156393","display_name":null,"funder_award_id":"Korean government (MSIP)","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G7815765994","display_name":null,"funder_award_id":"NRF2019","funder_id":"https://openalex.org/F4320322120","funder_display_name":"National Research Foundation of Korea"},{"id":"https://openalex.org/G7817772119","display_name":null,"funder_award_id":"IIS-1838730","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320322030","display_name":"Ministry of Science, ICT and Future Planning","ror":"https://ror.org/032e49973"},{"id":"https://openalex.org/F4320322120","display_name":"National Research Foundation of Korea","ror":"https://ror.org/013aysd81"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3009379225.pdf","grobid_xml":"https://content.openalex.org/works/W3009379225.grobid-xml"},"referenced_works_count":29,"referenced_works":["https://openalex.org/W1576326591","https://openalex.org/W1840615776","https://openalex.org/W1880262756","https://openalex.org/W1964346230","https://openalex.org/W2001587475","https://openalex.org/W2005564522","https://openalex.org/W2017966270","https://openalex.org/W2023326407","https://openalex.org/W2024428474","https://openalex.org/W2057990742","https://openalex.org/W2087382273","https://openalex.org/W2123751690","https://openalex.org/W2137340504","https://openalex.org/W2140124448","https://openalex.org/W2146341620","https://openalex.org/W2156693754","https://openalex.org/W2166851633","https://openalex.org/W2167686991","https://openalex.org/W2171343266","https://openalex.org/W2222512263","https://openalex.org/W2243453704","https://openalex.org/W2251283673","https://openalex.org/W2567736915","https://openalex.org/W2583743728","https://openalex.org/W2737946880","https://openalex.org/W2911243414","https://openalex.org/W2930957955","https://openalex.org/W4212863985","https://openalex.org/W4233135949"],"related_works":["https://openalex.org/W2768373660","https://openalex.org/W2703484599","https://openalex.org/W2743191757","https://openalex.org/W2008991527","https://openalex.org/W4297311563","https://openalex.org/W1995796873","https://openalex.org/W2598931156","https://openalex.org/W3159498945","https://openalex.org/W2018409826","https://openalex.org/W2594674086"],"abstract_inverted_index":{"Probabilistic":[0],"topic":[1],"models,":[2],"which":[3],"can":[4,48,111],"discover":[5],"hidden":[6],"patterns":[7],"in":[8,118],"documents,":[9],"have":[10],"been":[11],"extensively":[12],"studied.":[13],"However,":[14],"rather":[15],"than":[16],"learning":[17],"from":[18],"a":[19,27,44,63,71,91],"single":[20],"document":[21,35,69,79,120],"collection,":[22],"numerous":[23],"real-world":[24,119],"applications":[25],"demand":[26],"comprehensive":[28],"understanding":[29],"of":[30,55,73,101],"the":[31,50,99],"relationships":[32],"among":[33],"various":[34],"sets.":[36],"To":[37],"address":[38],"such":[39],"needs,":[40],"this":[41],"article":[42],"proposes":[43],"new":[45],"model":[46,110],"that":[47,66,87],"identify":[49],"common":[51,74],"and":[52,81],"discriminative":[53],"aspects":[54],"multiple":[56],"datasets.":[57],"Specifically,":[58],"our":[59,102],"proposed":[60,109],"method":[61,103],"is":[62],"Bayesian":[64],"approach":[65],"represents":[67],"each":[68],"as":[70],"combination":[72],"topics":[75,83],"(shared":[76],"across":[77],"all":[78],"sets)":[80],"distinctive":[82],"(distributions":[84],"over":[85],"words":[86],"are":[88],"exclusive":[89],"to":[90],"particular":[92],"dataset).":[93],"Through":[94],"extensive":[95],"experiments,":[96],"we":[97],"demonstrate":[98],"effectiveness":[100],"compared":[104],"with":[105],"state-of-the-art":[106],"models.":[107],"The":[108],"be":[112],"useful":[113],"for":[114],"\u201ccomparative":[115],"thinking\u201d":[116],"analysis":[117],"collections.":[121]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":6},{"year":2021,"cited_by_count":6}],"updated_date":"2026-03-18T14:38:29.013473","created_date":"2025-10-10T00:00:00"}
