{"id":"https://openalex.org/W4206085203","doi":"https://doi.org/10.1109/bigdata52589.2021.9671416","title":"Keyword-based Topic Modeling and Keyword Selection","display_name":"Keyword-based Topic Modeling and Keyword Selection","publication_year":2021,"publication_date":"2021-12-15","ids":{"openalex":"https://openalex.org/W4206085203","doi":"https://doi.org/10.1109/bigdata52589.2021.9671416"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata52589.2021.9671416","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata52589.2021.9671416","pdf_url":null,"source":{"id":"https://openalex.org/S4363607718","display_name":"2021 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100351265","display_name":"Xingyu Wang","orcid":"https://orcid.org/0000-0002-1190-4967"},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xingyu Wang","raw_affiliation_strings":["Northwestern University,Evanston,IL","Northwestern University, Evanston, IL"],"affiliations":[{"raw_affiliation_string":"Northwestern University,Evanston,IL","institution_ids":["https://openalex.org/I111979921"]},{"raw_affiliation_string":"Northwestern University, Evanston, IL","institution_ids":["https://openalex.org/I111979921"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072931223","display_name":"Lida Zhang","orcid":"https://orcid.org/0000-0002-5207-2458"},"institutions":[{"id":"https://openalex.org/I91045830","display_name":"Texas A&M University","ror":"https://ror.org/01f5ytq51","country_code":"US","type":"education","lineage":["https://openalex.org/I91045830"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lida Zhang","raw_affiliation_strings":["Texas A&#x0026;M University,College Station,TX"],"affiliations":[{"raw_affiliation_string":"Texas A&#x0026;M University,College Station,TX","institution_ids":["https://openalex.org/I91045830"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5013049879","display_name":"Diego Klabjan","orcid":"https://orcid.org/0000-0003-4213-9281"},"institutions":[{"id":"https://openalex.org/I111979921","display_name":"Northwestern University","ror":"https://ror.org/000e0be47","country_code":"US","type":"education","lineage":["https://openalex.org/I111979921"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Diego Klabjan","raw_affiliation_strings":["Northwestern University,Evanston,IL","Northwestern University, Evanston, IL"],"affiliations":[{"raw_affiliation_string":"Northwestern University,Evanston,IL","institution_ids":["https://openalex.org/I111979921"]},{"raw_affiliation_string":"Northwestern University, Evanston, IL","institution_ids":["https://openalex.org/I111979921"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100351265"],"corresponding_institution_ids":["https://openalex.org/I111979921"],"apc_list":null,"apc_paid":null,"fwci":0.2513,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.5235558,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1148","last_page":"1154"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9793999791145325,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9746000170707703,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8638216257095337},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.6591755151748657},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6285222768783569},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.595185399055481},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5726868510246277},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5445559024810791},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.5264407396316528},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5006134510040283},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.49884796142578125},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4501592218875885},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4368639290332794},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.4294176995754242},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.41507527232170105},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.32689228653907776},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.32264894247055054},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.32148247957229614}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8638216257095337},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.6591755151748657},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6285222768783569},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.595185399055481},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5726868510246277},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5445559024810791},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.5264407396316528},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5006134510040283},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.49884796142578125},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4501592218875885},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4368639290332794},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.4294176995754242},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41507527232170105},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.32689228653907776},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.32264894247055054},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32148247957229614},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata52589.2021.9671416","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata52589.2021.9671416","pdf_url":null,"source":{"id":"https://openalex.org/S4363607718","display_name":"2021 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W1525595230","https://openalex.org/W1854214752","https://openalex.org/W2064418625","https://openalex.org/W2072644219","https://openalex.org/W2105745072","https://openalex.org/W2107034620","https://openalex.org/W2108420397","https://openalex.org/W2109154616","https://openalex.org/W2113459411","https://openalex.org/W2140124448","https://openalex.org/W2145766604","https://openalex.org/W2149035855","https://openalex.org/W2156577800","https://openalex.org/W2163659824","https://openalex.org/W2165599843","https://openalex.org/W2181691731","https://openalex.org/W2207592857","https://openalex.org/W2547875792","https://openalex.org/W4206085203","https://openalex.org/W4231510805","https://openalex.org/W6631501603","https://openalex.org/W6639055396","https://openalex.org/W6639619044","https://openalex.org/W6675771100","https://openalex.org/W6676984168","https://openalex.org/W6681769576","https://openalex.org/W6683944584","https://openalex.org/W6684489972","https://openalex.org/W6688018400","https://openalex.org/W6729448088","https://openalex.org/W6773466343","https://openalex.org/W7011438494"],"related_works":["https://openalex.org/W2888805565","https://openalex.org/W4312773271","https://openalex.org/W4315588616","https://openalex.org/W2769501189","https://openalex.org/W2962686197","https://openalex.org/W2207653751","https://openalex.org/W4293863151","https://openalex.org/W3159709618","https://openalex.org/W2611137333","https://openalex.org/W3005513013"],"abstract_inverted_index":{"Certain":[0],"type":[1],"of":[2,13,17,39,55,76,118,122,153],"documents":[3,43,95],"such":[4],"as":[5],"tweets":[6,154],"are":[7],"collected":[8],"by":[9,105,169],"specifying":[10],"a":[11,67,74,107,120,126,147,157],"set":[12],"keywords.":[14,100],"As":[15],"topics":[16,50,54],"interest":[18,56],"change":[19],"with":[20,156],"time":[21],"it":[22],"is":[23,31,103],"beneficial":[24],"to":[25,35,78,81],"adjust":[26],"keywords":[27,77,90,123],"dynamically.":[28],"The":[29,48,85,101,115,160],"challenge":[30],"that":[32,71],"these":[33],"need":[34],"be":[36,60,79],"specified":[37,99],"ahead":[38],"knowing":[40],"the":[41,45,93,98,128,131,136,142],"forthcoming":[42,138],"and":[44,91,111],"underlying":[46,94,132],"topics.":[47],"future":[49,83],"should":[51,59],"mimic":[52],"past":[53],"yet":[57],"there":[58],"some":[61],"novelty":[62],"in":[63],"them.":[64],"We":[65,140],"develop":[66],"keyword-based":[68,161],"topic":[69,144,158,162],"model":[70,102,129,145,149,163,168],"dynamically":[72],"selects":[73,89],"subset":[75,121,127],"used":[80],"collect":[82],"documents.":[84,139],"generative":[86],"process":[87],"first":[88],"then":[92],"based":[96],"on":[97],"trained":[104],"using":[106,150],"variational":[108],"lower":[109],"bound":[110],"stochastic":[112],"gradient":[113],"optimization.":[114],"inference":[116],"consists":[117],"finding":[119],"where":[124],"given":[125],"predicts":[130],"topic-word":[133],"matrix":[134],"for":[135],"unknown":[137],"compare":[141],"keyword":[143],"against":[146],"benchmark":[148],"viral":[151],"predictions":[152],"combined":[155],"model.":[159],"outperforms":[164],"this":[165],"sophisticated":[166],"baseline":[167],"67%.":[170]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2021,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
