{"id":"https://openalex.org/W4200428021","doi":"https://doi.org/10.1145/3488560.3498518","title":"Keyword Assisted Embedded Topic Model","display_name":"Keyword Assisted Embedded Topic Model","publication_year":2022,"publication_date":"2022-02-11","ids":{"openalex":"https://openalex.org/W4200428021","doi":"https://doi.org/10.1145/3488560.3498518"},"language":"en","primary_location":{"id":"doi:10.1145/3488560.3498518","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3488560.3498518","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3488560.3498518","source":{"id":"https://openalex.org/S4363608885","display_name":"Proceedings of the Fifteenth ACM International Conference on Web Search and Data Mining","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fifteenth ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3488560.3498518","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5066156038","display_name":"Bahareh Harandizadeh","orcid":null},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Bahareh Harandizadeh","raw_affiliation_strings":["University of Southern California, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079427575","display_name":"J. Hunter Priniski","orcid":null},"institutions":[{"id":"https://openalex.org/I161318765","display_name":"University of California, Los Angeles","ror":"https://ror.org/046rm7j60","country_code":"US","type":"education","lineage":["https://openalex.org/I161318765"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"J. Hunter Priniski","raw_affiliation_strings":["University of California, Los Angeles, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of California, Los Angeles, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I161318765"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5002709735","display_name":"Fred Morstatter","orcid":"https://orcid.org/0000-0002-0247-4328"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Fred Morstatter","raw_affiliation_strings":["University of Southern California, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5066156038"],"corresponding_institution_ids":["https://openalex.org/I1174212"],"apc_list":null,"apc_paid":null,"fwci":2.4002,"has_fulltext":true,"cited_by_count":23,"citation_normalized_percentile":{"value":0.90434552,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"372","last_page":"380"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9976000189781189,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.8968325853347778},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8599882125854492},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.8527034521102905},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5606889128684998},{"id":"https://openalex.org/keywords/vocabulary","display_name":"Vocabulary","score":0.5603856444358826},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5540307760238647},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5307531356811523},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5237388610839844},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.516715943813324},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.49896979331970215},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.49751904606819153},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.4913150370121002},{"id":"https://openalex.org/keywords/probabilistic-latent-semantic-analysis","display_name":"Probabilistic latent semantic analysis","score":0.483661025762558},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.46908703446388245},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.45055249333381653},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.4172886610031128},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.4101265072822571},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.1977194845676422}],"concepts":[{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.8968325853347778},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8599882125854492},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.8527034521102905},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5606889128684998},{"id":"https://openalex.org/C2777601683","wikidata":"https://www.wikidata.org/wiki/Q6499736","display_name":"Vocabulary","level":2,"score":0.5603856444358826},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5540307760238647},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5307531356811523},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5237388610839844},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.516715943813324},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.49896979331970215},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.49751904606819153},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.4913150370121002},{"id":"https://openalex.org/C112933361","wikidata":"https://www.wikidata.org/wiki/Q2845258","display_name":"Probabilistic latent semantic analysis","level":2,"score":0.483661025762558},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.46908703446388245},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.45055249333381653},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.4172886610031128},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.4101265072822571},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.1977194845676422},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3488560.3498518","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3488560.3498518","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3488560.3498518","source":{"id":"https://openalex.org/S4363608885","display_name":"Proceedings of the Fifteenth ACM International Conference on Web Search and Data Mining","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fifteenth ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2112.03101","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2112.03101","pdf_url":"https://arxiv.org/pdf/2112.03101","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3488560.3498518","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3488560.3498518","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3488560.3498518","source":{"id":"https://openalex.org/S4363608885","display_name":"Proceedings of the Fifteenth ACM International Conference on Web Search and Data Mining","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Fifteenth ACM International Conference on Web Search and Data Mining","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","score":0.8199999928474426,"display_name":"Quality Education"}],"awards":[{"id":"https://openalex.org/G2824684834","display_name":null,"funder_award_id":"W911NF-21-C-0002","funder_id":"https://openalex.org/F4320332180","funder_display_name":"Defense Advanced Research Projects Agency"},{"id":"https://openalex.org/G5524522455","display_name":null,"funder_award_id":"DARPA","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G7452299184","display_name":null,"funder_award_id":"W911NF","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G8576428936","display_name":null,"funder_award_id":"W911NF-21-C-0002","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G8998121839","display_name":null,"funder_award_id":"911NF","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"}],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320332815","display_name":"Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320338281","display_name":"Army Research Office","ror":"https://ror.org/05epdh915"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4200428021.pdf","grobid_xml":"https://content.openalex.org/works/W4200428021.grobid-xml"},"referenced_works_count":23,"referenced_works":["https://openalex.org/W43037342","https://openalex.org/W1506246224","https://openalex.org/W1614298861","https://openalex.org/W1983719983","https://openalex.org/W2098062695","https://openalex.org/W2122683976","https://openalex.org/W2159426623","https://openalex.org/W2250533720","https://openalex.org/W2250539671","https://openalex.org/W2737946880","https://openalex.org/W2888507208","https://openalex.org/W2912500072","https://openalex.org/W2914138217","https://openalex.org/W2914304175","https://openalex.org/W2952478253","https://openalex.org/W3004119480","https://openalex.org/W3045464143","https://openalex.org/W3098852527","https://openalex.org/W3099045991","https://openalex.org/W3100474067","https://openalex.org/W4294170691","https://openalex.org/W4301230818","https://openalex.org/W4362454468"],"related_works":["https://openalex.org/W1551384396","https://openalex.org/W2096865229","https://openalex.org/W2921491680","https://openalex.org/W2251863249","https://openalex.org/W4291700620","https://openalex.org/W2132052677","https://openalex.org/W3159709618","https://openalex.org/W2891616219","https://openalex.org/W4396666968","https://openalex.org/W2110027950"],"abstract_inverted_index":{"By":[0],"illuminating":[1],"latent":[2,29,44],"structures":[3],"in":[4,36,62,115,149],"a":[5,41,86,133],"corpus":[6],"of":[7,22,43,85,90,118],"text,":[8],"topic":[9,25,134],"models":[10,148],"are":[11,38,75],"an":[12],"essential":[13],"tool":[14],"for":[15,152],"categorizing,":[16],"summarizing,":[17],"and":[18,72,129],"exploring":[19],"large":[20],"collections":[21],"documents.":[23],"Probabilistic":[24],"models,":[26,77],"such":[27],"as":[28],"Dirichlet":[30],"allocation":[31],"(LDA),":[32],"describe":[33],"how":[34],"words":[35],"documents":[37],"generated":[39],"via":[40],"set":[42],"distributions":[45],"called":[46],"topics.":[47,69],"Recently,":[48],"the":[49,59,91,98,109,116,123,150],"Embedded":[50,101],"Topic":[51,102],"Model":[52,103],"(ETM)":[53],"has":[54],"extended":[55],"LDA":[56,71],"to":[57,65,81,111],"utilize":[58],"semantic":[60],"information":[61],"word":[63],"embeddings":[64],"derive":[66],"semantically":[67],"richer":[68],"As":[70],"its":[73],"extensions":[74],"unsupervised":[76],"they":[78],"aren't":[79],"defined":[80],"make":[82],"efficient":[83],"use":[84],"user's":[87],"prior":[88],"knowledge":[89,114],"domain.":[92],"To":[93],"this":[94,153],"end,":[95],"we":[96,137],"propose":[97],"Keyword":[99],"Assisted":[100],"(KeyETM),":[104],"which":[105],"equips":[106],"ETM":[107],"with":[108],"ability":[110],"incorporate":[112],"user":[113],"form":[117],"informative":[119],"topic-level":[120],"priors":[121],"over":[122],"vocabulary.":[124],"Using":[125],"both":[126],"quantitative":[127],"metrics":[128],"human":[130],"responses":[131],"on":[132],"intrusion":[135],"task,":[136],"demonstrate":[138],"that":[139],"KeyETM":[140],"produces":[141],"better":[142],"topics":[143],"than":[144],"other":[145],"guided,":[146],"generative":[147],"literature\\footnoteCode":[151],"work":[154],"can":[155],"be":[156],"found":[157],"at":[158],"\\urlhttps://github.com/bahareharandizade/KeyETM":[159],".":[160]},"counts_by_year":[{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
