{"id":"https://openalex.org/W3004119480","doi":"https://doi.org/10.1145/3366423.3380278","title":"Discriminative Topic Mining via Category-Name Guided Text Embedding","display_name":"Discriminative Topic Mining via Category-Name Guided Text Embedding","publication_year":2020,"publication_date":"2020-04-20","ids":{"openalex":"https://openalex.org/W3004119480","doi":"https://doi.org/10.1145/3366423.3380278","mag":"3004119480"},"language":"en","primary_location":{"id":"doi:10.1145/3366423.3380278","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380278","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3366423.3380278","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100770786","display_name":"Meng Yu","orcid":"https://orcid.org/0000-0003-2554-2888"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yu Meng","raw_affiliation_strings":["University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046688345","display_name":"Jiaxin Huang","orcid":"https://orcid.org/0000-0001-8095-3343"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiaxin Huang","raw_affiliation_strings":["University of Illinois Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101451274","display_name":"Guangyuan Wang","orcid":"https://orcid.org/0009-0007-2388-0716"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Guangyuan Wang","raw_affiliation_strings":["University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100380104","display_name":"Zihan Wang","orcid":"https://orcid.org/0000-0002-8964-9046"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zihan Wang","raw_affiliation_strings":["University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100460272","display_name":"Chao Zhang","orcid":"https://orcid.org/0000-0003-3009-598X"},"institutions":[{"id":"https://openalex.org/I130701444","display_name":"Georgia Institute of Technology","ror":"https://ror.org/01zkghx44","country_code":"US","type":"education","lineage":["https://openalex.org/I130701444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Chao Zhang","raw_affiliation_strings":["Georgia Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Georgia Institute of Technology","institution_ids":["https://openalex.org/I130701444"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003837744","display_name":"Yu Zhang","orcid":"https://orcid.org/0000-0003-0540-6758"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yu Zhang","raw_affiliation_strings":["University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5019539533","display_name":"Jiawei Han","orcid":"https://orcid.org/0000-0002-3629-2696"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiawei Han","raw_affiliation_strings":["University of Illinois at Urbana-Champaign"],"affiliations":[{"raw_affiliation_string":"University of Illinois at Urbana-Champaign","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100770786"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":7.63669652,"has_fulltext":false,"cited_by_count":63,"citation_normalized_percentile":{"value":0.97466165,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2121","last_page":"2132"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9929999709129333,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.7015987038612366},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.691625714302063},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5506441593170166},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.5044974088668823},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4926632046699524},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.47563695907592773}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.7015987038612366},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.691625714302063},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5506441593170166},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.5044974088668823},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4926632046699524},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.47563695907592773}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3366423.3380278","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380278","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1908.07162","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1908.07162","pdf_url":"https://arxiv.org/pdf/1908.07162","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3366423.3380278","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380278","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7599999904632568,"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":88,"referenced_works":["https://openalex.org/W56136284","https://openalex.org/W1506246224","https://openalex.org/W1615991656","https://openalex.org/W1788582768","https://openalex.org/W1832693441","https://openalex.org/W1880262756","https://openalex.org/W1966907789","https://openalex.org/W1969486090","https://openalex.org/W2042980227","https://openalex.org/W2048330531","https://openalex.org/W2050451500","https://openalex.org/W2074909580","https://openalex.org/W2098062695","https://openalex.org/W2106490775","https://openalex.org/W2107743791","https://openalex.org/W2108281845","https://openalex.org/W2112050062","https://openalex.org/W2113855231","https://openalex.org/W2122683976","https://openalex.org/W2132001515","https://openalex.org/W2132827946","https://openalex.org/W2133413932","https://openalex.org/W2135964261","https://openalex.org/W2140124448","https://openalex.org/W2145658888","https://openalex.org/W2164019165","https://openalex.org/W2168717408","https://openalex.org/W2178725228","https://openalex.org/W2187089797","https://openalex.org/W2238728730","https://openalex.org/W2250533720","https://openalex.org/W2250539671","https://openalex.org/W2250753706","https://openalex.org/W2250930514","https://openalex.org/W2251981022","https://openalex.org/W2285986798","https://openalex.org/W2286496058","https://openalex.org/W2294774419","https://openalex.org/W2296283641","https://openalex.org/W2470673105","https://openalex.org/W2493916176","https://openalex.org/W2517063656","https://openalex.org/W2519468206","https://openalex.org/W2585828887","https://openalex.org/W2593560537","https://openalex.org/W2618798060","https://openalex.org/W2626778328","https://openalex.org/W2738508272","https://openalex.org/W2744007523","https://openalex.org/W2753171404","https://openalex.org/W2787560479","https://openalex.org/W2796314760","https://openalex.org/W2804622816","https://openalex.org/W2883559670","https://openalex.org/W2890332877","https://openalex.org/W2890931111","https://openalex.org/W2895817984","https://openalex.org/W2896457183","https://openalex.org/W2912651257","https://openalex.org/W2949300694","https://openalex.org/W2949679478","https://openalex.org/W2950069681","https://openalex.org/W2950133940","https://openalex.org/W2961152326","https://openalex.org/W2962936818","https://openalex.org/W2963413667","https://openalex.org/W2963639153","https://openalex.org/W2963766892","https://openalex.org/W2963841265","https://openalex.org/W2963912736","https://openalex.org/W2964117810","https://openalex.org/W2964301648","https://openalex.org/W2964311827","https://openalex.org/W2971324494","https://openalex.org/W2986039727","https://openalex.org/W3003661976","https://openalex.org/W3004011066","https://openalex.org/W3045464143","https://openalex.org/W3101606352","https://openalex.org/W3102679845","https://openalex.org/W3104717349","https://openalex.org/W3158986179","https://openalex.org/W4231510805","https://openalex.org/W4233135949","https://openalex.org/W4294170691","https://openalex.org/W4295111765","https://openalex.org/W4295112348","https://openalex.org/W4385245566"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W2761785940","https://openalex.org/W2110523656","https://openalex.org/W1482209366","https://openalex.org/W3204019825"],"abstract_inverted_index":{"Mining":[0],"a":[1,23,47,55,74,97,116,131,152],"set":[2,56,133,142],"of":[3,57,134,143,154],"meaningful":[4],"and":[5,38,78,120,150,160],"distinctive":[6],"topics":[7,30,64,81,144],"automatically":[8],"from":[9,65],"massive":[10],"text":[11,66,101],"corpora":[12],"has":[13],"broad":[14],"applications.":[15],"Existing":[16],"topic":[17,51,106],"models,":[18],"however,":[19],"typically":[20],"work":[21],"in":[22,125],"purely":[24],"unsupervised":[25],"way,":[26],"which":[27,53,108],"often":[28],"generate":[29],"that":[31,138],"do":[32],"not":[33,71],"fit":[34],"users'":[35],"particular":[36],"needs":[37],"yield":[39],"suboptimal":[40],"performance":[41],"on":[42],"downstream":[43,155],"tasks.":[44,93],"We":[45,94,129],"propose":[46],"new":[48,69],"task,":[49],"discriminative":[50,63,105,117],"mining,":[52,107],"leverages":[54,110],"user-provided":[58],"category":[59,122,147],"names":[60,148],"to":[61,114,136],"mine":[62],"corpora.":[67],"This":[68],"task":[70],"only":[72],"helps":[73],"user":[75,112],"understand":[76],"clearly":[77],"distinctively":[79],"the":[80],"he/she":[82],"is":[83],"most":[84],"interested":[85],"in,":[86],"but":[87],"also":[88],"benefits":[89,151],"directly":[90],"keyword-driven":[91],"classification":[92,159],"develop":[95],"CatE,":[96],"novel":[98],"category-name":[99],"guided":[100,145],"embedding":[102,118],"method":[103],"for":[104],"effectively":[109],"minimal":[111],"guidance":[113],"learn":[115],"space":[119],"discover":[121],"representative":[123],"terms":[124],"an":[126],"iterative":[127],"manner.":[128],"conduct":[130],"comprehensive":[132],"experiments":[135],"show":[137],"CatE":[139],"mines":[140],"high-quality":[141],"by":[146],"only,":[149],"variety":[153],"applications":[156],"including":[157],"weakly-supervised":[158],"lexical":[161],"entailment":[162],"direction":[163],"identification.":[164]},"counts_by_year":[{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":14},{"year":2022,"cited_by_count":15},{"year":2021,"cited_by_count":8},{"year":2020,"cited_by_count":15}],"updated_date":"2026-02-09T09:26:11.010843","created_date":"2025-10-10T00:00:00"}
