{"id":"https://openalex.org/W2564359861","doi":"https://doi.org/10.1145/2996890.3007856","title":"Multi-level topical text categorization with wikipedia","display_name":"Multi-level topical text categorization with wikipedia","publication_year":2016,"publication_date":"2016-12-06","ids":{"openalex":"https://openalex.org/W2564359861","doi":"https://doi.org/10.1145/2996890.3007856","mag":"2564359861"},"language":"en","primary_location":{"id":"doi:10.1145/2996890.3007856","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2996890.3007856","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th International Conference on Utility and Cloud Computing","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101916247","display_name":"Nan Guo","orcid":"https://orcid.org/0000-0002-2124-371X"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Nan Guo","raw_affiliation_strings":["Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102025805","display_name":"Yuan He","orcid":"https://orcid.org/0000-0001-8462-3907"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuan He","raw_affiliation_strings":["Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101015946","display_name":"Chungang Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"ChunGang Yan","raw_affiliation_strings":["Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002822427","display_name":"Lu Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I22128151","display_name":"University of Derby","ror":"https://ror.org/02yhrrk59","country_code":"GB","type":"education","lineage":["https://openalex.org/I22128151"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Lu Liu","raw_affiliation_strings":["University of Derby, UK"],"affiliations":[{"raw_affiliation_string":"University of Derby, UK","institution_ids":["https://openalex.org/I22128151"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100417007","display_name":"Cheng Wang","orcid":"https://orcid.org/0000-0002-4752-0316"},"institutions":[{"id":"https://openalex.org/I116953780","display_name":"Tongji University","ror":"https://ror.org/03rc6as71","country_code":"CN","type":"education","lineage":["https://openalex.org/I116953780"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cheng Wang","raw_affiliation_strings":["Tongji University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tongji University, Shanghai, China","institution_ids":["https://openalex.org/I116953780"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101916247"],"corresponding_institution_ids":["https://openalex.org/I116953780"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.09043717,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":"2","issue":null,"first_page":"343","last_page":"352"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9940999746322632,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.79332435131073},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.7924861907958984},{"id":"https://openalex.org/keywords/latent-dirichlet-allocation","display_name":"Latent Dirichlet allocation","score":0.702507734298706},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.6683405637741089},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.617678165435791},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.584119439125061},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.5792409777641296},{"id":"https://openalex.org/keywords/text-categorization","display_name":"Text categorization","score":0.558770477771759},{"id":"https://openalex.org/keywords/ambiguity","display_name":"Ambiguity","score":0.516644299030304},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5162160992622375},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.48747777938842773},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.34031474590301514}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.79332435131073},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.7924861907958984},{"id":"https://openalex.org/C500882744","wikidata":"https://www.wikidata.org/wiki/Q269236","display_name":"Latent Dirichlet allocation","level":3,"score":0.702507734298706},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.6683405637741089},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.617678165435791},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.584119439125061},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.5792409777641296},{"id":"https://openalex.org/C2986744138","wikidata":"https://www.wikidata.org/wiki/Q302088","display_name":"Text categorization","level":3,"score":0.558770477771759},{"id":"https://openalex.org/C2780522230","wikidata":"https://www.wikidata.org/wiki/Q1140419","display_name":"Ambiguity","level":2,"score":0.516644299030304},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5162160992622375},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.48747777938842773},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34031474590301514},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2996890.3007856","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2996890.3007856","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 9th International Conference on Utility and Cloud Computing","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7300000190734863}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W1598700880","https://openalex.org/W1817561967","https://openalex.org/W1878153963","https://openalex.org/W1880262756","https://openalex.org/W1961157042","https://openalex.org/W1969572066","https://openalex.org/W1986913017","https://openalex.org/W1993715838","https://openalex.org/W1997698702","https://openalex.org/W2005422315","https://openalex.org/W2006279708","https://openalex.org/W2022679416","https://openalex.org/W2042037135","https://openalex.org/W2042200090","https://openalex.org/W2044185127","https://openalex.org/W2044854172","https://openalex.org/W2046677795","https://openalex.org/W2049260684","https://openalex.org/W2090288396","https://openalex.org/W2096152098","https://openalex.org/W2097089247","https://openalex.org/W2099938389","https://openalex.org/W2100341149","https://openalex.org/W2107008379","https://openalex.org/W2114535528","https://openalex.org/W2116235440","https://openalex.org/W2122382209","https://openalex.org/W2123817815","https://openalex.org/W2131904035","https://openalex.org/W2142515059","https://openalex.org/W2166183437","https://openalex.org/W2168471263","https://openalex.org/W2169606435","https://openalex.org/W2316929664","https://openalex.org/W2365105281","https://openalex.org/W2390100100","https://openalex.org/W3001753394","https://openalex.org/W4298173534","https://openalex.org/W4399461173","https://openalex.org/W6679539681","https://openalex.org/W6684872003"],"related_works":["https://openalex.org/W2888805565","https://openalex.org/W4312773271","https://openalex.org/W4315588616","https://openalex.org/W2769501189","https://openalex.org/W2962686197","https://openalex.org/W2207653751","https://openalex.org/W4293863151","https://openalex.org/W3159709618","https://openalex.org/W2611137333","https://openalex.org/W3005513013"],"abstract_inverted_index":{"This":[0,56],"paper":[1,57],"introduces":[2],"an":[3,59],"automatic":[4],"categorical-marking":[5],"model":[6,65,74,129,186],"for":[7,21],"text":[8,44,114],"categorization.":[9],"Traditional":[10],"classification":[11,189],"algorithms":[12,46],"are":[13,96,123,139],"generally":[14],"applying":[15],"labeled":[16],"training":[17],"set":[18],"and":[19,36,52,62,81,87,110,143,162,168,192],"call":[20],"a":[22,118,126],"lot":[23],"of":[24,38,42,84,148,165,173,181],"manual":[25],"work":[26],"to":[27,33,75,78,90,99,106,141],"tag":[28],"classifications":[29,157],"beforehand.":[30],"Also":[31],"due":[32],"the":[34,40,136,146,152,155,160,166,174],"ambiguity":[35],"fuzziness":[37],"texts,":[39],"results":[41,95,177],"traditional":[43,113,197],"categorization":[45,64,115],"may":[47],"not":[48,97],"be":[49],"clear":[50],"enough":[51],"abundant":[53],"in":[54,188],"content.":[55],"presents":[58],"unsupervised,":[60],"training-set-free":[61],"hierarchical":[63,92],"called":[66,130],"Folk-Topical":[67],"Text":[68],"Categorization":[69],"(FTTC).":[70],"FTTC":[71],"applies":[72],"topic":[73,128],"abstract":[76],"documents":[77],"topical":[79,121,137],"words":[80,122,138],"make":[82],"use":[83],"Wikipedia's":[85],"crowd-sourcing":[86],"collective":[88],"control":[89],"extend":[91],"classifications.":[93],"The":[94],"restricted":[98],"predefined":[100],"categories":[101,104],"but":[102],"contain":[103],"abstracted":[105],"deeper":[107],"semantic":[108],"levels":[109],"greatly":[111],"facilitate":[112],"applications.":[116],"For":[117],"document,":[119],"its":[120],"obtained":[124],"using":[125],"popular":[127],"Latent":[131],"Dirichlet":[132],"Allocation":[133],"(LDA).":[134],"Afterwards,":[135],"used":[140],"build":[142],"trace":[144],"through":[145],"category-trees":[147],"Wikipedia.":[149],"Based":[150],"on":[151,178],"filtered":[153],"results,":[154],"final":[156],"comprehensively":[158],"reflect":[159],"diversified":[161],"content-rich":[163],"information":[164],"text,":[167],"fully":[169],"cover":[170],"different":[171,179],"aspects":[172],"text.":[175],"Experimental":[176],"kinds":[180],"datasets":[182],"show":[183],"that":[184],"our":[185],"advances":[187],"accuracy,":[190],"flexibility":[191],"intelligibility,":[193],"as":[194],"compared":[195],"with":[196],"models.":[198]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
