{"id":"https://openalex.org/W2904614016","doi":"https://doi.org/10.1145/3238250","title":"Seed-Guided Topic Model for Document Filtering and Classification","display_name":"Seed-Guided Topic Model for Document Filtering and Classification","publication_year":2018,"publication_date":"2018-12-06","ids":{"openalex":"https://openalex.org/W2904614016","doi":"https://doi.org/10.1145/3238250","mag":"2904614016"},"language":"en","primary_location":{"id":"doi:10.1145/3238250","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3238250","pdf_url":null,"source":{"id":"https://openalex.org/S4394735545","display_name":"ACM Transactions on Information Systems","issn_l":"1046-8188","issn":["1046-8188","1558-2868"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Information Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://dr.ntu.edu.sg/bitstream/10356/142845/2/Seed-guided%20topic%20model%20for%20document%20filtering%20and%20classification.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100734069","display_name":"Chenliang Li","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chenliang Li","raw_affiliation_strings":["Wuhan University, Wuhan, Hubei, China"],"affiliations":[{"raw_affiliation_string":"Wuhan University, Wuhan, Hubei, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012774122","display_name":"Shiqian Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiqian Chen","raw_affiliation_strings":["Wuhan University, Wuhan, Hubei, China"],"affiliations":[{"raw_affiliation_string":"Wuhan University, Wuhan, Hubei, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016171393","display_name":"Jian Xing","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jian Xing","raw_affiliation_strings":["Hithink RoyalFlush Information Network Co., Ltd, China"],"affiliations":[{"raw_affiliation_string":"Hithink RoyalFlush Information Network Co., Ltd, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100618738","display_name":"Aixin Sun","orcid":"https://orcid.org/0000-0003-0764-4258"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Aixin Sun","raw_affiliation_strings":["Nanyang technological University, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5008327536","display_name":"Zongyang Ma","orcid":"https://orcid.org/0009-0003-1980-9379"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zongyang Ma","raw_affiliation_strings":["Microsoft (China) Co., Ltd, Soochow, China"],"affiliations":[{"raw_affiliation_string":"Microsoft (China) Co., Ltd, Soochow, China","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5100734069"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":4.0617,"has_fulltext":true,"cited_by_count":42,"citation_normalized_percentile":{"value":0.95108978,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"37","issue":"1","first_page":"1","last_page":"37"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8224483132362366},{"id":"https://openalex.org/keywords/novelty","display_name":"Novelty","score":0.664941132068634},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.6343811750411987},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5811046361923218},{"id":"https://openalex.org/keywords/meaning","display_name":"Meaning (existential)","score":0.5765601396560669},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5692384243011475},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5353975892066956},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.529328465461731},{"id":"https://openalex.org/keywords/topic-model","display_name":"Topic model","score":0.519388735294342},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4592589735984802},{"id":"https://openalex.org/keywords/word","display_name":"Word (group theory)","score":0.43724897503852844},{"id":"https://openalex.org/keywords/stop-words","display_name":"Stop words","score":0.41186216473579407},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.14053210616111755}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8224483132362366},{"id":"https://openalex.org/C2778738651","wikidata":"https://www.wikidata.org/wiki/Q16546687","display_name":"Novelty","level":2,"score":0.664941132068634},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.6343811750411987},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5811046361923218},{"id":"https://openalex.org/C2780876879","wikidata":"https://www.wikidata.org/wiki/Q3054749","display_name":"Meaning (existential)","level":2,"score":0.5765601396560669},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5692384243011475},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5353975892066956},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.529328465461731},{"id":"https://openalex.org/C171686336","wikidata":"https://www.wikidata.org/wiki/Q3532085","display_name":"Topic model","level":2,"score":0.519388735294342},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4592589735984802},{"id":"https://openalex.org/C90805587","wikidata":"https://www.wikidata.org/wiki/Q10944557","display_name":"Word (group theory)","level":2,"score":0.43724897503852844},{"id":"https://openalex.org/C188338183","wikidata":"https://www.wikidata.org/wiki/Q80735","display_name":"Stop words","level":3,"score":0.41186216473579407},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.14053210616111755},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.0},{"id":"https://openalex.org/C542102704","wikidata":"https://www.wikidata.org/wiki/Q183257","display_name":"Psychotherapist","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3238250","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3238250","pdf_url":null,"source":{"id":"https://openalex.org/S4394735545","display_name":"ACM Transactions on Information Systems","issn_l":"1046-8188","issn":["1046-8188","1558-2868"],"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM Transactions on Information Systems","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/142845","is_oa":true,"landing_page_url":"https://hdl.handle.net/10356/142845","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/142845/2/Seed-guided%20topic%20model%20for%20document%20filtering%20and%20classification.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"}],"best_oa_location":{"id":"pmh:oai:dr.ntu.edu.sg:10356/142845","is_oa":true,"landing_page_url":"https://hdl.handle.net/10356/142845","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/142845/2/Seed-guided%20topic%20model%20for%20document%20filtering%20and%20classification.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","score":0.4699999988079071,"display_name":"Partnerships for the goals"}],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2802911279","display_name":null,"funder_award_id":"Young","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2870525900","display_name":null,"funder_award_id":"Wuhan","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5525282449","display_name":null,"funder_award_id":"201601","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6058138561","display_name":null,"funder_award_id":", No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6181681409","display_name":null,"funder_award_id":"2017CFB502","funder_id":"https://openalex.org/F4320322186","funder_display_name":"Natural Science Foundation of Hubei Province"},{"id":"https://openalex.org/G6804958431","display_name":null,"funder_award_id":"Wuhan","funder_id":"https://openalex.org/F4320322186","funder_display_name":"Natural Science Foundation of Hubei Province"},{"id":"https://openalex.org/G6904163575","display_name":null,"funder_award_id":"2042017kf0225","funder_id":"https://openalex.org/F4320324116","funder_display_name":"Wuhan University"},{"id":"https://openalex.org/G6933957087","display_name":null,"funder_award_id":"2016012","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7050358598","display_name":null,"funder_award_id":"61502344","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322186","display_name":"Natural Science Foundation of Hubei Province","ror":null},{"id":"https://openalex.org/F4320322724","display_name":"Ministry of Education, India","ror":"https://ror.org/048xjjh50"},{"id":"https://openalex.org/F4320324116","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2904614016.pdf","grobid_xml":"https://content.openalex.org/works/W2904614016.grobid-xml"},"referenced_works_count":50,"referenced_works":["https://openalex.org/W43037342","https://openalex.org/W265767496","https://openalex.org/W658020064","https://openalex.org/W746911252","https://openalex.org/W1506246224","https://openalex.org/W1532325895","https://openalex.org/W1598801360","https://openalex.org/W1609010894","https://openalex.org/W1628041482","https://openalex.org/W1880262756","https://openalex.org/W1995866178","https://openalex.org/W2001082470","https://openalex.org/W2026439336","https://openalex.org/W2035798593","https://openalex.org/W2065883328","https://openalex.org/W2069564398","https://openalex.org/W2083305840","https://openalex.org/W2092970348","https://openalex.org/W2097089247","https://openalex.org/W2098062695","https://openalex.org/W2101101940","https://openalex.org/W2103587173","https://openalex.org/W2107743791","https://openalex.org/W2108281845","https://openalex.org/W2113378307","https://openalex.org/W2120779048","https://openalex.org/W2125327503","https://openalex.org/W2127416213","https://openalex.org/W2128507180","https://openalex.org/W2129319055","https://openalex.org/W2130339025","https://openalex.org/W2133568543","https://openalex.org/W2137268161","https://openalex.org/W2145078771","https://openalex.org/W2145494108","https://openalex.org/W2147152072","https://openalex.org/W2150731624","https://openalex.org/W2152253130","https://openalex.org/W2158085718","https://openalex.org/W2166353350","https://openalex.org/W2171506566","https://openalex.org/W2270414365","https://openalex.org/W2285986798","https://openalex.org/W2340381866","https://openalex.org/W2507254902","https://openalex.org/W2533513334","https://openalex.org/W2745475103","https://openalex.org/W3005822403","https://openalex.org/W3138773240","https://openalex.org/W4233135949"],"related_works":["https://openalex.org/W2381242807","https://openalex.org/W2751208925","https://openalex.org/W3126131230","https://openalex.org/W2347541121","https://openalex.org/W4288804799","https://openalex.org/W2080951048","https://openalex.org/W3089617106","https://openalex.org/W3032237421","https://openalex.org/W2155531513","https://openalex.org/W2359738357"],"abstract_inverted_index":{"One":[0],"important":[1],"necessity":[2],"is":[3,36,167,204,220,249,311,340],"to":[4,45,62,120,313],"filter":[5],"out":[6,129],"the":[7,12,48,52,92,121,125,130,135,139,180,183,188,192,195,218,224,228,234,244,271,299,314,324,347,351,355,360],"irrelevant":[8,131],"information":[9,14],"and":[10,38,96,106,133,152,163,210,237,281],"organize":[11],"relevant":[13,71,119,136],"into":[15,138],"meaningful":[16],"categories.":[17],"However,":[18],"developing":[19],"text":[20,79,94,274,332],"classifiers":[21,275],"often":[22],"requires":[23],"a":[24,56,67,87,101,111,207,211,320],"large":[25],"number":[26],"of":[27,70,103,114,124,149,160,182,213,217,326,350],"labeled":[28],"documents":[29,35,53,64,132,137],"as":[30,77],"training":[31],"examples.":[32],"Manually":[33],"labeling":[34],"costly":[37],"time-consuming.":[39],"More":[40],"importantly,":[41],"it":[42,339],"becomes":[43],"unrealistic":[44],"know":[46],"all":[47],"categories":[49,141,185],"covered":[50,186],"by":[51,65,187,226],"beforehand.":[54],"Recently,":[55],"few":[57],"methods":[58],"have":[59],"been":[60],"proposed":[61],"label":[63],"using":[66,342],"small":[68,112],"set":[69,113],"keywords":[72],"for":[73,91,107,276,329,354],"each":[74,108,202],"category,":[75,126,172],"known":[76],"dataless":[78,93,273,331,361],"classification":[80,97,278,282,296,333,362],".":[81,154],"In":[82,285],"this":[83],"article,":[84],"we":[85,318],"propose":[86],"seed-guided":[88],"topic":[89,143],"model":[90,219],"filtering":[95,280],"(named":[98],"DFC).":[99],"Given":[100],"collection":[102],"unlabeled":[104],"documents,":[105],"specified":[109],"category":[110,357],"seed":[115,235,327,344,352],"words":[116,236,239,328,345,353],"that":[117,201,221,267,309,338,358],"are":[118,157],"semantic":[122,175,197],"meaning":[123],"DFC":[127,145,199,222,268,288,310],"filters":[128],"classifies":[134],"corresponding":[140,356],"through":[142],"influence.":[144],"models":[146],"two":[147,158,262],"kinds":[148,159],"topics:":[150],"category-topics":[151],"general-topics":[153,193],"Also,":[155],"there":[156],"category-topics:":[161],"relevant-topics":[162],"irrelevant-topics.":[164],"Each":[165],"relevant-topic":[166],"associated":[168,205],"with":[169,206,279],"one":[170],"specific":[171],"representing":[173],"its":[174,256],"meaning.":[176],"The":[177,335],"irrelevant-topics":[178],"represent":[179],"semantics":[181],"unknown":[184],"document":[189,203,245,248,348],"collection.":[190,246],"And":[191],"capture":[194],"global":[196],"information.":[198],"assumes":[200],"single":[208],"category-topic":[209,258],"mixture":[212],"general-topics.":[214],"A":[215,247],"novelty":[216],"learns":[223],"topics":[225],"exploiting":[227],"explicit":[229],"word":[230],"co-occurrence":[231],"patterns":[232],"between":[233],"regular":[238],"(i.e.,":[240],"non-seed":[241],"words)":[242],"in":[243],"then":[250],"filtered,":[251],"or":[252,293],"classified,":[253],"based":[254],"on":[255,261],"posterior":[257],"assignment.":[259],"Experiments":[260],"widely":[263],"used":[264],"datasets":[265],"show":[266,308],"consistently":[269],"outperforms":[270],"state-of-the-art":[272,300],"both":[277],"without":[283],"filtering.":[284],"many":[286],"tasks,":[287],"can":[289],"also":[290],"achieve":[291],"comparable":[292],"even":[294],"better":[295],"accuracy":[297],"than":[298],"supervised":[301],"learning":[302],"solutions.":[303],"Our":[304],"experimental":[305],"results":[306,336],"further":[307],"insensitive":[312],"tuning":[315],"parameters.":[316],"Moreover,":[317],"conduct":[319],"thorough":[321],"study":[322],"about":[323],"impact":[325],"existing":[330],"techniques.":[334],"reveal":[337],"not":[341],"more":[343],"but":[346],"coverage":[349],"affects":[359],"performance.":[363]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":4},{"year":2021,"cited_by_count":13},{"year":2020,"cited_by_count":10},{"year":2019,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
