{"id":"https://openalex.org/W4389474103","doi":"https://doi.org/10.1109/tkde.2023.3340732","title":"A Clustering Framework for Unsupervised and Semi-Supervised New Intent Discovery","display_name":"A Clustering Framework for Unsupervised and Semi-Supervised New Intent Discovery","publication_year":2023,"publication_date":"2023-12-08","ids":{"openalex":"https://openalex.org/W4389474103","doi":"https://doi.org/10.1109/tkde.2023.3340732"},"language":"en","primary_location":{"id":"doi:10.1109/tkde.2023.3340732","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2023.3340732","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5020655643","display_name":"Hanlei Zhang","orcid":"https://orcid.org/0000-0003-3448-6793"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Hanlei Zhang","raw_affiliation_strings":["State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3448-6793","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086201515","display_name":"Hua Xu","orcid":"https://orcid.org/0000-0002-7401-307X"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hua Xu","raw_affiliation_strings":["State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-7401-307X","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092354460","display_name":"Xin Wang","orcid":"https://orcid.org/0000-0003-2709-9330"},"institutions":[{"id":"https://openalex.org/I34155123","display_name":"Hebei University of Science and Technology","ror":"https://ror.org/05h3pkk68","country_code":"CN","type":"education","lineage":["https://openalex.org/I34155123"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Wang","raw_affiliation_strings":["State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China","School of Information Science and Engineering, Hebei University of Science and Technology, Shijiazhuang, China"],"raw_orcid":"https://orcid.org/0000-0003-2709-9330","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]},{"raw_affiliation_string":"School of Information Science and Engineering, Hebei University of Science and Technology, Shijiazhuang, China","institution_ids":["https://openalex.org/I34155123"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Fei Long","orcid":"https://orcid.org/0000-0002-2569-6396"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fei Long","raw_affiliation_strings":["State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2569-6396","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Intelligent Technology and Systems, Department of Computer Science and Technology, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049255470","display_name":"Kai Gao","orcid":"https://orcid.org/0000-0003-3713-6035"},"institutions":[{"id":"https://openalex.org/I34155123","display_name":"Hebei University of Science and Technology","ror":"https://ror.org/05h3pkk68","country_code":"CN","type":"education","lineage":["https://openalex.org/I34155123"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kai Gao","raw_affiliation_strings":["School of Information Science and Engineering, Hebei University of Science and Technology, Shijiazhuang, Hebei, China"],"raw_orcid":"https://orcid.org/0000-0003-3713-6035","affiliations":[{"raw_affiliation_string":"School of Information Science and Engineering, Hebei University of Science and Technology, Shijiazhuang, Hebei, China","institution_ids":["https://openalex.org/I34155123"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5020655643"],"corresponding_institution_ids":["https://openalex.org/I99065089"],"apc_list":null,"apc_paid":null,"fwci":3.0674,"has_fulltext":false,"cited_by_count":18,"citation_normalized_percentile":{"value":0.93213831,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"36","issue":"11","first_page":"5468","last_page":"5481"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9948999881744385,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7871338129043579},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7268014550209045},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.53817218542099},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5239210724830627},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.3547179102897644},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.14510896801948547}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7871338129043579},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7268014550209045},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.53817218542099},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5239210724830627},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.3547179102897644},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.14510896801948547}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tkde.2023.3340732","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2023.3340732","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W1516407653","https://openalex.org/W1992419399","https://openalex.org/W2020735245","https://openalex.org/W2040810017","https://openalex.org/W2096100960","https://openalex.org/W2153839362","https://openalex.org/W2222512263","https://openalex.org/W2250539671","https://openalex.org/W2251410829","https://openalex.org/W2779692282","https://openalex.org/W2883725317","https://openalex.org/W2897135094","https://openalex.org/W2919115771","https://openalex.org/W2963341956","https://openalex.org/W2970641574","https://openalex.org/W2979826702","https://openalex.org/W2986193249","https://openalex.org/W2990604239","https://openalex.org/W2991537901","https://openalex.org/W2997574889","https://openalex.org/W2997591727","https://openalex.org/W2998721586","https://openalex.org/W3034576826","https://openalex.org/W3045492832","https://openalex.org/W3087124270","https://openalex.org/W3110446398","https://openalex.org/W3112240880","https://openalex.org/W3119242082","https://openalex.org/W3156636935","https://openalex.org/W3171153522","https://openalex.org/W3173488222","https://openalex.org/W3174620475","https://openalex.org/W3175562757","https://openalex.org/W3188188945","https://openalex.org/W4214687390","https://openalex.org/W4214872590","https://openalex.org/W4221161865","https://openalex.org/W4281719801","https://openalex.org/W4284968770","https://openalex.org/W4287855190","https://openalex.org/W4290877706","https://openalex.org/W4304080418","https://openalex.org/W4312281441","https://openalex.org/W4362714661","https://openalex.org/W4400315096","https://openalex.org/W6668990524","https://openalex.org/W6678914141","https://openalex.org/W6679849079","https://openalex.org/W6681096077","https://openalex.org/W6682962330","https://openalex.org/W6685380521","https://openalex.org/W6728550200","https://openalex.org/W6745901624","https://openalex.org/W6757817989","https://openalex.org/W6758241014","https://openalex.org/W6771518190","https://openalex.org/W6776700526","https://openalex.org/W6779997284","https://openalex.org/W6810927799"],"related_works":["https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2382290278","https://openalex.org/W2350741829","https://openalex.org/W2130043461","https://openalex.org/W2530322880"],"abstract_inverted_index":{"New":[0],"intent":[1,181,192],"discovery":[2,193],"is":[3,46],"of":[4,16,33,43,90,118,170],"great":[5],"value":[6],"to":[7,28,95,114,140],"natural":[8],"language":[9],"processing,":[10],"allowing":[11],"for":[12,59,105,127,158],"a":[13,54,110],"better":[14],"understanding":[15],"user":[17],"needs":[18],"and":[19,64,101,122,149,189,194],"providing":[20],"friendly":[21],"services.":[22],"However,":[23],"most":[24],"existing":[25],"methods":[26],"struggle":[27],"capture":[29],"the":[30,116,160,168],"complicated":[31],"semantics":[32,134],"discrete":[34],"text":[35],"representations":[36,104],"when":[37],"limited":[38],"or":[39,92,137],"no":[40],"prior":[41],"knowledge":[42],"labeled":[44],"data":[45,94,139],"available.":[47],"To":[48],"tackle":[49],"this":[50],"problem,":[51],"we":[52],"propose":[53,154],"novel":[55],"clustering":[56,112],"framework,":[57],"USNID,":[58],"<bold":[60,65,69,73,77],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[61,66,70,74,78],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">u</b>":[62],"nsupervised":[63],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">s</b>":[67],"emi-supervised":[68],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">n</b>":[71],"ew":[72],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">i</b>":[75],"ntent":[76],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">d</b>":[79],"iscovery,":[80],"which":[81],"has":[82],"three":[83],"key":[84],"technologies.":[85],"First,":[86],"it":[87,108,131],"fully":[88],"utilizes":[89],"unsupervised":[91,136,188],"semi-supervised":[93,138,190],"mine":[96],"shallow":[97],"semantic":[98],"similarity":[99],"relations":[100],"provide":[102,123],"well-initialized":[103],"clustering.":[106],"Second,":[107],"designs":[109],"centroid-guided":[111],"mechanism":[113],"address":[115],"issue":[117],"cluster":[119,161,200],"allocation":[120],"inconsistency":[121],"high-quality":[124],"self-supervised":[125],"targets":[126],"representation":[128],"learning.":[129],"Third,":[130],"captures":[132],"high-level":[133],"in":[135,163,187],"discover":[141],"fine-grained":[142],"intent-wise":[143],"clusters":[144],"by":[145],"optimizing":[146],"both":[147],"cluster-level":[148],"instance-level":[150],"objectives.":[151],"We":[152],"also":[153],"an":[155],"effective":[156],"method":[157],"estimating":[159],"number":[162,169],"open-world":[164],"scenarios":[165],"without":[166],"knowing":[167],"new":[171,184,191],"intents":[172],"beforehand.":[173],"USNID":[174],"performs":[175],"exceptionally":[176],"well":[177],"on":[178],"several":[179],"benchmark":[180],"datasets,":[182],"achieving":[183],"state-of-the-art":[185],"results":[186],"demonstrating":[195],"robust":[196],"performance":[197],"with":[198],"different":[199],"numbers.":[201]},"counts_by_year":[{"year":2026,"cited_by_count":6},{"year":2025,"cited_by_count":7},{"year":2024,"cited_by_count":5}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
