{"id":"https://openalex.org/W4205601495","doi":"https://doi.org/10.1109/acit53391.2021.9677217","title":"Unsupervised Topic Aware Document-Level Semantic Representation for Document Clustering","display_name":"Unsupervised Topic Aware Document-Level Semantic Representation for Document Clustering","publication_year":2021,"publication_date":"2021-12-21","ids":{"openalex":"https://openalex.org/W4205601495","doi":"https://doi.org/10.1109/acit53391.2021.9677217"},"language":"en","primary_location":{"id":"doi:10.1109/acit53391.2021.9677217","is_oa":false,"landing_page_url":"https://doi.org/10.1109/acit53391.2021.9677217","pdf_url":null,"source":{"id":"https://openalex.org/S4363608487","display_name":"2021 22nd International Arab Conference on Information Technology (ACIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 22nd International Arab Conference on Information Technology (ACIT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086471874","display_name":"Muhammad Rafi","orcid":"https://orcid.org/0000-0002-3673-5979"},"institutions":[{"id":"https://openalex.org/I201384688","display_name":"National University of Computer and Emerging Sciences","ror":"https://ror.org/003eyb898","country_code":"PK","type":"education","lineage":["https://openalex.org/I201384688"]}],"countries":["PK"],"is_corresponding":true,"raw_author_name":"Muhammad Rafi","raw_affiliation_strings":["FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan"],"affiliations":[{"raw_affiliation_string":"FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","institution_ids":["https://openalex.org/I201384688"]},{"raw_affiliation_string":"School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan","institution_ids":["https://openalex.org/I201384688"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085291131","display_name":"Hamza Khan","orcid":"https://orcid.org/0000-0001-6165-4479"},"institutions":[{"id":"https://openalex.org/I201384688","display_name":"National University of Computer and Emerging Sciences","ror":"https://ror.org/003eyb898","country_code":"PK","type":"education","lineage":["https://openalex.org/I201384688"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Hamza Khan","raw_affiliation_strings":["FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan"],"affiliations":[{"raw_affiliation_string":"FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","institution_ids":["https://openalex.org/I201384688"]},{"raw_affiliation_string":"School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan","institution_ids":["https://openalex.org/I201384688"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056906830","display_name":"Haya Nadeem","orcid":null},"institutions":[{"id":"https://openalex.org/I201384688","display_name":"National University of Computer and Emerging Sciences","ror":"https://ror.org/003eyb898","country_code":"PK","type":"education","lineage":["https://openalex.org/I201384688"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Haya Nadeem","raw_affiliation_strings":["FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan"],"affiliations":[{"raw_affiliation_string":"FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","institution_ids":["https://openalex.org/I201384688"]},{"raw_affiliation_string":"School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan","institution_ids":["https://openalex.org/I201384688"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112727570","display_name":"H. Muhammad Shakeel","orcid":null},"institutions":[{"id":"https://openalex.org/I201384688","display_name":"National University of Computer and Emerging Sciences","ror":"https://ror.org/003eyb898","country_code":"PK","type":"education","lineage":["https://openalex.org/I201384688"]}],"countries":["PK"],"is_corresponding":false,"raw_author_name":"Hassan Shakeel","raw_affiliation_strings":["FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan"],"affiliations":[{"raw_affiliation_string":"FAST National University of Computer and Emerging Sciences,School of Computing,Karachi,Pakistan","institution_ids":["https://openalex.org/I201384688"]},{"raw_affiliation_string":"School of Computing, FAST National University of Computer and Emerging Sciences, Karachi, Pakistan","institution_ids":["https://openalex.org/I201384688"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5086471874"],"corresponding_institution_ids":["https://openalex.org/I201384688"],"apc_list":null,"apc_paid":null,"fwci":0.377,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.60871191,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"10"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/document-clustering","display_name":"Document clustering","score":0.8627236485481262},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8390467762947083},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7998071908950806},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.6165059208869934},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5565191507339478},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5366033911705017},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.5235124230384827},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.48624029755592346},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.46541452407836914},{"id":"https://openalex.org/keywords/document-retrieval","display_name":"Document retrieval","score":0.43105459213256836}],"concepts":[{"id":"https://openalex.org/C177937566","wikidata":"https://www.wikidata.org/wiki/Q4223102","display_name":"Document clustering","level":3,"score":0.8627236485481262},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8390467762947083},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7998071908950806},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.6165059208869934},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5565191507339478},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5366033911705017},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.5235124230384827},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.48624029755592346},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.46541452407836914},{"id":"https://openalex.org/C161156560","wikidata":"https://www.wikidata.org/wiki/Q1638872","display_name":"Document retrieval","level":2,"score":0.43105459213256836},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/acit53391.2021.9677217","is_oa":false,"landing_page_url":"https://doi.org/10.1109/acit53391.2021.9677217","pdf_url":null,"source":{"id":"https://openalex.org/S4363608487","display_name":"2021 22nd International Arab Conference on Information Technology (ACIT)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2021 22nd International Arab Conference on Information Technology (ACIT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.75,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W130742730","https://openalex.org/W1493526108","https://openalex.org/W1970544520","https://openalex.org/W1996640618","https://openalex.org/W2058990119","https://openalex.org/W2103986443","https://openalex.org/W2116031377","https://openalex.org/W2158997610","https://openalex.org/W2165612380","https://openalex.org/W2562566938","https://openalex.org/W2946185384","https://openalex.org/W2958504338","https://openalex.org/W4233135949","https://openalex.org/W6605363618"],"related_works":["https://openalex.org/W2019737068","https://openalex.org/W2899601636","https://openalex.org/W4254379378","https://openalex.org/W3015674157","https://openalex.org/W4206655101","https://openalex.org/W4237592971","https://openalex.org/W2387982377","https://openalex.org/W2145036943","https://openalex.org/W2000031603","https://openalex.org/W2102270039"],"abstract_inverted_index":{"Text":[0],"representation":[1,92,106,116,163],"is":[2,58,81,159,173],"critical":[3],"for":[4,94,113],"a":[5,27,33,59,102],"lot":[6,28],"of":[7,21,29,45,50,74,140,156],"applications":[8],"in":[9,23,26,32,62,66],"natural/computational":[10],"language":[11,68],"processing":[12],"and":[13,48,100,131,142,151,171,177],"understanding.":[14],"Textual":[15],"documents":[16,64],"are":[17,38,69,169],"the":[18,43,46,51,54,90,128],"basic":[19,129],"unit":[20],"communication":[22],"written/typed":[24],"form,":[25],"practical":[30],"settings":[31],"human":[34,67],"work":[35],"environment.":[36],"Humans":[37],"very":[39,82],"good":[40],"at":[41],"understanding":[42],"purpose":[44],"document":[47,85,91,97,105,115,152,157],"comprehension":[49],"semantics":[52,99],"from":[53,127],"document.":[55],"Document":[56,78],"clustering":[57,61,79,158,172,179],"specialized":[60],"which":[63],"written":[65],"automatically":[70],"partitioned":[71],"into":[72],"groups(clusters)":[73],"distinguishable":[75],"sub":[76],"collection.":[77],"process":[80],"sensitive":[83],"to":[84,134,161],"representation.":[86],"This":[87],"paper":[88],"investigates":[89],"models":[93],"succinctly":[95],"representing":[96],"level":[98],"employs":[101],"topic":[103],"aware":[104],"approach.":[107],"It":[108],"suggests":[109],"several":[110],"desirable":[111],"features":[112],"effective":[114],"(i)":[117],"it":[118,124],"should":[119,125],"capture":[120],"word-to-word":[121],"relationship,":[122],"(ii)":[123],"derive":[126],"words":[130],"their":[132],"relation":[133],"form":[135],"topic-units":[136,150],"(a":[137],"larger":[138],"composition":[139],"words)":[141],"(iii)":[143],"feature":[144],"\u2013weighting":[145],"scheme":[146],"based":[147],"on":[148,175],"frequent":[149],"correlation.":[153],"The":[154],"task":[155],"used":[160,170],"evaluate":[162],"schemes.":[164],"Standard":[165],"text":[166],"mining":[167],"datasets":[168],"evaluated":[174],"internal":[176],"external":[178],"evaluation":[180],"measures.":[181]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2021,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
