{"id":"https://openalex.org/W2768631238","doi":"https://doi.org/10.1109/icci-cc.2017.8109735","title":"An improved KNN text classification algorithm based on Simhash","display_name":"An improved KNN text classification algorithm based on Simhash","publication_year":2017,"publication_date":"2017-07-01","ids":{"openalex":"https://openalex.org/W2768631238","doi":"https://doi.org/10.1109/icci-cc.2017.8109735","mag":"2768631238"},"language":"en","primary_location":{"id":"doi:10.1109/icci-cc.2017.8109735","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icci-cc.2017.8109735","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 16th International Conference on Cognitive Informatics &amp; Cognitive Computing (ICCI*CC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100454179","display_name":"Jie Liu","orcid":"https://orcid.org/0000-0003-0895-7598"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jie Liu","raw_affiliation_strings":["State Grid Sichuan Electric Power Company Information and Communications Branch"],"affiliations":[{"raw_affiliation_string":"State Grid Sichuan Electric Power Company Information and Communications Branch","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052636062","display_name":"Ting Jin","orcid":"https://orcid.org/0000-0002-0165-9021"},"institutions":[{"id":"https://openalex.org/I20942203","display_name":"Hainan University","ror":"https://ror.org/03q648j11","country_code":"CN","type":"education","lineage":["https://openalex.org/I20942203"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ting Jin","raw_affiliation_strings":["School of Information Science and Technology, HaiNan University"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Technology, HaiNan University","institution_ids":["https://openalex.org/I20942203"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5029772640","display_name":"Kejia Pan","orcid":"https://orcid.org/0000-0001-5768-7972"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kejia Pan","raw_affiliation_strings":["State Grid Sichuan Electric Power Company Information and Communications Branch"],"affiliations":[{"raw_affiliation_string":"State Grid Sichuan Electric Power Company Information and Communications Branch","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106743847","display_name":"Yi Yang","orcid":"https://orcid.org/0000-0001-9102-3678"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi Yang","raw_affiliation_strings":["State Grid Sichuan Electric Power Company Information and Communications Branch"],"affiliations":[{"raw_affiliation_string":"State Grid Sichuan Electric Power Company Information and Communications Branch","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086732099","display_name":"Wu Yan","orcid":"https://orcid.org/0000-0002-0488-6967"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yan Wu","raw_affiliation_strings":["State Grid Sichuan Electric Power Company Information and Communications Branch"],"affiliations":[{"raw_affiliation_string":"State Grid Sichuan Electric Power Company Information and Communications Branch","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100328059","display_name":"Xin Wang","orcid":"https://orcid.org/0000-0003-0203-9964"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xin Wang","raw_affiliation_strings":["Chengdu Duhang Technology Development Co., Ltd"],"affiliations":[{"raw_affiliation_string":"Chengdu Duhang Technology Development Co., Ltd","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100454179"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.1701,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.84600411,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"92","last_page":"95"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12016","display_name":"Web Data Mining and Analysis","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hamming-distance","display_name":"Hamming distance","score":0.7936646938323975},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7220996618270874},{"id":"https://openalex.org/keywords/hamming-code","display_name":"Hamming code","score":0.6594278216362},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.5801429748535156},{"id":"https://openalex.org/keywords/statistical-classification","display_name":"Statistical classification","score":0.5228815078735352},{"id":"https://openalex.org/keywords/value","display_name":"Value (mathematics)","score":0.5153753161430359},{"id":"https://openalex.org/keywords/k-nearest-neighbors-algorithm","display_name":"k-nearest neighbors algorithm","score":0.48119646310806274},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.48020872473716736},{"id":"https://openalex.org/keywords/precision-and-recall","display_name":"Precision and recall","score":0.4657725989818573},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4596113860607147},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.4487980604171753},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3772439956665039},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2024947702884674},{"id":"https://openalex.org/keywords/decoding-methods","display_name":"Decoding methods","score":0.09249001741409302}],"concepts":[{"id":"https://openalex.org/C193319292","wikidata":"https://www.wikidata.org/wiki/Q272172","display_name":"Hamming distance","level":2,"score":0.7936646938323975},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7220996618270874},{"id":"https://openalex.org/C73150493","wikidata":"https://www.wikidata.org/wiki/Q853922","display_name":"Hamming code","level":4,"score":0.6594278216362},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.5801429748535156},{"id":"https://openalex.org/C110083411","wikidata":"https://www.wikidata.org/wiki/Q1744628","display_name":"Statistical classification","level":2,"score":0.5228815078735352},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.5153753161430359},{"id":"https://openalex.org/C113238511","wikidata":"https://www.wikidata.org/wiki/Q1071612","display_name":"k-nearest neighbors algorithm","level":2,"score":0.48119646310806274},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.48020872473716736},{"id":"https://openalex.org/C81669768","wikidata":"https://www.wikidata.org/wiki/Q2359161","display_name":"Precision and recall","level":2,"score":0.4657725989818573},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4596113860607147},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4487980604171753},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3772439956665039},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2024947702884674},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.09249001741409302},{"id":"https://openalex.org/C157125643","wikidata":"https://www.wikidata.org/wiki/Q884707","display_name":"Block code","level":3,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icci-cc.2017.8109735","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icci-cc.2017.8109735","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2017 IEEE 16th International Conference on Cognitive Informatics &amp; Cognitive Computing (ICCI*CC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7799999713897705,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":12,"referenced_works":["https://openalex.org/W1528068634","https://openalex.org/W1587362683","https://openalex.org/W1625504505","https://openalex.org/W1978394996","https://openalex.org/W1993934121","https://openalex.org/W1994410331","https://openalex.org/W2044144232","https://openalex.org/W2107686700","https://openalex.org/W2145349611","https://openalex.org/W2149684865","https://openalex.org/W2355995786","https://openalex.org/W2391609022"],"related_works":["https://openalex.org/W2943247777","https://openalex.org/W2740543340","https://openalex.org/W2371167013","https://openalex.org/W1582340598","https://openalex.org/W1541021634","https://openalex.org/W2794545997","https://openalex.org/W2584980534","https://openalex.org/W2182731056","https://openalex.org/W66917582","https://openalex.org/W1600949677"],"abstract_inverted_index":{"An":[0],"improved":[1],"KNN":[2,42],"text":[3,43],"classification":[4,44],"algorithm":[5,52],"based":[6],"on":[7],"Simhash":[8,14],"has":[9],"been":[10],"proposed":[11,51,71],"by":[12,31],"introducing":[13],"and":[15,34,60],"the":[16,28,35,40,50,67,70],"average":[17],"Hamming":[18],"distance":[19],"of":[20,69],"adjacent":[21],"texts":[22],"as":[23],"a":[24,54,57,61],"unit,":[25],"which":[26,65],"solves":[27],"problems":[29],"caused":[30],"data":[32],"imbalance":[33],"large":[36],"computational":[37],"overhead":[38],"in":[39],"traditional":[41],"algorithms.":[45],"Experimental":[46],"results":[47],"demonstrate":[48],"that":[49],"performs":[53],"higher":[55,58],"precision,":[56],"recall":[59],"better":[62],"F1":[63],"value,":[64],"shows":[66],"validity":[68],"algorithm.":[72]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":2},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":3},{"year":2018,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
