{"id":"https://openalex.org/W2168812139","doi":"https://doi.org/10.1177/0165551507082592","title":"A comparative study of two automatic document classification methods in a library setting","display_name":"A comparative study of two automatic document classification methods in a library setting","publication_year":2007,"publication_date":"2007-07-12","ids":{"openalex":"https://openalex.org/W2168812139","doi":"https://doi.org/10.1177/0165551507082592","mag":"2168812139"},"language":"en","primary_location":{"id":"doi:10.1177/0165551507082592","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551507082592","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5072960624","display_name":"Joanna Pong","orcid":"https://orcid.org/0000-0003-3304-2939"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Joanna Yi-Hang Pong","raw_affiliation_strings":["Run Run Shaw Library, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Run Run Shaw Library, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101559768","display_name":"Ron Chi-Wai Kwok","orcid":"https://orcid.org/0000-0001-9100-0142"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":true,"raw_author_name":"Ron Chi-Wai Kwok","raw_affiliation_strings":["Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong,"],"affiliations":[{"raw_affiliation_string":"Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong,","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5084348345","display_name":"Raymond Y.K. Lau","orcid":"https://orcid.org/0000-0002-5751-4550"},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Raymond Yiu-Keung Lau","raw_affiliation_strings":["Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100507018","display_name":"Jin\u2010Xing Hao","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Jin-Xing Hao","raw_affiliation_strings":["Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5090689254","display_name":"Percy Ching-Chi Wong","orcid":null},"institutions":[{"id":"https://openalex.org/I168719708","display_name":"City University of Hong Kong","ror":"https://ror.org/03q8dnn23","country_code":"HK","type":"education","lineage":["https://openalex.org/I168719708"]}],"countries":["HK"],"is_corresponding":false,"raw_author_name":"Percy Ching-Chi Wong","raw_affiliation_strings":["Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Department of Information Systems, City University of Hong Kong, Tat Chee Avenue, Kowloon, Hong Kong","institution_ids":["https://openalex.org/I168719708"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101559768"],"corresponding_institution_ids":["https://openalex.org/I168719708"],"apc_list":null,"apc_paid":null,"fwci":1.877,"has_fulltext":false,"cited_by_count":26,"citation_normalized_percentile":{"value":0.88612379,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"34","issue":"2","first_page":"213","last_page":"230"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13083","display_name":"Advanced Text Analysis Techniques","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9638000130653381,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8321454524993896},{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.6733173131942749},{"id":"https://openalex.org/keywords/library-classification","display_name":"Library classification","score":0.6687520742416382},{"id":"https://openalex.org/keywords/digital-library","display_name":"Digital library","score":0.6606884598731995},{"id":"https://openalex.org/keywords/search-engine-indexing","display_name":"Search engine indexing","score":0.6174222826957703},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6011708378791809},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5753827691078186},{"id":"https://openalex.org/keywords/document-classification","display_name":"Document classification","score":0.5601718425750732},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.530471920967102},{"id":"https://openalex.org/keywords/automatic-indexing","display_name":"Automatic indexing","score":0.4870662987232208},{"id":"https://openalex.org/keywords/the-internet","display_name":"The Internet","score":0.42785048484802246},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.32401394844055176},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.22610872983932495}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8321454524993896},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.6733173131942749},{"id":"https://openalex.org/C204126058","wikidata":"https://www.wikidata.org/wiki/Q48473","display_name":"Library classification","level":2,"score":0.6687520742416382},{"id":"https://openalex.org/C513874922","wikidata":"https://www.wikidata.org/wiki/Q212805","display_name":"Digital library","level":3,"score":0.6606884598731995},{"id":"https://openalex.org/C75165309","wikidata":"https://www.wikidata.org/wiki/Q2258979","display_name":"Search engine indexing","level":2,"score":0.6174222826957703},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6011708378791809},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5753827691078186},{"id":"https://openalex.org/C2780479914","wikidata":"https://www.wikidata.org/wiki/Q302088","display_name":"Document classification","level":2,"score":0.5601718425750732},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.530471920967102},{"id":"https://openalex.org/C2778330532","wikidata":"https://www.wikidata.org/wiki/Q4826577","display_name":"Automatic indexing","level":3,"score":0.4870662987232208},{"id":"https://openalex.org/C110875604","wikidata":"https://www.wikidata.org/wiki/Q75","display_name":"The Internet","level":2,"score":0.42785048484802246},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.32401394844055176},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.22610872983932495},{"id":"https://openalex.org/C164913051","wikidata":"https://www.wikidata.org/wiki/Q482","display_name":"Poetry","level":2,"score":0.0},{"id":"https://openalex.org/C124952713","wikidata":"https://www.wikidata.org/wiki/Q8242","display_name":"Literature","level":1,"score":0.0},{"id":"https://openalex.org/C142362112","wikidata":"https://www.wikidata.org/wiki/Q735","display_name":"Art","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/0165551507082592","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551507082592","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7300000190734863,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W128026211","https://openalex.org/W140312209","https://openalex.org/W1487445520","https://openalex.org/W1620204465","https://openalex.org/W1924689489","https://openalex.org/W1956559956","https://openalex.org/W1965350351","https://openalex.org/W1974339500","https://openalex.org/W1974858995","https://openalex.org/W2005422315","https://openalex.org/W2017792962","https://openalex.org/W2032304665","https://openalex.org/W2054207584","https://openalex.org/W2060259280","https://openalex.org/W2063862666","https://openalex.org/W2064580901","https://openalex.org/W2081321668","https://openalex.org/W2094255877","https://openalex.org/W2098162425","https://openalex.org/W2118020653","https://openalex.org/W2148202334","https://openalex.org/W2149684865","https://openalex.org/W2236857040","https://openalex.org/W2325227998","https://openalex.org/W2560674852","https://openalex.org/W2917891876","https://openalex.org/W4246519874","https://openalex.org/W4285719527"],"related_works":["https://openalex.org/W2011471399","https://openalex.org/W4249836580","https://openalex.org/W2094492371","https://openalex.org/W2509430763","https://openalex.org/W1873761914","https://openalex.org/W4256137736","https://openalex.org/W2128580294","https://openalex.org/W2471302064","https://openalex.org/W2002101594","https://openalex.org/W171162874"],"abstract_inverted_index":{"In":[0],"current":[1,175],"library":[2,41,50,68,81,101,134,176,197],"practice,":[3],"trained":[4],"human":[5],"experts":[6],"usually":[7],"carry":[8],"out":[9],"document":[10,64,76,122,170,193,218],"cataloguing":[11],"and":[12,33,48,61,114,155],"indexing":[13],"based":[14,120,220],"on":[15,30,221],"a":[16,54,105,117,196],"manual":[17,55,128],"approach.":[18,56],"With":[19],"the":[20,24,31,59,67,112,127,133,156,187,207,213,222],"explosive":[21],"growth":[22],"in":[23,91,153,161,195],"number":[25],"of":[26,63,73,116,211],"electronic":[27,46],"documents":[28,47],"available":[29],"Internet":[32],"digital":[34],"libraries,":[35],"it":[36],"is":[37,103,206],"increasingly":[38],"difficult":[39],"for":[40],"practitioners":[42],"to":[43,79,99,125,166,173,184,190,216],"categorize":[44,80],"both":[45],"traditional":[49],"materials":[51],"using":[52,74],"just":[53],"To":[57,201],"improve":[58,100],"effectiveness":[60],"efficiency":[62],"categorization":[65,129],"at":[66],"setting,":[69],"more":[70],"in-depth":[71,209],"studies":[72],"automatic":[75,121,192,217],"classification":[77,123,171,194,219,226],"methods":[78],"items":[82],"are":[83,199],"required.":[84],"Machine":[85],"learning":[86,97,119,139,151],"research":[87],"has":[88],"advanced":[89],"rapidly":[90],"recent":[92],"years.":[93],"However,":[94],"applying":[95,212],"machine":[96,118,138,150],"techniques":[98],"practice":[102],"still":[104],"relatively":[106],"unexplored":[107],"area.":[108],"This":[109],"paper":[110],"illustrates":[111],"design":[113],"development":[115],"system":[124,172],"alleviate":[126],"problem":[130],"encountered":[131],"within":[132],"setting.":[135],"Two":[136],"supervised":[137,149],"algorithms":[140,152],"have":[141],"been":[142],"tested.":[143],"Our":[144],"empirical":[145],"tests":[146],"show":[147],"that":[148],"general,":[154],"k-nearest":[157],"neighbours":[158],"(KNN)":[159],"algorithm":[160,189,215],"particular,":[162],"can":[163],"be":[164],"used":[165,224],"develop":[167,191],"an":[168],"effective":[169],"enhance":[174],"practice.":[177],"Moreover,":[178],"some":[179],"concrete":[180],"recommendations":[181],"regarding":[182],"how":[183],"practically":[185],"apply":[186],"KNN":[188,214],"setting":[198],"made.":[200],"our":[202],"best":[203],"knowledge,":[204],"this":[205],"first":[208],"study":[210],"widely":[223],"LCC":[225],"scheme":[227],"adopted":[228],"by":[229],"many":[230],"large":[231],"libraries.":[232]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":4},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
