{"id":"https://openalex.org/W2168849694","doi":"https://doi.org/10.1177/0165551504046722","title":"The effect of similarity measures on the quality of query clusters","display_name":"The effect of similarity measures on the quality of query clusters","publication_year":2004,"publication_date":"2004-10-01","ids":{"openalex":"https://openalex.org/W2168849694","doi":"https://doi.org/10.1177/0165551504046722","mag":"2168849694"},"language":"en","primary_location":{"id":"doi:10.1177/0165551504046722","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551504046722","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://dr.ntu.edu.sg/bitstream/10356/91768/1/2004-effect-similarity-jis.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5110219817","display_name":"Fu Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Lin Fu","raw_affiliation_strings":["Division of Information Studies, School of Communication and Information,                         Nanyang Technological University, Singapore,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of Information Studies, School of Communication and Information,                         Nanyang Technological University, Singapore,","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051793131","display_name":"Dion Hoe\u2010Lian Goh","orcid":"https://orcid.org/0000-0003-2904-3269"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Dion Hoe-Lian Goh","raw_affiliation_strings":["Division of Information Studies, School of Communication and Information,                         Nanyang Technological University, Singapore","Division of Information Studies, School of Communication and Information, Nanyang Technological University, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of Information Studies, School of Communication and Information,                         Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Division of Information Studies, School of Communication and Information, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006167228","display_name":"Schubert Foo","orcid":"https://orcid.org/0000-0003-3043-0450"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Schubert Shou-Boon Foo","raw_affiliation_strings":["Division of Information Studies, School of Communication and Information,                         Nanyang Technological University, Singapore","Division of Information Studies, School of Communication and Information, Nanyang Technological University, Singapore"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Division of Information Studies, School of Communication and Information,                         Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]},{"raw_affiliation_string":"Division of Information Studies, School of Communication and Information, Nanyang Technological University, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5110219817"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":2.4214,"has_fulltext":true,"cited_by_count":12,"citation_normalized_percentile":{"value":0.92042927,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":96},"biblio":{"volume":"30","issue":"5","first_page":"396","last_page":"407"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.994700014591217,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7507869601249695},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.7419145703315735},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.7365105152130127},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.658405065536499},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.599838376045227},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.5464550256729126},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5250220894813538},{"id":"https://openalex.org/keywords/nearest-neighbor-search","display_name":"Nearest neighbor search","score":0.478851318359375},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.476375550031662},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.46973833441734314},{"id":"https://openalex.org/keywords/result-set","display_name":"Result set","score":0.4598004221916199},{"id":"https://openalex.org/keywords/query-expansion","display_name":"Query expansion","score":0.4505201578140259},{"id":"https://openalex.org/keywords/similarity-measure","display_name":"Similarity measure","score":0.43391329050064087},{"id":"https://openalex.org/keywords/web-query-classification","display_name":"Web query classification","score":0.43049243092536926},{"id":"https://openalex.org/keywords/web-search-query","display_name":"Web search query","score":0.3752862513065338},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.29716452956199646},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.11922904849052429},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.0641539990901947}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7507869601249695},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.7419145703315735},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.7365105152130127},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.658405065536499},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.599838376045227},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.5464550256729126},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5250220894813538},{"id":"https://openalex.org/C116738811","wikidata":"https://www.wikidata.org/wiki/Q608751","display_name":"Nearest neighbor search","level":2,"score":0.478851318359375},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.476375550031662},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.46973833441734314},{"id":"https://openalex.org/C4969071","wikidata":"https://www.wikidata.org/wiki/Q7316353","display_name":"Result set","level":3,"score":0.4598004221916199},{"id":"https://openalex.org/C99016210","wikidata":"https://www.wikidata.org/wiki/Q5488129","display_name":"Query expansion","level":2,"score":0.4505201578140259},{"id":"https://openalex.org/C2776517306","wikidata":"https://www.wikidata.org/wiki/Q29017317","display_name":"Similarity measure","level":2,"score":0.43391329050064087},{"id":"https://openalex.org/C118689300","wikidata":"https://www.wikidata.org/wiki/Q7978614","display_name":"Web query classification","level":4,"score":0.43049243092536926},{"id":"https://openalex.org/C164120249","wikidata":"https://www.wikidata.org/wiki/Q995982","display_name":"Web search query","level":3,"score":0.3752862513065338},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.29716452956199646},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.11922904849052429},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0641539990901947},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1177/0165551504046722","is_oa":false,"landing_page_url":"https://doi.org/10.1177/0165551504046722","pdf_url":null,"source":{"id":"https://openalex.org/S68913162","display_name":"Journal of Information Science","issn_l":"0165-5515","issn":["0165-5515","1741-6485"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Journal of Information Science","raw_type":"journal-article"},{"id":"pmh:oai:dr.ntu.edu.sg:10356/91768","is_oa":true,"landing_page_url":"http://hdl.handle.net/10220/6178","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/91768/1/2004-effect-similarity-jis.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.95.5035","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.95.5035","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://staffx.webstore.ntu.edu.sg/personal/ashlgoh/Shared Documents/pubs/2004-effect-similarity-jis.pdf","raw_type":"text"}],"best_oa_location":{"id":"pmh:oai:dr.ntu.edu.sg:10356/91768","is_oa":true,"landing_page_url":"http://hdl.handle.net/10220/6178","pdf_url":"https://dr.ntu.edu.sg/bitstream/10356/91768/1/2004-effect-similarity-jis.pdf","source":{"id":"https://openalex.org/S4306402609","display_name":"DR-NTU (Nanyang Technological University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I172675005","host_organization_name":"Nanyang Technological University","host_organization_lineage":["https://openalex.org/I172675005"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Journal Article"},"sustainable_development_goals":[{"score":0.6600000262260437,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320766","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2168849694.pdf","grobid_xml":"https://content.openalex.org/works/W2168849694.grobid-xml"},"referenced_works_count":35,"referenced_works":["https://openalex.org/W86205303","https://openalex.org/W100277439","https://openalex.org/W1554796723","https://openalex.org/W1588295798","https://openalex.org/W1673310716","https://openalex.org/W1802760973","https://openalex.org/W1847816476","https://openalex.org/W1956559956","https://openalex.org/W1966553486","https://openalex.org/W1982889956","https://openalex.org/W1987833517","https://openalex.org/W1992419399","https://openalex.org/W1993421924","https://openalex.org/W1998196377","https://openalex.org/W2000145992","https://openalex.org/W2009202693","https://openalex.org/W2039273494","https://openalex.org/W2041179002","https://openalex.org/W2057670860","https://openalex.org/W2066590388","https://openalex.org/W2069690469","https://openalex.org/W2075251734","https://openalex.org/W2109406928","https://openalex.org/W2113788004","https://openalex.org/W2123656745","https://openalex.org/W2155106456","https://openalex.org/W2325227998","https://openalex.org/W2602753196","https://openalex.org/W3142744039","https://openalex.org/W4231011906","https://openalex.org/W4253996635","https://openalex.org/W4285719527","https://openalex.org/W4300831780","https://openalex.org/W4300874750","https://openalex.org/W4365799952"],"related_works":["https://openalex.org/W2340295440","https://openalex.org/W3049728138","https://openalex.org/W4301666339","https://openalex.org/W2395498354","https://openalex.org/W4297789472","https://openalex.org/W206333655","https://openalex.org/W1805532631","https://openalex.org/W2100301193","https://openalex.org/W1581365825","https://openalex.org/W1982587323"],"abstract_inverted_index":{"Query":[0],"clustering":[1,76],"is":[2,57],"a":[3,63],"process":[4],"that":[5,36,113],"can":[6],"be":[7],"used":[8],"to":[9,18,49,59,73,96],"discover":[10],"common":[11],"interests":[12],"of":[13,27,42,62,66,85,91,100,107],"online":[14],"information":[15,47,53],"seekers":[16],"and":[17,45],"exploit":[19],"their":[20,52],"collective":[21],"search":[22,31],"experience":[23],"for":[24,127],"the":[25,60,74,83,98,105],"benefit":[26],"others.":[28],"Harnessing":[29],"such":[30],"experiences":[32],"facilitates":[33],"collaborative":[34],"querying":[35],"in":[37,120],"turn":[38],"may":[39],"help":[40],"users":[41],"digital":[43],"libraries":[44],"other":[46,119],"systems":[48],"better":[50],"meet":[51],"needs.":[54],"Since":[55],"similarity":[56,67,87,102,115],"fundamental":[58],"definition":[61],"cluster,":[64],"measures":[65,103,116],"between":[68],"two":[69],"queries":[70],"are":[71,130],"essential":[72],"query":[75,108,122],"procedure.":[77],"In":[78],"this":[79],"paper,":[80],"we":[81],"examine":[82],"effectiveness":[84],"different":[86,101,114,121],"measures.":[88],"A":[89],"set":[90],"experiments":[92],"was":[93],"carried":[94],"out":[95],"study":[97],"impact":[99],"on":[104],"quality":[106,124],"clusters.":[109],"The":[110],"results":[111],"show":[112],"outperform":[117],"each":[118],"cluster":[123],"criteria.":[125],"Implications":[126],"these":[128],"findings":[129],"discussed.":[131]},"counts_by_year":[{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2016,"cited_by_count":2},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":1}],"updated_date":"2026-05-05T06:06:40.768181","created_date":"2025-10-10T00:00:00"}
