{"id":"https://openalex.org/W2022006917","doi":"https://doi.org/10.1145/1645953.1646069","title":"Clustering web queries","display_name":"Clustering web queries","publication_year":2009,"publication_date":"2009-11-02","ids":{"openalex":"https://openalex.org/W2022006917","doi":"https://doi.org/10.1145/1645953.1646069","mag":"2022006917"},"language":"en","primary_location":{"id":"doi:10.1145/1645953.1646069","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1645953.1646069","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th ACM conference on Information and knowledge management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5009284826","display_name":"John S. Whissell","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"John S. Whissell","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037737168","display_name":"Charles L. A. Clarke","orcid":"https://orcid.org/0000-0001-8178-9194"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Charles L.A. Clarke","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5018753905","display_name":"Azin Ashkan","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Azin Ashkan","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5009284826"],"corresponding_institution_ids":["https://openalex.org/I151746483"],"apc_list":null,"apc_paid":null,"fwci":1.7447,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.86743784,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"899","last_page":"908"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10637","display_name":"Advanced Clustering Algorithms Research","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.8197671175003052},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7617787718772888},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.6593132615089417},{"id":"https://openalex.org/keywords/weighting","display_name":"Weighting","score":0.6130655407905579},{"id":"https://openalex.org/keywords/classifier","display_name":"Classifier (UML)","score":0.5230848789215088},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.49749186635017395},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.46929389238357544},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.4688013195991516},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.45486941933631897},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.42690831422805786},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.28388726711273193}],"concepts":[{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.8197671175003052},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7617787718772888},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.6593132615089417},{"id":"https://openalex.org/C183115368","wikidata":"https://www.wikidata.org/wiki/Q856577","display_name":"Weighting","level":2,"score":0.6130655407905579},{"id":"https://openalex.org/C95623464","wikidata":"https://www.wikidata.org/wiki/Q1096149","display_name":"Classifier (UML)","level":2,"score":0.5230848789215088},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.49749186635017395},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.46929389238357544},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.4688013195991516},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.45486941933631897},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.42690831422805786},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.28388726711273193},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C126838900","wikidata":"https://www.wikidata.org/wiki/Q77604","display_name":"Radiology","level":1,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C71924100","wikidata":"https://www.wikidata.org/wiki/Q11190","display_name":"Medicine","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1645953.1646069","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1645953.1646069","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 18th ACM conference on Information and knowledge management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","score":0.699999988079071,"display_name":"Reduced inequalities"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":40,"referenced_works":["https://openalex.org/W37713582","https://openalex.org/W145805811","https://openalex.org/W146900863","https://openalex.org/W1484330506","https://openalex.org/W1484435853","https://openalex.org/W1512164432","https://openalex.org/W1583837637","https://openalex.org/W1585610988","https://openalex.org/W1602389404","https://openalex.org/W1612003148","https://openalex.org/W1798054139","https://openalex.org/W1971318281","https://openalex.org/W1972645849","https://openalex.org/W1974603499","https://openalex.org/W1985593448","https://openalex.org/W1992419399","https://openalex.org/W2013029404","https://openalex.org/W2013225614","https://openalex.org/W2049633694","https://openalex.org/W2060314721","https://openalex.org/W2071949631","https://openalex.org/W2104217798","https://openalex.org/W2107743791","https://openalex.org/W2113076747","https://openalex.org/W2113455164","https://openalex.org/W2115746347","https://openalex.org/W2121947440","https://openalex.org/W2124658502","https://openalex.org/W2132820034","https://openalex.org/W2137572914","https://openalex.org/W2150593711","https://openalex.org/W2150753219","https://openalex.org/W2156037541","https://openalex.org/W2157361576","https://openalex.org/W2293273145","https://openalex.org/W2336821893","https://openalex.org/W2595697910","https://openalex.org/W4210665681","https://openalex.org/W4231336072","https://openalex.org/W4233135949"],"related_works":["https://openalex.org/W2180954594","https://openalex.org/W2052835778","https://openalex.org/W2049003611","https://openalex.org/W2127804977","https://openalex.org/W2108418243","https://openalex.org/W164103134","https://openalex.org/W2787352659","https://openalex.org/W1970611213","https://openalex.org/W4206560911","https://openalex.org/W4372260270"],"abstract_inverted_index":{"Despite":[0],"the":[1,20,71,85,119,131,141,144,179],"wide":[2],"applicability":[3,86],"of":[4,22,46,54,73,80,87,103,111,121,133,165],"clustering":[5,23,41,153],"methods,":[6],"their":[7],"evaluation":[8,21],"remains":[9],"a":[10,17,34,37,63,78,98,107,122],"problem.":[11],"In":[12],"this":[13,55,59,74,88],"paper,":[14],"we":[15,90],"present":[16],"metric":[18,89,170],"for":[19],"methods.":[24],"The":[25,176],"data":[26,101,109,182],"set":[27,102,110,183],"to":[28,50,65,93,161,186],"be":[29],"clustered":[30],"is":[31,128,171],"viewed":[32],"as":[33],"sample":[35],"from":[36,118,147],"larger":[38],"population,":[39],"with":[40,157],"quality":[42],"measured":[43],"in":[44,195],"terms":[45],"our":[47],"predicted":[48],"ability":[49],"discriminate":[51],"between":[52],"members":[53],"population.":[56],"We":[57,96],"measure":[58],"property":[60],"by":[61,77,139],"training":[62],"classifier":[64],"recognize":[66],"each":[67,166],"cluster":[68],"and":[69,106,191],"measuring":[70],"accuracy":[72],"classifier,":[75],"normalized":[76],"notion":[79],"expected":[81],"accuracy.":[82],"To":[83],"demonstrate":[84],"apply":[91],"it":[92],"Web":[94,124],"queries.":[95,113],"investigated":[97],"commercially":[99,180],"oriented":[100,181],"1700":[104],"queries":[105,142],"general":[108],"4000":[112],"Both":[114],"sets":[115],"are":[116,155,184,192],"taken":[117],"logs":[120],"commercial":[123],"search":[125,134,145],"engine.":[126],"Clustering":[127],"based":[129],"on":[130,143,178],"contents":[132],"engine":[135,146],"result":[136],"pages":[137],"generated":[138],"executing":[140],"which":[148],"they":[149],"were":[150],"taken.":[151],"Multiple":[152],"algorithms":[154],"crossed":[156],"various":[158],"weighting":[159],"schemes":[160],"produce":[162],"multiple":[163],"clusterings":[164],"query":[167],"set.":[168],"Our":[169],"used":[172,194],"evaluate":[173],"these":[174],"clusterings.":[175],"results":[177],"compared":[185],"two":[187],"pre-existing":[188],"manual":[189],"labelings,":[190],"also":[193],"an":[196],"ad":[197],"clickthrough":[198],"experiment.":[199]},"counts_by_year":[{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":1},{"year":2012,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
