{"id":"https://openalex.org/W2130476464","doi":"https://doi.org/10.1145/1007568.1007653","title":"Automatic categorization of query results","display_name":"Automatic categorization of query results","publication_year":2004,"publication_date":"2004-06-13","ids":{"openalex":"https://openalex.org/W2130476464","doi":"https://doi.org/10.1145/1007568.1007653","mag":"2130476464"},"language":"en","primary_location":{"id":"doi:10.1145/1007568.1007653","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1007568.1007653","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2004 ACM SIGMOD international conference on Management of data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113509258","display_name":"Kaushik Chakrabarti","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]},{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["GB","US"],"is_corresponding":true,"raw_author_name":"Kaushik Chakrabarti","raw_affiliation_strings":["Microsoft Research","Microsoft research#TAB#"],"affiliations":[{"raw_affiliation_string":"Microsoft Research","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"Microsoft research#TAB#","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038037154","display_name":"Surajit Chaudhuri","orcid":"https://orcid.org/0000-0001-8252-5270"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Surajit Chaudhuri","raw_affiliation_strings":["Microsoft Research","Microsoft research#TAB#"],"affiliations":[{"raw_affiliation_string":"Microsoft Research","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"Microsoft research#TAB#","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024873601","display_name":"Seung-won Hwang","orcid":null},"institutions":[{"id":"https://openalex.org/I2801919071","display_name":"University of Illinois System","ror":"https://ror.org/05e94g991","country_code":"US","type":"education","lineage":["https://openalex.org/I2801919071"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Seung-won Hwang","raw_affiliation_strings":["University of Illinois"],"affiliations":[{"raw_affiliation_string":"University of Illinois","institution_ids":["https://openalex.org/I2801919071"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5113509258"],"corresponding_institution_ids":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"],"apc_list":null,"apc_paid":null,"fwci":5.1437,"has_fulltext":false,"cited_by_count":87,"citation_normalized_percentile":{"value":0.95943968,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"755","last_page":"766"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11106","display_name":"Data Management and Algorithms","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9902999997138977,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/categorization","display_name":"Categorization","score":0.879319429397583},{"id":"https://openalex.org/keywords/information-overload","display_name":"Information overload","score":0.8334070444107056},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8028981685638428},{"id":"https://openalex.org/keywords/heuristic","display_name":"Heuristic","score":0.6152255535125732},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4556986093521118},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.421889990568161},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.40073469281196594},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3345075249671936},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.08606210350990295}],"concepts":[{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.879319429397583},{"id":"https://openalex.org/C186625053","wikidata":"https://www.wikidata.org/wiki/Q1130191","display_name":"Information overload","level":2,"score":0.8334070444107056},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8028981685638428},{"id":"https://openalex.org/C173801870","wikidata":"https://www.wikidata.org/wiki/Q201413","display_name":"Heuristic","level":2,"score":0.6152255535125732},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4556986093521118},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.421889990568161},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.40073469281196594},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3345075249671936},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.08606210350990295}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/1007568.1007653","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1007568.1007653","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2004 ACM SIGMOD international conference on Management of data","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.606.4496","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.606.4496","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.searchforum.org.cn/dataflowgroup/Reading/Reading_Suny/SIGMOD/sigmod2004/automatic categorization of query results.pdf","raw_type":"text"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.83.7458","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.83.7458","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://research.microsoft.com/users/kaushik/pubs/categorization_sigmod04.pdf","raw_type":"text"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W5013789","https://openalex.org/W6472071","https://openalex.org/W942791280","https://openalex.org/W976026051","https://openalex.org/W1006168843","https://openalex.org/W1011364289","https://openalex.org/W1484527064","https://openalex.org/W1516293359","https://openalex.org/W1559729415","https://openalex.org/W1560862172","https://openalex.org/W1577233831","https://openalex.org/W1584617460","https://openalex.org/W1585743408","https://openalex.org/W1596747867","https://openalex.org/W1606989144","https://openalex.org/W1638540206","https://openalex.org/W1660390307","https://openalex.org/W1724287152","https://openalex.org/W1746171598","https://openalex.org/W1764664858","https://openalex.org/W1798118326","https://openalex.org/W1844949470","https://openalex.org/W1849704194","https://openalex.org/W1892103244","https://openalex.org/W1916917555","https://openalex.org/W1920142350","https://openalex.org/W1962528201","https://openalex.org/W1986133022","https://openalex.org/W1986898623","https://openalex.org/W2028128906","https://openalex.org/W2033139852","https://openalex.org/W2043885422","https://openalex.org/W2052936337","https://openalex.org/W2064686951","https://openalex.org/W2065085057","https://openalex.org/W2086287277","https://openalex.org/W2086827681","https://openalex.org/W2095897464","https://openalex.org/W2098388305","https://openalex.org/W2102281354","https://openalex.org/W2103201239","https://openalex.org/W2118020653","https://openalex.org/W2120108467","https://openalex.org/W2121350579","https://openalex.org/W2121647436","https://openalex.org/W2122865866","https://openalex.org/W2134195632","https://openalex.org/W2135046866","https://openalex.org/W2135386066","https://openalex.org/W2136461127","https://openalex.org/W2140100403","https://openalex.org/W2145295623","https://openalex.org/W2146431924","https://openalex.org/W2151406030","https://openalex.org/W2153635508","https://openalex.org/W2163352848","https://openalex.org/W2164016202","https://openalex.org/W2170654002","https://openalex.org/W2171903035","https://openalex.org/W2199201860","https://openalex.org/W2244987098","https://openalex.org/W2277238962","https://openalex.org/W2397943291","https://openalex.org/W2407187628","https://openalex.org/W2411457633","https://openalex.org/W2978337448","https://openalex.org/W3142904096","https://openalex.org/W3143471909","https://openalex.org/W4237841550","https://openalex.org/W6682452324"],"related_works":["https://openalex.org/W3134493632","https://openalex.org/W2165912799","https://openalex.org/W1602080981","https://openalex.org/W2735662278","https://openalex.org/W2382615723","https://openalex.org/W4311804456","https://openalex.org/W4242208525","https://openalex.org/W1987484445","https://openalex.org/W2623658258","https://openalex.org/W2605555545"],"abstract_inverted_index":{"Exploratory":[0],"ad-hoc":[1],"queries":[2,29],"could":[3],"return":[4],"too":[5],"many":[6],"answers":[7],"-":[8,42],"a":[9,37,47,86,89,102],"phenomenon":[10],"commonly":[11],"referred":[12],"to":[13,22,30,80,110],"as":[14,101],"\"information":[15],"overload\".":[16],"In":[17],"this":[18,32],"paper,":[19],"we":[20,96],"propose":[21],"automatically":[23],"categorize":[24],"the":[25,63,68,98,112],"results":[26],"of":[27],"SQL":[28],"address":[31],"problem.":[33],"We":[34,75],"dynamically":[35],"generate":[36],"labeled,":[38],"hierarchical":[39],"category":[40,48],"structure":[41],"users":[43],"can":[44,59],"determine":[45],"whether":[46],"is":[49],"relevant":[50,64],"or":[51],"not":[52],"by":[53,85],"examining":[54],"simply":[55],"its":[56],"label;":[57],"she":[58],"then":[60],"explore":[61],"just":[62],"categories":[65],"and":[66,106],"ignore":[67],"remaining":[69],"ones,":[70],"thereby":[71],"reducing":[72],"information":[73,82],"overload.":[74],"first":[76],"develop":[77,107],"analytical":[78],"models":[79],"estimate":[81],"overload":[83],"faced":[84],"user":[87],"for":[88],"given":[90],"exploration.":[91],"Based":[92],"on":[93],"those":[94],"models,":[95],"formulate":[97],"categorization":[99],"problem":[100,105],"cost":[103],"optimization":[104],"heuristic":[108],"algorithms":[109],"compute":[111],"min-cost":[113],"categorization.":[114]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2018,"cited_by_count":1},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":2},{"year":2014,"cited_by_count":6},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":15}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
