{"id":"https://openalex.org/W2137800096","doi":"https://doi.org/10.1145/1592748.1592753","title":"Scalable clustering and keyword suggestion for online advertisements","display_name":"Scalable clustering and keyword suggestion for online advertisements","publication_year":2009,"publication_date":"2009-06-28","ids":{"openalex":"https://openalex.org/W2137800096","doi":"https://doi.org/10.1145/1592748.1592753","mag":"2137800096"},"language":"en","primary_location":{"id":"doi:10.1145/1592748.1592753","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1592748.1592753","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Third International Workshop on Data Mining and Audience Intelligence for Advertising","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010707054","display_name":"Anton Schwaighofer","orcid":"https://orcid.org/0000-0003-1557-0527"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB","US"],"is_corresponding":true,"raw_author_name":"Anton Schwaighofer","raw_affiliation_strings":["Microsoft Research, Cambridge, UK","Microsoft Research, Cambridge, UK;"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Cambridge, UK","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"Microsoft Research, Cambridge, UK;","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041298987","display_name":"Joaquin Qui\u00f1onero Candela","orcid":"https://orcid.org/0009-0004-5149-3228"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Joaquin Qui\u00f1onero Candela","raw_affiliation_strings":["Microsoft Research, Cambridge, UK","Microsoft Research, Cambridge, UK;"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Cambridge, UK","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"Microsoft Research, Cambridge, UK;","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010665446","display_name":"Thomas Borchert","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Thomas Borchert","raw_affiliation_strings":["Microsoft Research, Cambridge, UK","Microsoft Research, Cambridge, UK;"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Cambridge, UK","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"Microsoft Research, Cambridge, UK;","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051619646","display_name":"Thore Graepel","orcid":"https://orcid.org/0000-0003-3957-0310"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]},{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Thore Graepel","raw_affiliation_strings":["Microsoft Research, Cambridge, UK","Microsoft Research, Cambridge, UK;"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Cambridge, UK","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"Microsoft Research, Cambridge, UK;","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5059907791","display_name":"Ralf Herbrich","orcid":null},"institutions":[{"id":"https://openalex.org/I4210164937","display_name":"Microsoft Research (United Kingdom)","ror":"https://ror.org/05k87vq12","country_code":"GB","type":"company","lineage":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"]},{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["GB","US"],"is_corresponding":false,"raw_author_name":"Ralf Herbrich","raw_affiliation_strings":["Microsoft Research, Cambridge, UK","Microsoft Research, Cambridge, UK;"],"affiliations":[{"raw_affiliation_string":"Microsoft Research, Cambridge, UK","institution_ids":["https://openalex.org/I4210164937"]},{"raw_affiliation_string":"Microsoft Research, Cambridge, UK;","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5010707054"],"corresponding_institution_ids":["https://openalex.org/I1290206253","https://openalex.org/I4210164937"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.13682157,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"35","issue":null,"first_page":"27","last_page":"36"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11901","display_name":"Bayesian Methods and Mixture Models","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11550","display_name":"Text and Document Classification Technologies","score":0.9897000193595886,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7990708351135254},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.7403169870376587},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5386500358581543},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5224593877792358},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.4468016028404236},{"id":"https://openalex.org/keywords/bayesian-inference","display_name":"Bayesian inference","score":0.41586506366729736},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.41539207100868225},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.38942092657089233},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3395685851573944},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3193274140357971},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.09425663948059082}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7990708351135254},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.7403169870376587},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5386500358581543},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5224593877792358},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.4468016028404236},{"id":"https://openalex.org/C160234255","wikidata":"https://www.wikidata.org/wiki/Q812535","display_name":"Bayesian inference","level":3,"score":0.41586506366729736},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.41539207100868225},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.38942092657089233},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3395685851573944},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3193274140357971},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.09425663948059082},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/1592748.1592753","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1592748.1592753","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Third International Workshop on Data Mining and Audience Intelligence for Advertising","raw_type":"proceedings-article"},{"id":"pmh:oai:CiteSeerX.psu:10.1.1.718.4521","is_oa":false,"landing_page_url":"http://citeseerx.ist.psu.edu/viewdoc/summary?doi=10.1.1.718.4521","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"http://www.quinonero.net/Publications/adClustering.pdf","raw_type":"text"},{"id":"pmh:oai:eprints.ucl.ac.uk.OAI2:1514648","is_oa":false,"landing_page_url":"http://discovery.ucl.ac.uk/1514648/","pdf_url":null,"source":{"id":"https://openalex.org/S4306400024","display_name":"UCL Discovery (University College London)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I45129253","host_organization_name":"University College London","host_organization_lineage":["https://openalex.org/I45129253"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"     In:    (pp. pp. 27-36).   (2009)     ","raw_type":"Proceedings paper"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W181127821","https://openalex.org/W1506806321","https://openalex.org/W1515272691","https://openalex.org/W1579271636","https://openalex.org/W1880262756","https://openalex.org/W1968114652","https://openalex.org/W2045729350","https://openalex.org/W2111748568","https://openalex.org/W2132708887","https://openalex.org/W2137813581","https://openalex.org/W2154463588","https://openalex.org/W2488678869","https://openalex.org/W2554987453","https://openalex.org/W4212863985","https://openalex.org/W6607364932","https://openalex.org/W6629510986","https://openalex.org/W6629971530","https://openalex.org/W6642470415","https://openalex.org/W7020380774"],"related_works":["https://openalex.org/W2372267530","https://openalex.org/W2969189870","https://openalex.org/W2585791450","https://openalex.org/W3015855446","https://openalex.org/W4303857162","https://openalex.org/W2965643117","https://openalex.org/W4288266653","https://openalex.org/W2407375987","https://openalex.org/W2505726097","https://openalex.org/W2950975704"],"abstract_inverted_index":{"We":[0],"present":[1],"an":[2,101,117],"efficient":[3],"Bayesian":[4],"online":[5,58,132,137,175],"learning":[6],"algorithm":[7,64],"for":[8,40,156,190],"clustering":[9,164],"vectors":[10],"of":[11,22,92,143],"binary":[12],"values":[13],"based":[14,106],"on":[15,84,107,116,166],"a":[16,50,73,125,171],"well":[17,155],"known":[18],"model,":[19],"the":[20,32,77,90,108,134,141,167,180],"mixture":[21],"Bernoulli":[23],"profiles.":[24],"The":[25,62,112,151],"model":[26,110,113,182],"includes":[27],"conjugate":[28],"Beta":[29],"priors":[30],"over":[31],"success":[33],"probabilities":[34],"and":[35,79,94,97,122,159],"maintains":[36,89],"discrete":[37],"probability":[38],"distributions":[39],"cluster":[41,95],"assignments.":[42],"Clustering":[43],"is":[44,54,114],"then":[45],"formulated":[46],"as":[47],"inference":[48],"in":[49],"factor":[51],"graph":[52],"which":[53,146],"solved":[55],"efficiently":[56],"using":[57],"approximate":[59],"message":[60],"passing.":[61],"resulting":[63],"has":[65],"three":[66],"key":[67],"features:":[68],"a)":[69],"it":[70,88,99],"requires":[71],"only":[72],"single":[74],"pass":[75],"across":[76],"data":[78,85,129,135],"can":[80,183],"hence":[81],"be":[82,184],"used":[83,185],"streams,":[86],"b)":[87],"uncertainty":[91],"parameters":[93],"assignments,":[96],"c)":[98],"implements":[100],"automatic":[102],"step":[103],"size":[104],"adaptation":[105],"current":[109],"uncertainty.":[111],"tested":[115],"artificially":[118],"generated":[119],"toy":[120],"dataset":[121],"applied":[123],"to":[124,145,162,174,186],"large":[126,157],"scale":[127],"real-world":[128],"set":[130,142],"from":[131],"advertising,":[133],"being":[136],"ads":[138,168],"characterized":[139],"by":[140],"keywords":[144,189],"they":[147],"have":[148],"been":[149],"subscribed.":[150],"proposed":[152],"approach":[153],"scales":[154],"datasets,":[158],"compares":[160],"favorably":[161],"other":[163],"algorithms":[165],"dataset.":[169],"As":[170],"concrete":[172],"application":[173],"advertising":[176],"we":[177],"show":[178],"how":[179],"learnt":[181],"recommend":[187],"new":[188],"given":[191],"ads.":[192]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":2},{"year":2020,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":2}],"updated_date":"2026-04-05T17:49:38.594831","created_date":"2025-10-10T00:00:00"}
