{"id":"https://openalex.org/W2071488943","doi":"https://doi.org/10.1145/1281192.1281198","title":"Estimating rates of rare events at multiple resolutions","display_name":"Estimating rates of rare events at multiple resolutions","publication_year":2007,"publication_date":"2007-08-12","ids":{"openalex":"https://openalex.org/W2071488943","doi":"https://doi.org/10.1145/1281192.1281198","mag":"2071488943"},"language":"en","primary_location":{"id":"doi:10.1145/1281192.1281198","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1281192.1281198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101736089","display_name":"Deepak Agarwal","orcid":"https://orcid.org/0000-0003-2590-2206"},"institutions":[{"id":"https://openalex.org/I2800095910","display_name":"Yahoo (Spain)","ror":"https://ror.org/03gq8sg42","country_code":"ES","type":"company","lineage":["https://openalex.org/I2800095910","https://openalex.org/I4210134091"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Deepak Agarwal","raw_affiliation_strings":["Yahoo! Research","Yahoo! research,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research","institution_ids":[]},{"raw_affiliation_string":"Yahoo! research,","institution_ids":["https://openalex.org/I2800095910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108541542","display_name":"Andrei Broder","orcid":null},"institutions":[{"id":"https://openalex.org/I2800095910","display_name":"Yahoo (Spain)","ror":"https://ror.org/03gq8sg42","country_code":"ES","type":"company","lineage":["https://openalex.org/I2800095910","https://openalex.org/I4210134091"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Andrei Zary Broder","raw_affiliation_strings":["Yahoo! Research","Yahoo! research,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research","institution_ids":[]},{"raw_affiliation_string":"Yahoo! research,","institution_ids":["https://openalex.org/I2800095910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078048346","display_name":"Deepayan Chakrabarti","orcid":"https://orcid.org/0000-0002-3863-4928"},"institutions":[{"id":"https://openalex.org/I2800095910","display_name":"Yahoo (Spain)","ror":"https://ror.org/03gq8sg42","country_code":"ES","type":"company","lineage":["https://openalex.org/I2800095910","https://openalex.org/I4210134091"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Deepayan Chakrabarti","raw_affiliation_strings":["Yahoo! Research","Yahoo! research,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research","institution_ids":[]},{"raw_affiliation_string":"Yahoo! research,","institution_ids":["https://openalex.org/I2800095910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041794167","display_name":"Dejan Diklic","orcid":null},"institutions":[{"id":"https://openalex.org/I2800095910","display_name":"Yahoo (Spain)","ror":"https://ror.org/03gq8sg42","country_code":"ES","type":"company","lineage":["https://openalex.org/I2800095910","https://openalex.org/I4210134091"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Dejan Diklic","raw_affiliation_strings":["Yahoo! Research","Yahoo! research,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research","institution_ids":[]},{"raw_affiliation_string":"Yahoo! research,","institution_ids":["https://openalex.org/I2800095910"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037908462","display_name":"Vanja Josifovski","orcid":null},"institutions":[{"id":"https://openalex.org/I2800095910","display_name":"Yahoo (Spain)","ror":"https://ror.org/03gq8sg42","country_code":"ES","type":"company","lineage":["https://openalex.org/I2800095910","https://openalex.org/I4210134091"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Vanja Josifovski","raw_affiliation_strings":["Yahoo! Research","Yahoo! research,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research","institution_ids":[]},{"raw_affiliation_string":"Yahoo! research,","institution_ids":["https://openalex.org/I2800095910"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5073819862","display_name":"Mayssam Sayyadian","orcid":null},"institutions":[{"id":"https://openalex.org/I2800095910","display_name":"Yahoo (Spain)","ror":"https://ror.org/03gq8sg42","country_code":"ES","type":"company","lineage":["https://openalex.org/I2800095910","https://openalex.org/I4210134091"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Mayssam Sayyadian","raw_affiliation_strings":["Yahoo! Research","Yahoo! research,"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Yahoo! Research","institution_ids":[]},{"raw_affiliation_string":"Yahoo! research,","institution_ids":["https://openalex.org/I2800095910"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":12.4361,"has_fulltext":false,"cited_by_count":49,"citation_normalized_percentile":{"value":0.98250594,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"16","last_page":"25"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11512","display_name":"Anomaly Detection Techniques and Applications","score":0.9914000034332275,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10064","display_name":"Complex Network Analysis Techniques","score":0.9901999831199646,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7775709629058838},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.6173274517059326},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6006523370742798},{"id":"https://openalex.org/keywords/hierarchy","display_name":"Hierarchy","score":0.5858540534973145},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.5399195551872253},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.4711032509803772},{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.47095662355422974},{"id":"https://openalex.org/keywords/sampling","display_name":"Sampling (signal processing)","score":0.46002545952796936},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.4542470872402191},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.4528043568134308},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4267267882823944},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.41317373514175415},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.37048494815826416},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.12995758652687073}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7775709629058838},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.6173274517059326},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6006523370742798},{"id":"https://openalex.org/C31170391","wikidata":"https://www.wikidata.org/wiki/Q188619","display_name":"Hierarchy","level":2,"score":0.5858540534973145},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.5399195551872253},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.4711032509803772},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.47095662355422974},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.46002545952796936},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.4542470872402191},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.4528043568134308},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4267267882823944},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.41317373514175415},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.37048494815826416},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.12995758652687073},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C34447519","wikidata":"https://www.wikidata.org/wiki/Q179522","display_name":"Market economy","level":1,"score":0.0},{"id":"https://openalex.org/C120665830","wikidata":"https://www.wikidata.org/wiki/Q14620","display_name":"Optics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1281192.1281198","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1281192.1281198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 13th ACM SIGKDD international conference on Knowledge discovery and data mining","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6800000071525574,"display_name":"Reduced inequalities","id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":19,"referenced_works":["https://openalex.org/W46877293","https://openalex.org/W1482090177","https://openalex.org/W2001792610","https://openalex.org/W2012425257","https://openalex.org/W2024760831","https://openalex.org/W2027472851","https://openalex.org/W2049633694","https://openalex.org/W2049898997","https://openalex.org/W2062881394","https://openalex.org/W2099664903","https://openalex.org/W2118502261","https://openalex.org/W2143022286","https://openalex.org/W2148143831","https://openalex.org/W2313953460","https://openalex.org/W2318487091","https://openalex.org/W3125953395","https://openalex.org/W4302150147","https://openalex.org/W6677724928","https://openalex.org/W6681402394"],"related_works":["https://openalex.org/W2931688134","https://openalex.org/W2377919138","https://openalex.org/W2378857091","https://openalex.org/W2999756192","https://openalex.org/W103652678","https://openalex.org/W4226090359","https://openalex.org/W2059697060","https://openalex.org/W936373746","https://openalex.org/W4382701072","https://openalex.org/W2461263520"],"abstract_inverted_index":{"We":[0],"consider":[1],"the":[2,28,42,45,62,68,71,93,109,119,124,177],"problem":[3,29],"of":[4,8,30,59,70,90,111,118,163,190],"estimating":[5,31],"occurrence":[6],"rates":[7,33,64,100],"rare":[9,186],"eventsfor":[10],"extremely":[11,185],"sparse":[12],"data,":[13],"using":[14,101],"pre-existing":[15],"hierarchies":[16,50,72],"to":[17,121,152],"perform":[18],"inference":[19],"at":[20,56,115,132],"multiple":[21],"resolutions.":[22],"In":[23],"particular,":[24],"we":[25,79,85,167],"focus":[26],"on":[27],"click":[32,63,99,192],"for":[34,123],"(webpage,":[35,112],"advertisement)":[36],"pairs":[37,114],"(called":[38],"impressions)":[39],"where":[40],"both":[41],"pages":[43,91],"and":[44,67,96,150],"ads":[46],"are":[47,65,148],"classified":[48],"into":[49],"that":[51,169],"capture":[52],"broad":[53],"contextual":[54],"information":[55],"different":[57],"levels":[58],"granularity.":[60],"Typically":[61],"low":[66],"coverage":[69],"is":[73],"sparse.":[74],"To":[75],"overcome":[76],"these":[77],"difficulties":[78],"devise":[80],"a":[81,102,142,159],"sampling":[82,125],"method":[83,181],"whereby":[84],"analyze":[86],"aspecially":[87],"chosen":[88],"sample":[89],"in":[92,176,188],"training":[94,178],"set,":[95,179],"then":[97],"estimate":[98],"two-stage":[103],"model.":[104,145],"The":[105,127],"first":[106],"stage":[107,129],"imputes":[108],"number":[110],"ad)":[113],"all":[116,133],"resolutions":[117,134],"hierarchy":[120],"adjust":[122],"bias.":[126],"second":[128],"estimates":[130],"clickrates":[131],"after":[135],"incorporating":[136],"correlations":[137],"among":[138],"sibling":[139],"nodes":[140],"through":[141],"tree-structured":[143],"Markov":[144],"Both":[146],"models":[147],"scalable":[149],"suited":[151],"large":[153],"scale":[154],"data":[155],"mining":[156],"applications.":[157],"On":[158],"real-world":[160],"dataset":[161],"consisting":[162],"1/2":[164],"billion":[165],"impressions,":[166],"demonstrate":[168],"even":[170],"with":[171],"95%":[172],"negative":[173],"(non-clicked)":[174],"events":[175,187],"our":[180],"can":[182],"effectively":[183],"discriminate":[184],"terms":[189],"their":[191],"propensity.":[193]},"counts_by_year":[{"year":2024,"cited_by_count":1},{"year":2021,"cited_by_count":2},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":3},{"year":2015,"cited_by_count":1},{"year":2014,"cited_by_count":3},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":4}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
