{"id":"https://openalex.org/W2004051715","doi":"https://doi.org/10.1145/2661829.2662044","title":"On Building Decision Trees from Large-scale Data in Applications of On-line Advertising","display_name":"On Building Decision Trees from Large-scale Data in Applications of On-line Advertising","publication_year":2014,"publication_date":"2014-11-03","ids":{"openalex":"https://openalex.org/W2004051715","doi":"https://doi.org/10.1145/2661829.2662044","mag":"2004051715"},"language":"en","primary_location":{"id":"doi:10.1145/2661829.2662044","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2661829.2662044","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd ACM International Conference on Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038200034","display_name":"Shivaram Kalyanakrishnan","orcid":null},"institutions":[{"id":"https://openalex.org/I59270414","display_name":"Indian Institute of Science Bangalore","ror":"https://ror.org/04dese585","country_code":"IN","type":"education","lineage":["https://openalex.org/I59270414"]}],"countries":["IN"],"is_corresponding":true,"raw_author_name":"Shivaram Kalyanakrishnan","raw_affiliation_strings":["Indian Institute of Science, Bengaluru, India","Indian Institute of Science, Bengaluru (India)"],"affiliations":[{"raw_affiliation_string":"Indian Institute of Science, Bengaluru, India","institution_ids":["https://openalex.org/I59270414"]},{"raw_affiliation_string":"Indian Institute of Science, Bengaluru (India)","institution_ids":["https://openalex.org/I59270414"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044522151","display_name":"Deepthi Singh","orcid":null},"institutions":[{"id":"https://openalex.org/I4210142485","display_name":"QNu Labs (India)","ror":"https://ror.org/03xcp1s96","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210142485"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Deepthi Singh","raw_affiliation_strings":["Yahoo Labs Bangalore, Bengaluru, India"],"affiliations":[{"raw_affiliation_string":"Yahoo Labs Bangalore, Bengaluru, India","institution_ids":["https://openalex.org/I4210142485"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5003101801","display_name":"Ravi Kant","orcid":null},"institutions":[{"id":"https://openalex.org/I4210142485","display_name":"QNu Labs (India)","ror":"https://ror.org/03xcp1s96","country_code":"IN","type":"company","lineage":["https://openalex.org/I4210142485"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Ravi Kant","raw_affiliation_strings":["Yahoo Labs Bangalore, Bengaluru, India"],"affiliations":[{"raw_affiliation_string":"Yahoo Labs Bangalore, Bengaluru, India","institution_ids":["https://openalex.org/I4210142485"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5038200034"],"corresponding_institution_ids":["https://openalex.org/I59270414"],"apc_list":null,"apc_paid":null,"fwci":0.818,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.80014418,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":96},"biblio":{"volume":"3","issue":null,"first_page":"669","last_page":"678"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9921000003814697,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11652","display_name":"Imbalanced Data Classification Techniques","score":0.9911999702453613,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.7457693815231323},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7409351468086243},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.7135322093963623},{"id":"https://openalex.org/keywords/clickstream","display_name":"Clickstream","score":0.654029905796051},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6443760991096497},{"id":"https://openalex.org/keywords/decision-tree","display_name":"Decision tree","score":0.5769572854042053},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5502524375915527},{"id":"https://openalex.org/keywords/arity","display_name":"Arity","score":0.47492772340774536},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4538328945636749},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.42906326055526733},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4224357604980469},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3866107761859894},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.19556587934494019},{"id":"https://openalex.org/keywords/web-page","display_name":"Web page","score":0.15414530038833618}],"concepts":[{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.7457693815231323},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7409351468086243},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.7135322093963623},{"id":"https://openalex.org/C138744977","wikidata":"https://www.wikidata.org/wiki/Q5132438","display_name":"Clickstream","level":5,"score":0.654029905796051},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6443760991096497},{"id":"https://openalex.org/C84525736","wikidata":"https://www.wikidata.org/wiki/Q831366","display_name":"Decision tree","level":2,"score":0.5769572854042053},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5502524375915527},{"id":"https://openalex.org/C110546421","wikidata":"https://www.wikidata.org/wiki/Q1315869","display_name":"Arity","level":2,"score":0.47492772340774536},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4538328945636749},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.42906326055526733},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4224357604980469},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3866107761859894},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.19556587934494019},{"id":"https://openalex.org/C21959979","wikidata":"https://www.wikidata.org/wiki/Q36774","display_name":"Web page","level":2,"score":0.15414530038833618},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C127613066","wikidata":"https://www.wikidata.org/wiki/Q557770","display_name":"Web API","level":4,"score":0.0},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.0},{"id":"https://openalex.org/C130436687","wikidata":"https://www.wikidata.org/wiki/Q7978591","display_name":"Web modeling","level":3,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2661829.2662044","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2661829.2662044","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 23rd ACM International Conference on Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5199999809265137,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W1480376833","https://openalex.org/W1504694836","https://openalex.org/W1506806321","https://openalex.org/W1509515766","https://openalex.org/W1521843029","https://openalex.org/W1545265859","https://openalex.org/W1554944419","https://openalex.org/W1585743408","https://openalex.org/W1601142477","https://openalex.org/W1663973292","https://openalex.org/W1680392829","https://openalex.org/W1780185704","https://openalex.org/W1969675113","https://openalex.org/W1970210633","https://openalex.org/W1990381576","https://openalex.org/W1990777911","https://openalex.org/W1995200249","https://openalex.org/W1995945562","https://openalex.org/W2008183828","https://openalex.org/W2009708807","https://openalex.org/W2012905273","https://openalex.org/W2018049374","https://openalex.org/W2020663993","https://openalex.org/W2023163512","https://openalex.org/W2043779491","https://openalex.org/W2070996757","https://openalex.org/W2073241381","https://openalex.org/W2073358075","https://openalex.org/W2073404525","https://openalex.org/W2073459066","https://openalex.org/W2093217068","https://openalex.org/W2098824882","https://openalex.org/W2107103101","https://openalex.org/W2112651261","https://openalex.org/W2141014056","https://openalex.org/W2149706766","https://openalex.org/W2162979096","https://openalex.org/W2173213060","https://openalex.org/W2189465200","https://openalex.org/W2294062369","https://openalex.org/W2787894218","https://openalex.org/W2791559636","https://openalex.org/W2911964244","https://openalex.org/W3002175806","https://openalex.org/W3100094457","https://openalex.org/W3106889297","https://openalex.org/W3125937743","https://openalex.org/W6629510986","https://openalex.org/W6676297361","https://openalex.org/W6687322159","https://openalex.org/W6697367263"],"related_works":["https://openalex.org/W46644190","https://openalex.org/W4362597605","https://openalex.org/W1550666490","https://openalex.org/W1574414179","https://openalex.org/W1721465857","https://openalex.org/W1479691804","https://openalex.org/W4297676672","https://openalex.org/W3009056573","https://openalex.org/W4402156073","https://openalex.org/W2252427982"],"abstract_inverted_index":{"Decision":[0],"trees":[1,66,115],"have":[2],"been":[3],"used":[4],"for":[5,71],"several":[6],"decades":[7],"as":[8,34,76,125],"simple":[9],"and":[10,56,132,142],"effective":[11],"solutions":[12],"to":[13,20,88,93,102,129],"supervised":[14],"learning":[15],"problems.":[16],"Their":[17],"success":[18],"extends":[19],"tasks":[21,151],"across":[22],"a":[23,100,126],"variety":[24],"of":[25,45,73,164],"areas.":[26],"Yet,":[27],"data":[28],"collected":[29],"today":[30],"through":[31],"web-domains":[32],"such":[33],"on-line":[35,74,153],"advertising":[36,75],"presents":[37],"many":[38],"new":[39],"challenges:":[40],"sheer":[41],"size,":[42],"the":[43,59,162],"prevalence":[44],"high-arity":[46,95],"categorical":[47,96],"features,":[48,97],"unknown":[49],"feature-values,":[50],"\"cold":[51],"starts\",":[52],"sparse":[53],"training":[54],"instances,":[55],"imbalance":[57],"in":[58,152,161],"class":[60],"labels.":[61],"We":[62],"argue":[63],"that":[64,139],"decision":[65],"remain":[67],"an":[68],"ideal":[69],"choice":[70],"applications":[72],"they":[77],"naturally":[78],"construct":[79],"higher-order":[80],"conjunctive":[81],"features;":[82],"we":[83,98,122,136],"then":[84],"contribute":[85],"two":[86],"ideas":[87],"improve":[89],"tree-building":[90],"accordingly.":[91],"First,":[92],"handle":[94],"introduce":[99],"method":[101],"cluster":[103],"feature-values":[104],"based":[105],"on":[106,147],"their":[107],"output":[108],"responses.":[109],"The":[110],"result":[111],"is":[112],"more":[113],"\"data-dense\"":[114],"with":[116],"relatively":[117],"small":[118],"branching":[119],"factors.":[120],"Second,":[121],"employ":[123],"cross-validation":[124],"principled":[127],"approach":[128],"derive":[130],"splitting":[131],"stopping":[133],"criteria:":[134],"thereby":[135],"identify":[137],"splits":[138],"generalize":[140],"well,":[141],"also":[143],"curb":[144],"overfitting.":[145],"Evaluated":[146],"three":[148],"distinct":[149],"probability-estimation":[150],"advertising,":[154],"our":[155],"method,":[156],"\"CCDT\",":[157],"shows":[158],"significant":[159],"improvements":[160],"accuracy":[163],"prediction.":[165]},"counts_by_year":[{"year":2019,"cited_by_count":2},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
