{"id":"https://openalex.org/W2005104010","doi":"https://doi.org/10.1145/1809400.1809414","title":"Design and analysis of the KDD cup 2009","display_name":"Design and analysis of the KDD cup 2009","publication_year":2010,"publication_date":"2010-05-27","ids":{"openalex":"https://openalex.org/W2005104010","doi":"https://doi.org/10.1145/1809400.1809414","mag":"2005104010"},"language":"en","primary_location":{"id":"doi:10.1145/1809400.1809414","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1809400.1809414","pdf_url":null,"source":{"id":"https://openalex.org/S4210176598","display_name":"ACM SIGKDD Explorations Newsletter","issn_l":"1931-0145","issn":["1931-0145","1931-0153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGKDD Explorations Newsletter","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5006360335","display_name":"Isabelle Guyon","orcid":"https://orcid.org/0000-0002-9266-1783"},"institutions":[{"id":"https://openalex.org/I4210086945","display_name":"Clopinet","ror":"https://ror.org/000px4v03","country_code":"US","type":"company","lineage":["https://openalex.org/I4210086945"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Isabelle Guyon","raw_affiliation_strings":["Clopinet, Berkeley, California"],"affiliations":[{"raw_affiliation_string":"Clopinet, Berkeley, California","institution_ids":["https://openalex.org/I4210086945"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103118554","display_name":"Vincent Lemaire","orcid":"https://orcid.org/0000-0002-6030-2356"},"institutions":[{"id":"https://openalex.org/I19370010","display_name":"Orange (France)","ror":"https://ror.org/035j0tq82","country_code":"FR","type":"company","lineage":["https://openalex.org/I19370010"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Vincent Lemaire","raw_affiliation_strings":["Orange Labs, Lannion, France"],"affiliations":[{"raw_affiliation_string":"Orange Labs, Lannion, France","institution_ids":["https://openalex.org/I19370010"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111936967","display_name":"Marc Boull\u00e9","orcid":null},"institutions":[{"id":"https://openalex.org/I19370010","display_name":"Orange (France)","ror":"https://ror.org/035j0tq82","country_code":"FR","type":"company","lineage":["https://openalex.org/I19370010"]}],"countries":["FR"],"is_corresponding":false,"raw_author_name":"Marc Boull\u00e9","raw_affiliation_strings":["Orange Labs, Lannion, France"],"affiliations":[{"raw_affiliation_string":"Orange Labs, Lannion, France","institution_ids":["https://openalex.org/I19370010"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062245154","display_name":"Gideon Dror","orcid":null},"institutions":[{"id":"https://openalex.org/I4210141777","display_name":"Academic College of Tel Aviv-Yafo","ror":"https://ror.org/04cg6c004","country_code":"IL","type":"education","lineage":["https://openalex.org/I4210141777"]}],"countries":["IL"],"is_corresponding":false,"raw_author_name":"Gideon Dror","raw_affiliation_strings":["Academic College of TelAvivYaffo, Tel Aviv, Israel"],"affiliations":[{"raw_affiliation_string":"Academic College of TelAvivYaffo, Tel Aviv, Israel","institution_ids":["https://openalex.org/I4210141777"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062753224","display_name":"David S. Vogel","orcid":"https://orcid.org/0000-0002-3591-8490"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"David Vogel","raw_affiliation_strings":["Data Mining Solutions, Orlando, Florida"],"affiliations":[{"raw_affiliation_string":"Data Mining Solutions, Orlando, Florida","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5006360335"],"corresponding_institution_ids":["https://openalex.org/I4210086945"],"apc_list":null,"apc_paid":null,"fwci":3.8819,"has_fulltext":false,"cited_by_count":24,"citation_normalized_percentile":{"value":0.93204578,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":"11","issue":"2","first_page":"68","last_page":"76"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12384","display_name":"Customer churn and segmentation","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12384","display_name":"Customer churn and segmentation","score":0.9896000027656555,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9840999841690063,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11871","display_name":"Advanced Statistical Methods and Models","score":0.9771000146865845,"subfield":{"id":"https://openalex.org/subfields/2613","display_name":"Statistics and Probability"},"field":{"id":"https://openalex.org/fields/26","display_name":"Mathematics"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8094260692596436},{"id":"https://openalex.org/keywords/popularity","display_name":"Popularity","score":0.6814301609992981},{"id":"https://openalex.org/keywords/categorical-variable","display_name":"Categorical variable","score":0.5821848511695862},{"id":"https://openalex.org/keywords/knowledge-extraction","display_name":"Knowledge extraction","score":0.4331839680671692},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.3767877221107483},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3752918541431427},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.375236839056015},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.3325914740562439}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8094260692596436},{"id":"https://openalex.org/C2780586970","wikidata":"https://www.wikidata.org/wiki/Q1357284","display_name":"Popularity","level":2,"score":0.6814301609992981},{"id":"https://openalex.org/C5274069","wikidata":"https://www.wikidata.org/wiki/Q2285707","display_name":"Categorical variable","level":2,"score":0.5821848511695862},{"id":"https://openalex.org/C120567893","wikidata":"https://www.wikidata.org/wiki/Q1582085","display_name":"Knowledge extraction","level":2,"score":0.4331839680671692},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.3767877221107483},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3752918541431427},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.375236839056015},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.3325914740562439},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1809400.1809414","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1809400.1809414","pdf_url":null,"source":{"id":"https://openalex.org/S4210176598","display_name":"ACM SIGKDD Explorations Newsletter","issn_l":"1931-0145","issn":["1931-0145","1931-0153"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ACM SIGKDD Explorations Newsletter","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.47999998927116394}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W174542576","https://openalex.org/W183657245","https://openalex.org/W1480376833","https://openalex.org/W1554944419","https://openalex.org/W1565746575","https://openalex.org/W1678356000","https://openalex.org/W1784548050","https://openalex.org/W1974758710","https://openalex.org/W1980264541","https://openalex.org/W2058815839","https://openalex.org/W2087347434","https://openalex.org/W2105506044","https://openalex.org/W2112076978","https://openalex.org/W2118796860","https://openalex.org/W2148603752","https://openalex.org/W2150446468","https://openalex.org/W2168278308","https://openalex.org/W2911964244","https://openalex.org/W2912934387","https://openalex.org/W2997546679","https://openalex.org/W3000180494","https://openalex.org/W3001304634","https://openalex.org/W3154964538","https://openalex.org/W4241727697","https://openalex.org/W4285719527","https://openalex.org/W6676769703","https://openalex.org/W6677732441","https://openalex.org/W6738852829","https://openalex.org/W7071374342"],"related_works":["https://openalex.org/W2368605798","https://openalex.org/W2518037665","https://openalex.org/W2348524959","https://openalex.org/W2368049389","https://openalex.org/W2170801710","https://openalex.org/W2384861574","https://openalex.org/W2952704802","https://openalex.org/W4294565801","https://openalex.org/W2142306706","https://openalex.org/W2477036161"],"abstract_inverted_index":{"We":[0,116],"organized":[1],"the":[2,11,61,71,93,129,170,173,179,227,232,278,281],"KDD":[3,45,233],"cup":[4],"2009":[5,47],"around":[6],"a":[7,29,37,56,136,149,156,217],"marketing":[8,42,58],"problem":[9,126],"with":[10,184,259],"goal":[12],"of":[13,19,40,73,138,152,159,169,172,181,226,251,262,268,272,280],"identifying":[14],"data":[15,276],"mining":[16],"techniques":[17],"capable":[18],"rapidly":[20],"building":[21],"predictive":[22],"models":[23],"and":[24,140,155,178,201,216,248,264,270,277,287],"scoring":[25],"new":[26,80],"entries":[27],"on":[28,55],"large":[30,57,150,157,260],"database.":[31],"Customer":[32],"Relationship":[33],"Management":[34],"(CRM)":[35],"is":[36],"key":[38],"element":[39],"modern":[41],"strategies.":[43],"The":[44,66,98,224,238,275],"Cup":[46],"offered":[48],"to":[49,53,69,75,89,91,105,120,128,219,257],"participants":[50,112,222],"an":[51],"opportunity":[52],"work":[54],"database":[59],"from":[60,102,113,206],"French":[62],"Telecom":[63],"company":[64],"Orange.":[65],"tasks":[67],"were":[68,229],"predict":[70],"propensity":[72],"customers":[74],"switch":[76],"provider":[77],"(churn),":[78],"buy":[79,86],"products":[81],"or":[82,85],"services":[83],"(appetency),":[84],"upgrades/addons":[87],"proposed":[88],"them":[90],"make":[92],"sale":[94],"more":[95],"profitable":[96],"(upselling).":[97],"challenge,":[99],"which":[100],"lasted":[101],"March":[103],"10":[104],"May":[106],"11,":[107],"2009,":[108],"attracted":[109],"over":[110],"450":[111],"46":[114],"countries.":[115],"attribute":[117],"its":[118],"popularity":[119],"several":[121],"factors:":[122],"(1)":[123],"A":[124,197],"generic":[125],"relevant":[127],"Industry":[130],"(a":[131],"classification":[132],"problem),":[133],"but":[134],"presenting":[135],"number":[137,151,158],"scientific":[139],"technical":[141],"challenges,":[142],"including":[143],"many":[144,185],"missing":[145,273],"values":[146],"(about":[147],"60%),":[148],"features":[153],"(15000)":[154],"training":[160],"examples":[161,171],"(50000),":[162],"unbalanced":[163],"class":[164],"proportions":[165],"(fewer":[166],"than":[167],"10%":[168],"positive":[174],"class),":[175],"noisy":[176],"data,":[177],"presence":[180],"categorical":[182],"variables":[183],"different":[186],"values.":[187,274],"(2)":[188],"Prizes":[189],"(Orange":[190],"offers":[191],"10000":[192],"Euros":[193],"in":[194],"prizes).":[195],"(3)":[196],"well":[198],"designed":[199],"protocol":[200],"web":[202],"site":[203],"(we":[204],"benefitted":[205],"past":[207],"experience).":[208],"(4)":[209],"An":[210],"effective":[211,247],"advertising":[212],"campaign":[213],"using":[214],"mailings":[215],"teleconference":[218],"answer":[220],"potential":[221],"questions.":[223],"results":[225],"challenge":[228,282],"discussed":[230],"at":[231,290],"conference":[234],"(June":[235],"28,":[236],"2009).":[237],"principal":[239],"conclusions":[240],"are":[241,245],"that":[242,249],"ensemble":[243,250],"methods":[244],"very":[246],"decision":[252],"trees":[253],"offer":[254],"off-the-shelf":[255],"solutions":[256],"problems":[258],"numbers":[261],"samples":[263],"attributes,":[265],"mixed":[266],"types":[267],"variables,":[269],"lots":[271],"platform":[279],"remain":[283],"available":[284],"for":[285],"research":[286],"educational":[288],"purposes":[289],"http://www.kddcup-orange.com/.":[291]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":2},{"year":2022,"cited_by_count":1},{"year":2020,"cited_by_count":2},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":3},{"year":2017,"cited_by_count":2},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":4},{"year":2014,"cited_by_count":1},{"year":2013,"cited_by_count":2},{"year":2012,"cited_by_count":2}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
