{"id":"https://openalex.org/W2035488079","doi":"https://doi.org/10.1109/icde.2013.6544913","title":"Machine learning on Big Data","display_name":"Machine learning on Big Data","publication_year":2013,"publication_date":"2013-04-01","ids":{"openalex":"https://openalex.org/W2035488079","doi":"https://doi.org/10.1109/icde.2013.6544913","mag":"2035488079"},"language":"en","primary_location":{"id":"doi:10.1109/icde.2013.6544913","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde.2013.6544913","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 29th International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5014353497","display_name":"Tyson Condie","orcid":null},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"T. Condie","raw_affiliation_strings":["Cloud and Information Services Lab, Microsoft, Redmond, USA","Cloud & Inf. Services Lab., Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Cloud and Information Services Lab, Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Cloud & Inf. Services Lab., Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009698276","display_name":"Paul Mineiro","orcid":"https://orcid.org/0000-0003-1965-6547"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"P. Mineiro","raw_affiliation_strings":["Cloud and Information Services Lab, Microsoft, Redmond, USA","Cloud & Inf. Services Lab., Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Cloud and Information Services Lab, Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Cloud & Inf. Services Lab., Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010950113","display_name":"Neoklis Polyzotis","orcid":"https://orcid.org/0000-0002-2694-8591"},"institutions":[{"id":"https://openalex.org/I185103710","display_name":"University of California, Santa Cruz","ror":"https://ror.org/03s65by71","country_code":"US","type":"education","lineage":["https://openalex.org/I185103710"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"N. Polyzotis","raw_affiliation_strings":["University of California, Santa Cruz, Santa Cruz, CA, USA","University of California-Santa Cruz, Santa Cruz, CA, USA,"],"affiliations":[{"raw_affiliation_string":"University of California, Santa Cruz, Santa Cruz, CA, USA","institution_ids":["https://openalex.org/I185103710"]},{"raw_affiliation_string":"University of California-Santa Cruz, Santa Cruz, CA, USA,","institution_ids":["https://openalex.org/I185103710"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023179995","display_name":"Markus Weimer","orcid":"https://orcid.org/0009-0003-2620-663X"},"institutions":[{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"M. Weimer","raw_affiliation_strings":["Cloud and Information Services Lab, Microsoft, Redmond, USA","Cloud & Inf. Services Lab., Microsoft, Redmond, WA, USA"],"affiliations":[{"raw_affiliation_string":"Cloud and Information Services Lab, Microsoft, Redmond, USA","institution_ids":["https://openalex.org/I1290206253"]},{"raw_affiliation_string":"Cloud & Inf. Services Lab., Microsoft, Redmond, WA, USA","institution_ids":["https://openalex.org/I1290206253"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5014353497"],"corresponding_institution_ids":["https://openalex.org/I1290206253"],"apc_list":null,"apc_paid":null,"fwci":4.809,"has_fulltext":false,"cited_by_count":34,"citation_normalized_percentile":{"value":0.94825596,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"1242","last_page":"1244"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9939000010490417,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7598240971565247},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6319751739501953},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6172729134559631},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5807788968086243},{"id":"https://openalex.org/keywords/big-data","display_name":"Big data","score":0.5288692116737366},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.47316843271255493},{"id":"https://openalex.org/keywords/artificial-neural-network","display_name":"Artificial neural network","score":0.4721377491950989},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.38173621892929077},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.1373547613620758},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.12370389699935913}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7598240971565247},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6319751739501953},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6172729134559631},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5807788968086243},{"id":"https://openalex.org/C75684735","wikidata":"https://www.wikidata.org/wiki/Q858810","display_name":"Big data","level":2,"score":0.5288692116737366},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.47316843271255493},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.4721377491950989},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.38173621892929077},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.1373547613620758},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.12370389699935913},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icde.2013.6544913","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icde.2013.6544913","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2013 IEEE 29th International Conference on Data Engineering (ICDE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W182911965","https://openalex.org/W1995897489","https://openalex.org/W2046833425","https://openalex.org/W2096544401","https://openalex.org/W2109722477","https://openalex.org/W2124537004","https://openalex.org/W2131975293","https://openalex.org/W2136922672","https://openalex.org/W2146682077","https://openalex.org/W2157462866","https://openalex.org/W2168231600","https://openalex.org/W2170616854","https://openalex.org/W2173213060","https://openalex.org/W2952437656","https://openalex.org/W3133666419","https://openalex.org/W6607435017","https://openalex.org/W6676367512","https://openalex.org/W6679815717","https://openalex.org/W6681710355","https://openalex.org/W6684859321"],"related_works":["https://openalex.org/W4390608645","https://openalex.org/W4247566972","https://openalex.org/W2960264696","https://openalex.org/W3090563135","https://openalex.org/W2497432351","https://openalex.org/W4206777497","https://openalex.org/W4233347783","https://openalex.org/W2910064364","https://openalex.org/W4255224757","https://openalex.org/W1981780420"],"abstract_inverted_index":{"Statistical":[0],"Machine":[1,83,147,155],"Learning":[2,148,156],"has":[3],"undergone":[4],"a":[5,9],"phase":[6],"transition":[7],"from":[8],"pure":[10],"academic":[11],"endeavor":[12],"to":[13,122],"being":[14],"one":[15],"of":[16,20,65,82,109,125,133,146],"the":[17,63,69,89,100,107,110,118,123,126,141],"main":[18],"drivers":[19],"modern":[21],"commerce":[22],"and":[23,37,60,71,88,149],"science.":[24],"Even":[25],"more":[26],"so,":[27],"recent":[28,152],"results":[29],"such":[30],"as":[31],"those":[32],"on":[33,38,95],"tera-scale":[34],"learning":[35,73],"[1]":[36],"very":[39],"large":[40,79],"neural":[41],"networks":[42],"[2]":[43],"suggest":[44],"that":[45],"scale":[46,80],"is":[47],"an":[48],"important":[49],"ingredient":[50],"in":[51,103,106,117,154],"quality":[52],"modeling.":[53],"This":[54,120],"tutorial":[55,76],"introduces":[56],"current":[57,78,101],"applications,":[58],"techniques":[59],"systems":[61,104,138],"with":[62],"aim":[64],"cross-fertilizing":[66],"research":[67,135],"between":[68],"database":[70],"machine":[72],"communities.":[74],"The":[75],"covers":[77],"applications":[81],"Learning,":[84],"their":[85],"computational":[86],"model":[87],"workflow":[90],"behind":[91],"building":[92],"those.":[93],"Based":[94],"this":[96],"foundation,":[97],"we":[98,129],"present":[99],"state-of-the-art":[102],"support":[105,139,150],"bulk":[108],"tutorial.":[111],"We":[112],"also":[113],"identify":[114],"critical":[115],"gaps":[116],"state-of-the-art.":[119],"leads":[121],"closing":[124],"seminar,":[127],"where":[128],"introduce":[130],"two":[131],"sets":[132],"open":[134],"questions:":[136],"Better":[137],"for":[140,151],"already":[142],"established":[143],"use":[144],"cases":[145],"advances":[153],"research.":[157]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":4},{"year":2022,"cited_by_count":3},{"year":2020,"cited_by_count":3},{"year":2019,"cited_by_count":6},{"year":2018,"cited_by_count":5},{"year":2017,"cited_by_count":1},{"year":2016,"cited_by_count":1},{"year":2015,"cited_by_count":5},{"year":2014,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
