{"id":"https://openalex.org/W3136696550","doi":"https://doi.org/10.1109/bigdata50022.2020.9378082","title":"Smart-ML: A System for Machine Learning Model Exploration using Pipeline Graph","display_name":"Smart-ML: A System for Machine Learning Model Exploration using Pipeline Graph","publication_year":2020,"publication_date":"2020-12-10","ids":{"openalex":"https://openalex.org/W3136696550","doi":"https://doi.org/10.1109/bigdata50022.2020.9378082","mag":"3136696550"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata50022.2020.9378082","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata50022.2020.9378082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5033934770","display_name":"Dhaval Patel","orcid":"https://orcid.org/0000-0002-5449-6975"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Dhaval Patel","raw_affiliation_strings":["AI Applications, IBM Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"AI Applications, IBM Research, NY, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044958272","display_name":"Shrey Shrivastava","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shrey Shrivastava","raw_affiliation_strings":["AI Applications, IBM Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"AI Applications, IBM Research, NY, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064019498","display_name":"Wesley M. Gifford","orcid":"https://orcid.org/0000-0003-3678-8410"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wesley Gifford","raw_affiliation_strings":["AI Applications, IBM Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"AI Applications, IBM Research, NY, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059334687","display_name":"Stuart Siegel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stuart Siegel","raw_affiliation_strings":["AI Applications, IBM Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"AI Applications, IBM Research, NY, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057936833","display_name":"Jayant Kalagnanam","orcid":"https://orcid.org/0009-0009-5051-2606"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jayant Kalagnanam","raw_affiliation_strings":["AI Applications, IBM Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"AI Applications, IBM Research, NY, USA","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5112852091","display_name":"Chandra Reddy","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chandra Reddy","raw_affiliation_strings":["AI Applications, IBM Research, NY, USA"],"affiliations":[{"raw_affiliation_string":"AI Applications, IBM Research, NY, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5033934770"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.6628,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.77079943,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9943000078201294,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8241598606109619},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6467914581298828},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.5881341695785522},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.5155186653137207},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5035578608512878},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5027120113372803},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.47659438848495483},{"id":"https://openalex.org/keywords/graph-database","display_name":"Graph database","score":0.4601393938064575},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4262908101081848},{"id":"https://openalex.org/keywords/directed-acyclic-graph","display_name":"Directed acyclic graph","score":0.41145703196525574},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.36293283104896545},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.3618907332420349},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.2016792893409729},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.1878138780593872},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.15722909569740295}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8241598606109619},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6467914581298828},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.5881341695785522},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.5155186653137207},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5035578608512878},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5027120113372803},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.47659438848495483},{"id":"https://openalex.org/C176225458","wikidata":"https://www.wikidata.org/wiki/Q595971","display_name":"Graph database","level":3,"score":0.4601393938064575},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4262908101081848},{"id":"https://openalex.org/C74197172","wikidata":"https://www.wikidata.org/wiki/Q1195339","display_name":"Directed acyclic graph","level":2,"score":0.41145703196525574},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.36293283104896545},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3618907332420349},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.2016792893409729},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.1878138780593872},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.15722909569740295},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C87717796","wikidata":"https://www.wikidata.org/wiki/Q146326","display_name":"Environmental engineering","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata50022.2020.9378082","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata50022.2020.9378082","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure","score":0.4099999964237213}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":32,"referenced_works":["https://openalex.org/W2097998348","https://openalex.org/W2101234009","https://openalex.org/W2182361439","https://openalex.org/W2295598076","https://openalex.org/W2295611744","https://openalex.org/W2542459869","https://openalex.org/W2556522401","https://openalex.org/W2798476254","https://openalex.org/W2798650501","https://openalex.org/W2889510677","https://openalex.org/W2941332886","https://openalex.org/W2942646859","https://openalex.org/W2947123069","https://openalex.org/W2948742859","https://openalex.org/W2949676527","https://openalex.org/W2951775784","https://openalex.org/W2963815651","https://openalex.org/W2964022491","https://openalex.org/W2964024268","https://openalex.org/W3040879595","https://openalex.org/W3100008240","https://openalex.org/W3102476541","https://openalex.org/W3105704032","https://openalex.org/W6674385629","https://openalex.org/W6675354045","https://openalex.org/W6685961532","https://openalex.org/W6697084357","https://openalex.org/W6730169791","https://openalex.org/W6762022119","https://openalex.org/W6762903864","https://openalex.org/W6780874407","https://openalex.org/W6786310888"],"related_works":["https://openalex.org/W2593692294","https://openalex.org/W2291678262","https://openalex.org/W4282570934","https://openalex.org/W1971922661","https://openalex.org/W1984775058","https://openalex.org/W1817956424","https://openalex.org/W2060064441","https://openalex.org/W4245771833","https://openalex.org/W3094989083","https://openalex.org/W2020100607"],"abstract_inverted_index":{"In":[0],"this":[1],"paper,":[2],"we":[3,125,160],"describe":[4],"an":[5,99],"overarching":[6],"ML":[7,19,53,68,144],"system":[8,31],"with":[9,94,122],"a":[10,33,62,95,103,116,127,141],"simple":[11],"programming":[12,35],"interface":[13,64],"that":[14,159],"leverages":[15],"existing":[16],"AI":[17,155],"and":[18,74,86,98,130,157,187],"frameworks":[20],"to":[21,101,135,140,151,164],"make":[22],"the":[23,58,91,137,165,175],"task":[24],"of":[25,45,106,143,182],"model":[26],"exploration":[27,133],"easier.":[28],"The":[29],"proposed":[30],"introduces":[32],"new":[34],"construct":[36],"namely":[37],"pipeline":[38,59,92,119],"graph":[39,60,93,120],"(a":[40],"directed":[41],"acyclic":[42],"graph)":[43],"consisting":[44],"multiple":[46],"machine":[47],"learning":[48],"operations":[49],"provided":[50,126],"by":[51],"different":[52,67,82],"repositories.":[54],"End":[55],"user":[56],"uses":[57],"as":[61,71],"common":[63],"for":[65],"modeling":[66],"tasks":[69],"such":[70],"classification,":[72],"regression,":[73],"timeseries":[75],"prediction,":[76],"while":[77,168],"enabling":[78],"efficient":[79,131],"execution":[80],"on":[81,184],"environments":[83],"(Spark,":[84],"Celery":[85],"Cloud).":[87],"We":[88,146],"further":[89],"annotated":[90],"hyper-parameter":[96],"grid":[97],"option":[100],"try-out":[102],"wide":[104],"range":[105],"optimization":[107],"strategies":[108],"(i.e.,":[109],"Random,":[110],"Bayesian,":[111],"Bandit,":[112],"AutoLearn,":[113],"etc).":[114],"Given":[115],"large":[117],"pre-defined":[118],"along":[121],"its":[123],"hyper-parameters,":[124],"general-purpose,":[128],"scalable":[129],"pipeline-graph":[132],"technique":[134],"provide":[136],"automated":[138,149,154],"solutions":[139],"variety":[142],"tasks.":[145],"compare":[147],"our":[148],"approach":[150],"several":[152],"state-of-the-art":[153],"systems":[156],"find":[158],"achieve":[161],"performance":[162],"comparable":[163],"best":[166],"results,":[167],"often":[169],"producing":[170],"simpler":[171],"pipelines":[172],"using":[173],"off":[174],"shelf":[176],"components.":[177],"Our":[178],"evaluation":[179],"suite":[180],"consists":[181],"experiments":[183],"60+":[185],"classifications":[186],"regressions":[188],"datasets.":[189]},"counts_by_year":[{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
