{"id":"https://openalex.org/W4387847216","doi":"https://doi.org/10.1145/3583780.3615051","title":"Selecting Top-k Data Science Models by Example Dataset","display_name":"Selecting Top-k Data Science Models by Example Dataset","publication_year":2023,"publication_date":"2023-10-21","ids":{"openalex":"https://openalex.org/W4387847216","doi":"https://doi.org/10.1145/3583780.3615051"},"language":"en","primary_location":{"id":"doi:10.1145/3583780.3615051","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3583780.3615051","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100775500","display_name":"Mengying Wang","orcid":"https://orcid.org/0000-0001-8150-8436"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Mengying Wang","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003434623","display_name":"Sheng Guan","orcid":"https://orcid.org/0000-0003-0977-1787"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sheng Guan","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078704605","display_name":"Hanchao Ma","orcid":"https://orcid.org/0000-0002-5811-4305"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hanchao Ma","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026082387","display_name":"Yiyang Bian","orcid":"https://orcid.org/0000-0002-9860-2725"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiyang Bian","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072765591","display_name":"Haolai Che","orcid":"https://orcid.org/0009-0000-1989-0734"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Haolai Che","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064842562","display_name":"Abhishek Daundkar","orcid":"https://orcid.org/0000-0002-8105-8073"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abhishek Daundkar","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050957935","display_name":"Alp Sehirlioglu","orcid":"https://orcid.org/0000-0002-9708-4049"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alp Sehirlioglu","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5071093153","display_name":"Yinghui Wu","orcid":"https://orcid.org/0000-0003-3991-5155"},"institutions":[{"id":"https://openalex.org/I58956616","display_name":"Case Western Reserve University","ror":"https://ror.org/051fd9666","country_code":"US","type":"education","lineage":["https://openalex.org/I58956616"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yinghui Wu","raw_affiliation_strings":["Case Western Reserve University, Cleveland, OH, USA"],"affiliations":[{"raw_affiliation_string":"Case Western Reserve University, Cleveland, OH, USA","institution_ids":["https://openalex.org/I58956616"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5100775500"],"corresponding_institution_ids":["https://openalex.org/I58956616"],"apc_list":null,"apc_paid":null,"fwci":0.3457,"has_fulltext":false,"cited_by_count":2,"citation_normalized_percentile":{"value":0.66700249,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":94,"max":96},"biblio":{"volume":null,"issue":null,"first_page":"2686","last_page":"2695"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9994000196456909,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11273","display_name":"Advanced Graph Neural Networks","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8300362825393677},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.5565716028213501},{"id":"https://openalex.org/keywords/domain-knowledge","display_name":"Domain knowledge","score":0.552977979183197},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.48248007893562317},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4530600309371948},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.45093971490859985},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.44546547532081604},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.4445390999317169},{"id":"https://openalex.org/keywords/data-modeling","display_name":"Data modeling","score":0.4140288829803467},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31966912746429443},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.16608867049217224},{"id":"https://openalex.org/keywords/theoretical-computer-science","display_name":"Theoretical computer science","score":0.12517020106315613}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8300362825393677},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.5565716028213501},{"id":"https://openalex.org/C207685749","wikidata":"https://www.wikidata.org/wiki/Q2088941","display_name":"Domain knowledge","level":2,"score":0.552977979183197},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.48248007893562317},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4530600309371948},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.45093971490859985},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.44546547532081604},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.4445390999317169},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.4140288829803467},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31966912746429443},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.16608867049217224},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.12517020106315613},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C87717796","wikidata":"https://www.wikidata.org/wiki/Q146326","display_name":"Environmental engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3583780.3615051","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3583780.3615051","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.46000000834465027,"id":"https://metadata.un.org/sdg/9","display_name":"Industry, innovation and infrastructure"}],"awards":[{"id":"https://openalex.org/G2296916099","display_name":null,"funder_award_id":"ECCS-1","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G3284713303","display_name":null,"funder_award_id":"ECCS-1933279","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G388053966","display_name":null,"funder_award_id":"CNS-1932574","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G4304986854","display_name":"Collaborative Research: Online Data Stream Fusion and Deep Learning for Virtual Meter in Smart Power Distribution Systems","funder_award_id":"1933279","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5137275545","display_name":null,"funder_award_id":"DE-EE0009353","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"},{"id":"https://openalex.org/G5616988581","display_name":"Elements: Crowdsourced Materials Data Engine for Unpublished XRD Results","funder_award_id":"2104007","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5647725531","display_name":null,"funder_award_id":"CNS-1932574,ECCS-1933279,CNS-2028748,OAC-2104007","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6204808334","display_name":null,"funder_award_id":"1932574","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6242636793","display_name":null,"funder_award_id":"CNS-2028748","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6390304386","display_name":"SaTC: CORE: Small: Scalable Cyber Attack Investigation using Declarative Queriesand Interrogative Analysis","funder_award_id":"2028748","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8296311834","display_name":"Technician Support:  Stable Isotope Laboratory at the University of Tennessee","funder_award_id":"0004104","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8810070980","display_name":null,"funder_award_id":"DE-EE0009353,DE-NA0004104","funder_id":"https://openalex.org/F4320306084","funder_display_name":"U.S. Department of Energy"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320306084","display_name":"U.S. Department of Energy","ror":"https://ror.org/01bj3aw27"},{"id":"https://openalex.org/F4320337392","display_name":"Division of Electrical, Communications and Cyber Systems","ror":"https://ror.org/01krpsy48"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":20,"referenced_works":["https://openalex.org/W2132708887","https://openalex.org/W2165698076","https://openalex.org/W2475334473","https://openalex.org/W2913560138","https://openalex.org/W2914721378","https://openalex.org/W2945526235","https://openalex.org/W2945623882","https://openalex.org/W2945827670","https://openalex.org/W2963146368","https://openalex.org/W2981848390","https://openalex.org/W3045200674","https://openalex.org/W3100278010","https://openalex.org/W3106439716","https://openalex.org/W3198659451","https://openalex.org/W3209295695","https://openalex.org/W4205556549","https://openalex.org/W4210334834","https://openalex.org/W4226237846","https://openalex.org/W4284707622","https://openalex.org/W6968855694"],"related_works":["https://openalex.org/W1995889332","https://openalex.org/W3104163240","https://openalex.org/W2804364458","https://openalex.org/W4298130764","https://openalex.org/W2132641928","https://openalex.org/W2090259340","https://openalex.org/W4310225030","https://openalex.org/W2083665254","https://openalex.org/W2393816671","https://openalex.org/W3008693296"],"abstract_inverted_index":{"Data":[0],"analytical":[1,213],"pipelines":[2,52],"routinely":[3],"involve":[4],"various":[5],"domain-specific":[6],"data":[7,50],"science":[8],"models.":[9],"Such":[10],"models":[11,31,48,107,151,166,184],"require":[12],"expensive":[13,21],"manual":[14],"or":[15],"training":[16],"effort":[17],"and":[18,38,45,98,125,185,209],"often":[19],"incur":[20],"validation":[22],"costs":[23],"(e.g.,":[24],"via":[25],"scientific":[26],"simulation":[27],"analysis).":[28],"Meanwhile,":[29],"high-value":[30],"remain":[32],"to":[33,111,146,181],"be":[34],"ad-hocly":[35],"created,":[36],"isolated,":[37],"underutilized":[39],"for":[40,49,57],"a":[41,66,84,89,103,122,127,131,141,153,158,177,197],"broad":[42],"community.":[43],"Searching":[44],"accessing":[46],"proper":[47],"analysis":[51],"is":[53,167],"desirable":[54],"yet":[55],"challenging":[56],"users":[58],"without":[59,161],"domain":[60],"knowledge.":[61],"This":[62],"paper":[63],"introduces":[64],"ModsNet,":[65],"novel":[67],"MODel":[68],"SelectioN":[69],"framework":[70,129],"that":[71,108],"only":[72],"requires":[73],"an":[74,99],"Example":[75],"daTaset.":[76],"(1)":[77,138],"We":[78,120,189],"investigate":[79],"the":[80,113,116,172],"following":[81],"problem:":[82],"Given":[83],"library":[85],"of":[86,92,95,191,196],"pre-trained":[87,150],"models,":[88],"limited":[90],"amount":[91],"historical":[93],"observations":[94],"their":[96,186],"performance,":[97],"\"example\"":[100],"dataset":[101,160],"as":[102],"query,":[104],"return":[105],"k":[106],"are":[109],"expected":[110],"perform":[112],"best":[114],"over":[115,211],"query":[117],"dataset.":[118],"(2)":[119,169],"formulate":[121],"regression":[123],"problem":[124],"introduce":[126],"knowledge-enhanced":[128],"using":[130],"model-data":[132],"interaction":[133,163],"graph.":[134],"Unlike":[135],"traditional":[136],"methods,":[137],"ModsNet":[139,192],"uses":[140],"dynamic,":[142],"cost-bounded":[143],"\"probe-and-select\"":[144],"strategy":[145,180],"incrementally":[147],"identify":[148],"promising":[149],"in":[152],"strict":[154],"cold-start":[155],"scenario":[156],"(when":[157],"new":[159],"any":[162],"with":[164],"existing":[165],"given).":[168],"To":[170],"reduce":[171],"learning":[173],"cost,":[174],"we":[175],"develop":[176],"clustering-based":[178],"sparsification":[179],"prune":[182],"unpromising":[183],"interactions.":[187],"(3)":[188],"showcase":[190],"built":[193],"on":[194],"top":[195],"crowdsourced":[198],"materials":[199],"knowledge":[200],"base":[201],"platform.":[202],"Our":[203],"experiments":[204],"verified":[205],"its":[206],"effectiveness,":[207],"efficiency,":[208],"applications":[210],"real-world":[212],"pipelines.":[214]},"counts_by_year":[{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
