{"id":"https://openalex.org/W2806779957","doi":"https://doi.org/10.1145/3209900.3209908","title":"SchemaDrill","display_name":"SchemaDrill","publication_year":2018,"publication_date":"2018-06-04","ids":{"openalex":"https://openalex.org/W2806779957","doi":"https://doi.org/10.1145/3209900.3209908","mag":"2806779957"},"language":"en","primary_location":{"id":"doi:10.1145/3209900.3209908","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3209900.3209908","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3209900.3209908","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Workshop on Human-In-the-Loop Data Analytics","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3209900.3209908","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023353797","display_name":"William Spoth","orcid":null},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"William Spoth","raw_affiliation_strings":["University at Buffalo, SUNY"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University at Buffalo, SUNY","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101496579","display_name":"Ting Xie","orcid":"https://orcid.org/0000-0001-8742-3855"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ting Xie","raw_affiliation_strings":["University at Buffalo, SUNY"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University at Buffalo, SUNY","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071259962","display_name":"Oliver Kennedy","orcid":"https://orcid.org/0000-0003-0632-1668"},"institutions":[{"id":"https://openalex.org/I63190737","display_name":"University at Buffalo, State University of New York","ror":"https://ror.org/01y64my43","country_code":"US","type":"education","lineage":["https://openalex.org/I63190737"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Oliver Kennedy","raw_affiliation_strings":["University at Buffalo, SUNY"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University at Buffalo, SUNY","institution_ids":["https://openalex.org/I63190737"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101642721","display_name":"Ying Yang","orcid":"https://orcid.org/0000-0003-4758-1917"},"institutions":[{"id":"https://openalex.org/I1342911587","display_name":"Oracle (United States)","ror":"https://ror.org/006c77m33","country_code":"US","type":"company","lineage":["https://openalex.org/I1342911587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ying Yang","raw_affiliation_strings":["Oracle"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Oracle","institution_ids":["https://openalex.org/I1342911587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041506788","display_name":"Beda Christoph Hammerschmidt","orcid":null},"institutions":[{"id":"https://openalex.org/I1342911587","display_name":"Oracle (United States)","ror":"https://ror.org/006c77m33","country_code":"US","type":"company","lineage":["https://openalex.org/I1342911587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Beda Hammerschmidt","raw_affiliation_strings":["Oracle"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Oracle","institution_ids":["https://openalex.org/I1342911587"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5111489764","display_name":"Zhen Hua Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I1342911587","display_name":"Oracle (United States)","ror":"https://ror.org/006c77m33","country_code":"US","type":"company","lineage":["https://openalex.org/I1342911587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhen Hua Liu","raw_affiliation_strings":["Oracle"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Oracle","institution_ids":["https://openalex.org/I1342911587"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007788082","display_name":"Dieter Gawlick","orcid":"https://orcid.org/0000-0002-7882-0565"},"institutions":[{"id":"https://openalex.org/I1342911587","display_name":"Oracle (United States)","ror":"https://ror.org/006c77m33","country_code":"US","type":"company","lineage":["https://openalex.org/I1342911587"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dieter Gawlick","raw_affiliation_strings":["Oracle"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Oracle","institution_ids":["https://openalex.org/I1342911587"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.2338,"has_fulltext":true,"cited_by_count":10,"citation_normalized_percentile":{"value":0.85493922,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"7"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10538","display_name":"Data Mining Algorithms and Applications","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9973999857902527,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/json","display_name":"JSON","score":0.9930790662765503},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8334898352622986},{"id":"https://openalex.org/keywords/schema","display_name":"Schema (genetic algorithms)","score":0.5956409573554993},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5014195442199707},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.4358600378036499}],"concepts":[{"id":"https://openalex.org/C2780416260","wikidata":"https://www.wikidata.org/wiki/Q2063","display_name":"JSON","level":2,"score":0.9930790662765503},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8334898352622986},{"id":"https://openalex.org/C52146309","wikidata":"https://www.wikidata.org/wiki/Q7431116","display_name":"Schema (genetic algorithms)","level":2,"score":0.5956409573554993},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5014195442199707},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.4358600378036499}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3209900.3209908","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3209900.3209908","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3209900.3209908","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Workshop on Human-In-the-Loop Data Analytics","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3209900.3209908","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3209900.3209908","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3209900.3209908","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Workshop on Human-In-the-Loop Data Analytics","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G133560476","display_name":"TWC: Medium: Collaborative: Data is Social: Exploiting Data Relationships to Detect Insider Attacks","funder_award_id":"1409551","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G329461525","display_name":null,"funder_award_id":"IIS-1750460, ACI-1640864, SaTC-1409551","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7478733536","display_name":"CIF21 DIBBs: EI: Vizier, Streamlined Data Curation","funder_award_id":"1640864","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8266101516","display_name":null,"funder_award_id":"IIS-1750460","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8697568595","display_name":"CAREER: Declarative Uncertainty","funder_award_id":"1750460","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2806779957.pdf","grobid_xml":"https://content.openalex.org/works/W2806779957.grobid-xml"},"referenced_works_count":17,"referenced_works":["https://openalex.org/W1597994773","https://openalex.org/W1842847600","https://openalex.org/W1998871699","https://openalex.org/W2064766209","https://openalex.org/W2064853889","https://openalex.org/W2072191579","https://openalex.org/W2079785597","https://openalex.org/W2122789628","https://openalex.org/W2134356404","https://openalex.org/W2170061697","https://openalex.org/W2293962327","https://openalex.org/W2434390175","https://openalex.org/W2438877200","https://openalex.org/W2583864825","https://openalex.org/W2604790380","https://openalex.org/W2751338424","https://openalex.org/W4252403066"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2753132265","https://openalex.org/W4234766820","https://openalex.org/W4321232174","https://openalex.org/W3117520771","https://openalex.org/W2482048793","https://openalex.org/W4388027365","https://openalex.org/W2938860153","https://openalex.org/W4312551432"],"abstract_inverted_index":{"Ad-hoc":[0],"data":[1,52],"models":[2],"like":[3],"JSON":[4,23,51,66,83,126],"make":[5],"it":[6,31,97],"easy":[7],"to":[8,12,34,88,145],"evolve":[9],"schemas":[10,63,127,151],"and":[11,40,95,108,135],"multiplex":[13],"different":[14,150],"data-types":[15],"into":[16,37,99],"a":[17,38,75,129],"single":[18],"stream.":[19],"This":[20],"flexibility":[21],"makes":[22,30],"great":[24],"for":[25,64,79],"generating":[26],"data,":[27],"but":[28],"also":[29],"much":[32],"harder":[33],"query,":[35],"ingest":[36],"database,":[39],"index.":[41],"In":[42],"this":[43],"paper,":[44],"we":[45,57],"explore":[46],"the":[47,59,90,123,153],"first":[48],"step":[49],"of":[50,61,82,113,125,139],"loading:":[53],"schema":[54,118,140],"design.":[55],"Specifically,":[56],"consider":[58],"challenge":[60],"designing":[62],"existing":[65],"datasets":[67],"as":[68],"an":[69],"interactive":[70],"problem.":[71],"We":[72,106],"present":[73],"SchemaDrill,":[74],"roll-up/drill-down":[76],"style":[77],"interface":[78],"exploring":[80],"collections":[81],"records.":[84],"SchemaDrill":[85],"helps":[86],"users":[87,144],"visualize":[89],"collection,":[91],"identify":[92],"relevant":[93],"fragments,":[94],"map":[96],"down":[98],"one":[100],"or":[101],"more":[102],"flat,":[103],"relational":[104],"schemas.":[105],"describe":[107],"evaluate":[109],"two":[110],"key":[111],"components":[112],"SchemaDrill:":[114],"(1)":[115],"A":[116,137],"summary":[117],"representation":[119],"that":[120,142],"significantly":[121],"reduces":[122],"complexity":[124],"without":[128],"meaningful":[130],"reduction":[131],"in":[132,152],"information":[133],"content,":[134],"(2)":[136],"collection":[138],"visualizations":[141],"help":[143],"qualitatively":[146],"survey":[147],"variability":[148],"amongst":[149],"collection.":[154]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":1},{"year":2022,"cited_by_count":3},{"year":2021,"cited_by_count":1},{"year":2020,"cited_by_count":2}],"updated_date":"2026-06-22T08:00:12.763002","created_date":"2018-06-13T00:00:00"}
