{"id":"https://openalex.org/W4404181101","doi":"https://doi.org/10.14778/3685800.3685880","title":"LakeCompass: An End-to-End System for Data Maintenance, Search and Analysis in Data Lakes","display_name":"LakeCompass: An End-to-End System for Data Maintenance, Search and Analysis in Data Lakes","publication_year":2024,"publication_date":"2024-08-01","ids":{"openalex":"https://openalex.org/W4404181101","doi":"https://doi.org/10.14778/3685800.3685880"},"language":"en","primary_location":{"id":"doi:10.14778/3685800.3685880","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3685800.3685880","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5054869135","display_name":"Chengliang Chai","orcid":"https://orcid.org/0009-0003-5386-1330"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chengliang Chai","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044971195","display_name":"Yuhao Deng","orcid":"https://orcid.org/0009-0002-4473-4527"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuhao Deng","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011258051","display_name":"Yihua Zhan","orcid":"https://orcid.org/0009-0004-3347-9764"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yutong Zhan","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101316745","display_name":"Ziqi Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziqi Cao","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056366190","display_name":"Yuan\u2010Fang Zhang","orcid":"https://orcid.org/0000-0002-2903-9027"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuanfang Zhang","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049926126","display_name":"Lei Cao","orcid":"https://orcid.org/0000-0001-9909-8607"},"institutions":[{"id":"https://openalex.org/I138006243","display_name":"University of Arizona","ror":"https://ror.org/03m2x1q45","country_code":"US","type":"education","lineage":["https://openalex.org/I138006243"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lei Cao","raw_affiliation_strings":["University of Arizona/MIT"],"affiliations":[{"raw_affiliation_string":"University of Arizona/MIT","institution_ids":["https://openalex.org/I138006243"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100339106","display_name":"Yu\u2010Ping Wang","orcid":"https://orcid.org/0000-0001-9340-5864"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuping Wang","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061240612","display_name":"Zhiwei Zhang","orcid":"https://orcid.org/0000-0003-3482-6831"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhiwei Zhang","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5117866386","display_name":"Ye Yuan","orcid":null},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ye Yuan","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054991337","display_name":"Guoren Wang","orcid":"https://orcid.org/0000-0002-0181-8379"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guoren Wang","raw_affiliation_strings":["Beijing Institute of Technology"],"affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology","institution_ids":["https://openalex.org/I125839683"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101824160","display_name":"Nan Tang","orcid":"https://orcid.org/0000-0003-2832-0295"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nan Tang","raw_affiliation_strings":["HKUST (GZ)"],"affiliations":[{"raw_affiliation_string":"HKUST (GZ)","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":11,"corresponding_author_ids":["https://openalex.org/A5054869135"],"corresponding_institution_ids":["https://openalex.org/I125839683"],"apc_list":null,"apc_paid":null,"fwci":2.9865,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.91747537,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":"17","issue":"12","first_page":"4381","last_page":"4384"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9890999794006348,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/end-to-end-principle","display_name":"End-to-end principle","score":0.6842248439788818},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4562583565711975},{"id":"https://openalex.org/keywords/end-user","display_name":"End user","score":0.42252254486083984},{"id":"https://openalex.org/keywords/data-science","display_name":"Data science","score":0.34820258617401123},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.23301944136619568},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.09611836075782776}],"concepts":[{"id":"https://openalex.org/C74296488","wikidata":"https://www.wikidata.org/wiki/Q2527392","display_name":"End-to-end principle","level":2,"score":0.6842248439788818},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4562583565711975},{"id":"https://openalex.org/C91262260","wikidata":"https://www.wikidata.org/wiki/Q528074","display_name":"End user","level":2,"score":0.42252254486083984},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.34820258617401123},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.23301944136619568},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.09611836075782776}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3685800.3685880","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3685800.3685880","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":6,"referenced_works":["https://openalex.org/W2810954846","https://openalex.org/W2970059736","https://openalex.org/W3196904276","https://openalex.org/W4283367762","https://openalex.org/W4375928372","https://openalex.org/W6753529518"],"related_works":["https://openalex.org/W4299590256","https://openalex.org/W2151749779","https://openalex.org/W3163634122","https://openalex.org/W2110442089","https://openalex.org/W3119482857","https://openalex.org/W2919182614","https://openalex.org/W2166381389","https://openalex.org/W4393280045","https://openalex.org/W2054736184","https://openalex.org/W3159728998"],"abstract_inverted_index":{"Searching":[0],"tables":[1,86,111],"from":[2],"poorly":[3],"maintained":[4],"data":[5,19],"lakes":[6],"has":[7],"long":[8],"been":[9],"recognized":[10],"as":[11,47],"a":[12],"formidable":[13],"challenge":[14],"in":[15,118],"the":[16,34,114],"realm":[17],"of":[18,36,43,91],"management.":[20],"There":[21],"are":[22,93],"three":[23],"pivotal":[24],"tasks:":[25],"keyword-based,":[26],"joinable":[27],"and":[28,73,128],"unionable":[29],"table":[30],"search,":[31],"which":[32,88],"form":[33],"backbone":[35],"tasks":[37,69],"that":[38,60],"aim":[39],"to":[40,95,112,131],"make":[41],"sense":[42],"diverse":[44,89],"datasets,":[45],"such":[46],"machine":[48],"learning.":[49],"In":[50],"this":[51],"demo,":[52],"we":[53,123],"propose":[54],"LakeCompass,":[55],"an":[56,119],"end-to-end":[57],"prototype":[58],"system":[59],"maintains":[61],"abundant":[62],"tabular":[63],"data,":[64],"supports":[65],"all":[66],"above":[67],"search":[68,98],"with":[70],"high":[71],"efficacy,":[72],"well":[74],"serves":[75],"downstream":[76,115],"ML":[77],"modeling.":[78],"To":[79],"be":[80],"specific,":[81],"LakeCompass":[82,105],"manages":[83],"numerous":[84],"real":[85],"over":[87],"types":[90],"indexes":[92],"built":[94],"support":[96],"efficient":[97],"based":[99],"on":[100],"different":[101],"user":[102,134],"requirements.":[103],"Particularly,":[104],"could":[106],"automatically":[107],"integrate":[108],"these":[109],"discovered":[110],"improve":[113],"model":[116],"performance":[117],"iterative":[120],"approach.":[121],"Finally,":[122],"provide":[124],"both":[125],"Python":[126],"APIs":[127],"Web":[129],"interface":[130],"facilitate":[132],"flexible":[133],"interaction.":[135]},"counts_by_year":[{"year":2025,"cited_by_count":6}],"updated_date":"2026-03-24T08:02:53.985720","created_date":"2025-10-10T00:00:00"}
