{"id":"https://openalex.org/W4282585030","doi":"https://doi.org/10.1145/3514221.3526054","title":"Photon: A Fast Query Engine for Lakehouse Systems","display_name":"Photon: A Fast Query Engine for Lakehouse Systems","publication_year":2022,"publication_date":"2022-06-10","ids":{"openalex":"https://openalex.org/W4282585030","doi":"https://doi.org/10.1145/3514221.3526054"},"language":"en","primary_location":{"id":"doi:10.1145/3514221.3526054","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3514221.3526054","pdf_url":null,"source":{"id":"https://openalex.org/S4363608845","display_name":"Proceedings of the 2022 International Conference on Management of Data","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Conference on Management of Data","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5039486762","display_name":"Alexander Behm","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Alexander Behm","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014756843","display_name":"Shoumik Palkar","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shoumik Palkar","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5038219269","display_name":"Utkarsh Agarwal","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Utkarsh Agarwal","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042916733","display_name":"Timothy G. Armstrong","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Timothy Armstrong","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073100734","display_name":"David Cashman","orcid":"https://orcid.org/0000-0003-4534-2947"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"David Cashman","raw_affiliation_strings":["Databricks Inc., Toronto, Canada"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., Toronto, Canada","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112840756","display_name":"Ankur Dave","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ankur Dave","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043915113","display_name":"Todd Greenstein","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Todd Greenstein","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085276284","display_name":"Shant Hovsepian","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shant Hovsepian","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071638205","display_name":"Ryan Johnson","orcid":"https://orcid.org/0000-0002-5800-7796"},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ryan Johnson","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057473667","display_name":"Arvind Sai Krishnan","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Arvind Sai Krishnan","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036033566","display_name":"Paul Leventis","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Paul Leventis","raw_affiliation_strings":["Databricks Inc., Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., Amsterdam, Netherlands","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037168792","display_name":"Ala Luszczak","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ala Luszczak","raw_affiliation_strings":["Databricks Inc., Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., Amsterdam, Netherlands","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025654427","display_name":"Prashanth Menon","orcid":"https://orcid.org/0000-0003-1345-6050"},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Prashanth Menon","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053315572","display_name":"Mostafa Mokhtar","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mostafa Mokhtar","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032233956","display_name":"Gene Pang","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gene Pang","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5052926368","display_name":"Sameer Paranjpye","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sameer Paranjpye","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011987775","display_name":"Greg Rahn","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Greg Rahn","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058202025","display_name":"Bart Samwel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bart Samwel","raw_affiliation_strings":["Databricks Inc., Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., Amsterdam, Netherlands","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021911378","display_name":"Tom van Bussel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tom van Bussel","raw_affiliation_strings":["Databricks Inc., Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., Amsterdam, Netherlands","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056163057","display_name":"Herman van H\u00f6vell","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Herman van Hovell","raw_affiliation_strings":["Databricks Inc., Amsterdam, Netherlands"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., Amsterdam, Netherlands","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025345309","display_name":"Maryann Xue","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Maryann Xue","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000259060","display_name":"Reynold Xin","orcid":null},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Reynold Xin","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005554337","display_name":"Matei Zaharia","orcid":"https://orcid.org/0000-0002-7547-7204"},"institutions":[{"id":"https://openalex.org/I4401726825","display_name":"Databricks (United States)","ror":"https://ror.org/01ynzx943","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726825"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Matei Zaharia","raw_affiliation_strings":["Databricks Inc., San Francisco, CA, USA"],"affiliations":[{"raw_affiliation_string":"Databricks Inc., San Francisco, CA, USA","institution_ids":["https://openalex.org/I4401726825"]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":23,"corresponding_author_ids":["https://openalex.org/A5039486762"],"corresponding_institution_ids":["https://openalex.org/I4401726825"],"apc_list":null,"apc_paid":null,"fwci":6.8687,"has_fulltext":false,"cited_by_count":33,"citation_normalized_percentile":{"value":0.98630705,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2326","last_page":"2339"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9997000098228455,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11719","display_name":"Data Quality and Management","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8311914205551147},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.8084003925323486},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.6307957172393799},{"id":"https://openalex.org/keywords/spark","display_name":"SPARK (programming language)","score":0.599449634552002},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.5444009304046631},{"id":"https://openalex.org/keywords/vectorization","display_name":"Vectorization (mathematics)","score":0.5288136005401611},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.48389872908592224},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.44218388199806213},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.411424458026886},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.3968547582626343},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.37953805923461914},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32674139738082886},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.2299436330795288},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.20939576625823975}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8311914205551147},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.8084003925323486},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.6307957172393799},{"id":"https://openalex.org/C2781215313","wikidata":"https://www.wikidata.org/wiki/Q3493345","display_name":"SPARK (programming language)","level":2,"score":0.599449634552002},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.5444009304046631},{"id":"https://openalex.org/C41681595","wikidata":"https://www.wikidata.org/wiki/Q7917855","display_name":"Vectorization (mathematics)","level":2,"score":0.5288136005401611},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.48389872908592224},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.44218388199806213},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.411424458026886},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.3968547582626343},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.37953805923461914},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32674139738082886},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2299436330795288},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.20939576625823975},{"id":"https://openalex.org/C205649164","wikidata":"https://www.wikidata.org/wiki/Q1071","display_name":"Geography","level":0,"score":0.0},{"id":"https://openalex.org/C13280743","wikidata":"https://www.wikidata.org/wiki/Q131089","display_name":"Geodesy","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C187736073","wikidata":"https://www.wikidata.org/wiki/Q2920921","display_name":"Management","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3514221.3526054","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3514221.3526054","pdf_url":null,"source":{"id":"https://openalex.org/S4363608845","display_name":"Proceedings of the 2022 International Conference on Management of Data","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2022 International Conference on Management of Data","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W174317439","https://openalex.org/W1493893823","https://openalex.org/W1570477871","https://openalex.org/W1746258828","https://openalex.org/W2005294557","https://openalex.org/W2013344760","https://openalex.org/W2038412523","https://openalex.org/W2086977914","https://openalex.org/W2106771621","https://openalex.org/W2106911865","https://openalex.org/W2124011064","https://openalex.org/W2124851765","https://openalex.org/W2137259192","https://openalex.org/W2146757372","https://openalex.org/W2147076738","https://openalex.org/W2430301697","https://openalex.org/W2439390339","https://openalex.org/W2542459869","https://openalex.org/W2765206444","https://openalex.org/W2807799957","https://openalex.org/W2914209329","https://openalex.org/W2949762319","https://openalex.org/W3005237218","https://openalex.org/W3085477028","https://openalex.org/W3136655632","https://openalex.org/W3173180775","https://openalex.org/W3177128963","https://openalex.org/W4292169167"],"related_works":["https://openalex.org/W2762467749","https://openalex.org/W2378211422","https://openalex.org/W2374048355","https://openalex.org/W2161584192","https://openalex.org/W1556784671","https://openalex.org/W2558523485","https://openalex.org/W4379407450","https://openalex.org/W2905107896","https://openalex.org/W2895375519","https://openalex.org/W2356335648"],"abstract_inverted_index":{"Many":[0],"organizations":[1],"are":[2,47],"shifting":[3],"to":[4,37,147],"a":[5,73,149],"data":[6,18,24,50,57],"management":[7],"paradigm":[8],"called":[9],"the":[10,14,42,96,102,155],"\"Lakehouse,\"":[11],"which":[12],"implements":[13],"functionality":[15],"of":[16,22],"structured":[17,56],"warehouses":[19,89],"on":[20,41,55,90],"top":[21],"unstructured":[23],"lakes.":[25],"This":[26],"presents":[27],"new":[28,150],"challenges":[29],"for":[30,77,154],"query":[31,75],"execution":[32],"engines.":[33],"The":[34],"engine":[35,76],"needs":[36],"provide":[38],"good":[39],"performance":[40,54,152],"raw":[43],"uncurated":[44],"datasets":[45],"that":[46,80],"ubiquitous":[48],"in":[49,59,107],"lakes,":[51],"and":[52,93,114,122,129,142],"excellent":[53],"stored":[58],"popular":[60],"columnar":[61],"file":[62],"formats":[63],"like":[64],"Apache":[65,97,123],"Parquet.":[66],"Toward":[67],"these":[68],"goals,":[69],"we":[70,81,105],"present":[71],"Photon,":[72],"vectorized":[74],"Lakehouse":[78],"environments":[79],"developed":[82],"at":[83],"Databricks.":[84],"Photon":[85,108,133],"can":[86],"outperform":[87],"existing":[88,120],"SQL":[91,121],"workloads":[92,138],"also":[94],"supports":[95],"Spark":[98,124],"API.":[99],"We":[100],"discuss":[101],"design":[103],"choices":[104],"made":[106],"(e.g.,":[109],"vectorization":[110],"vs.":[111],"code":[112],"generation)":[113],"describe":[115],"its":[116,126,130],"integration":[117],"with":[118],"our":[119],"runtimes,":[125],"task":[127],"model,":[128],"memory":[131],"manager.":[132],"has":[134,143],"accelerated":[135],"some":[136],"customer":[137],"by":[139],"over":[140],"10x":[141],"recently":[144],"allowed":[145],"Databricks":[146],"set":[148],"audited":[151],"record":[153],"official":[156],"100TB":[157],"TPC-DS":[158],"benchmark.":[159]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":12},{"year":2023,"cited_by_count":8},{"year":2022,"cited_by_count":1}],"updated_date":"2026-04-12T07:58:50.170612","created_date":"2025-10-10T00:00:00"}
