{"id":"https://openalex.org/W4406461021","doi":"https://doi.org/10.1109/bigdata62323.2024.10825377","title":"FaaS and Furious: abstractions and differential caching for efficient data pre-processing","display_name":"FaaS and Furious: abstractions and differential caching for efficient data pre-processing","publication_year":2024,"publication_date":"2024-12-15","ids":{"openalex":"https://openalex.org/W4406461021","doi":"https://doi.org/10.1109/bigdata62323.2024.10825377"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata62323.2024.10825377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825377","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5008079520","display_name":"Jacopo Tagliabue","orcid":"https://orcid.org/0000-0001-8634-6122"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Jacopo Tagliabue","raw_affiliation_strings":["Bauplan Labs,New York,US"],"affiliations":[{"raw_affiliation_string":"Bauplan Labs,New York,US","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114658465","display_name":"Ryan Curtin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ryan Curtin","raw_affiliation_strings":["Bauplan Labs,Atlanta,US"],"affiliations":[{"raw_affiliation_string":"Bauplan Labs,Atlanta,US","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062556651","display_name":"Ciro Greco","orcid":"https://orcid.org/0009-0007-0359-4130"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ciro Greco","raw_affiliation_strings":["Bauplan Labs,New York,US"],"affiliations":[{"raw_affiliation_string":"Bauplan Labs,New York,US","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5008079520"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0984,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.80931308,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"3562","last_page":"3567"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8356032371520996},{"id":"https://openalex.org/keywords/differential","display_name":"Differential (mechanical device)","score":0.509828507900238},{"id":"https://openalex.org/keywords/differential-privacy","display_name":"Differential privacy","score":0.416491836309433},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.23321175575256348}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8356032371520996},{"id":"https://openalex.org/C93226319","wikidata":"https://www.wikidata.org/wiki/Q193137","display_name":"Differential (mechanical device)","level":2,"score":0.509828507900238},{"id":"https://openalex.org/C23130292","wikidata":"https://www.wikidata.org/wiki/Q5275358","display_name":"Differential privacy","level":2,"score":0.416491836309433},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.23321175575256348},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata62323.2024.10825377","is_oa":false,"landing_page_url":"https://doi.org/10.1109/bigdata62323.2024.10825377","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Big Data (BigData)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":21,"referenced_works":["https://openalex.org/W2734941459","https://openalex.org/W2795027513","https://openalex.org/W3082494217","https://openalex.org/W3118813946","https://openalex.org/W3146147323","https://openalex.org/W3182747618","https://openalex.org/W3199439011","https://openalex.org/W4296563717","https://openalex.org/W4353115367","https://openalex.org/W4385774813","https://openalex.org/W4398233610","https://openalex.org/W4399117333","https://openalex.org/W4402041923","https://openalex.org/W6633828322","https://openalex.org/W6750206174","https://openalex.org/W6792927796","https://openalex.org/W6843428833","https://openalex.org/W6850850318","https://openalex.org/W6855224118","https://openalex.org/W6869428873","https://openalex.org/W6874102660"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W3038283795","https://openalex.org/W2604501336","https://openalex.org/W2558166297","https://openalex.org/W2734500670","https://openalex.org/W2315671126","https://openalex.org/W798507144","https://openalex.org/W2964481303"],"abstract_inverted_index":{"Data":[0],"pre-processing":[1,66],"pipelines":[2,20],"are":[3],"the":[4,85],"bread":[5],"and":[6,49,94,97],"butter":[7],"of":[8,62],"any":[9],"successful":[10],"AI":[11],"project.":[12],"We":[13,82],"introduce":[14],"a":[15,22,47],"novel":[16],"programming":[17,91],"model":[18],"for":[19,56],"in":[21,32,65],"data":[23,57,106],"lakehouse,":[24],"allowing":[25],"users":[26],"to":[27,52],"interact":[28],"declaratively":[29],"with":[30,46],"assets":[31],"object":[33],"storage.":[34],"Motivated":[35],"by":[36],"real-world":[37],"industry":[38],"usage":[39],"patterns,":[40],"we":[41],"exploit":[42],"these":[43],"new":[44,86],"abstractions":[45],"columnar":[48],"differential":[50],"cache":[51,87],"maximize":[53],"iteration":[54],"speed":[55],"scientists,":[58],"who":[59],"spent":[60],"most":[61],"their":[63],"time":[64,75,95],"\u2013":[67],"adding":[68],"or":[69,73,79],"removing":[70],"features,":[71],"restricting":[72],"relaxing":[74],"windows,":[76,96],"wrangling":[77],"current":[78],"older":[80],"datasets.":[81],"show":[83],"how":[84],"works":[88],"transparently":[89],"across":[90],"languages,":[92],"schemas":[93],"provide":[98],"preliminary":[99],"evidence":[100],"on":[101,104],"its":[102],"efficiency":[103],"standard":[105],"workloads.":[107]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
