{"id":"https://openalex.org/W4413968267","doi":"https://doi.org/10.14778/3746405.3746437","title":"ArrayMorph: Optimizing Hyperslab Queries on the Cloud for Machine Learning Pipelines","display_name":"ArrayMorph: Optimizing Hyperslab Queries on the Cloud for Machine Learning Pipelines","publication_year":2025,"publication_date":"2025-05-01","ids":{"openalex":"https://openalex.org/W4413968267","doi":"https://doi.org/10.14778/3746405.3746437"},"language":"en","primary_location":{"id":"doi:10.14778/3746405.3746437","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3746405.3746437","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5075655663","display_name":"Ruochen Jiang","orcid":"https://orcid.org/0000-0003-3049-9087"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ruochen Jiang","raw_affiliation_strings":["The Ohio State University, Columbus, OH, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001035930","display_name":"Spyros Blanas","orcid":"https://orcid.org/0009-0004-2703-7177"},"institutions":[{"id":"https://openalex.org/I52357470","display_name":"The Ohio State University","ror":"https://ror.org/00rs6vg23","country_code":"US","type":"education","lineage":["https://openalex.org/I52357470"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Spyros Blanas","raw_affiliation_strings":["The Ohio State University, Columbus, OH, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"The Ohio State University, Columbus, OH, USA","institution_ids":["https://openalex.org/I52357470"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.32052817,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"18","issue":"9","first_page":"3189","last_page":"3202"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.7729700803756714},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6832060813903809},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.6505066752433777},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.33558282256126404},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.15351903438568115},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.15038156509399414},{"id":"https://openalex.org/keywords/mechanical-engineering","display_name":"Mechanical engineering","score":0.06943288445472717}],"concepts":[{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.7729700803756714},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6832060813903809},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.6505066752433777},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.33558282256126404},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.15351903438568115},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.15038156509399414},{"id":"https://openalex.org/C78519656","wikidata":"https://www.wikidata.org/wiki/Q101333","display_name":"Mechanical engineering","level":1,"score":0.06943288445472717}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3746405.3746437","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3746405.3746437","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W142258998","https://openalex.org/W1516019649","https://openalex.org/W1967091776","https://openalex.org/W1969241434","https://openalex.org/W2011129635","https://openalex.org/W2014830756","https://openalex.org/W2038412523","https://openalex.org/W2048773562","https://openalex.org/W2110086534","https://openalex.org/W2430301697","https://openalex.org/W2440979603","https://openalex.org/W2574839832","https://openalex.org/W2752236330","https://openalex.org/W2894398417","https://openalex.org/W3029471531","https://openalex.org/W3031868945","https://openalex.org/W3101868768","https://openalex.org/W3106045941","https://openalex.org/W3159219445","https://openalex.org/W3159401322","https://openalex.org/W3169404295","https://openalex.org/W4206368588","https://openalex.org/W4210883322","https://openalex.org/W4214582717","https://openalex.org/W4235746825","https://openalex.org/W4243657877","https://openalex.org/W4298816067","https://openalex.org/W4309505072","https://openalex.org/W4323767619","https://openalex.org/W4385623027"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4244478748","https://openalex.org/W3150465815","https://openalex.org/W4223488648","https://openalex.org/W2134969820","https://openalex.org/W2251605416","https://openalex.org/W1997222214","https://openalex.org/W4413232173"],"abstract_inverted_index":{"Cloud":[0,12],"storage":[1,132],"services":[2],"such":[3,83],"as":[4,40,84,158],"Amazon":[5],"S3,":[6],"Azure":[7],"Blob":[8],"Storage,":[9],"and":[10,49,91,104,121,161,176,199],"Google":[11],"Storage":[13],"are":[14],"widely":[15],"used":[16],"to":[17,68,77,142,144,180,183,196],"store":[18],"raw":[19],"data":[20,27,65,108,115,131,150,156,186],"for":[21],"machine":[22],"learning":[23,54],"applications.":[24],"When":[25],"the":[26,31,69,101,114,118,139,152],"is":[28,98,138,177],"later":[29],"processed,":[30],"analysis":[32],"predominantly":[33],"focuses":[34],"on":[35,151],"regions":[36,146],"of":[37,106,113,147],"interest":[38,148],"(such":[39],"a":[41,46,87,93,107,128,165],"small":[42],"bounding":[43],"box":[44],"in":[45],"larger":[47],"image)":[48],"discards":[50],"uninteresting":[51],"regions.":[52],"Machine":[53],"applications":[55,193],"can":[56],"significantly":[57],"accelerate":[58],"their":[59],"I/O":[60],"if":[61],"they":[62],"push":[63],"this":[64],"filtering":[66],"step":[67],"cloud.":[70,153],"Prior":[71],"work":[72],"has":[73],"proposed":[74],"different":[75],"methods":[76],"partially":[78],"read":[79],"array":[80,130],"(tensor)":[81],"objects,":[82],"chunking,":[85],"reading":[86],"contiguous":[88],"byte":[89],"range,":[90],"evaluating":[92],"lambda":[94],"function.":[95],"No":[96],"method":[97,141],"optimal;":[99],"estimating":[100],"total":[102],"time":[103],"cost":[105],"retrieval":[109],"requires":[110],"an":[111],"understanding":[112],"serialization":[116],"order,":[117],"chunk":[119],"size":[120],"platform-specific":[122],"properties.":[123],"This":[124,190],"paper":[125],"introduces":[126],"ArrayMorph,":[127],"cloud-based":[129],"system":[133],"that":[134],"automatically":[135],"determines":[136],"which":[137],"best":[140],"use":[143],"retrieve":[145],"from":[149],"ArrayMorph":[154,169],"formulates":[155],"accesses":[157],"hyperslab":[159],"queries,":[160],"optimizes":[162],"them":[163],"using":[164],"multi-phase":[166],"cost-based":[167],"approach.":[168],"seamlessly":[170],"integrates":[171],"with":[172],"Python/PyTorch-based":[173],"ML":[174,192],"applications,":[175],"experimentally":[178],"shown":[179],"transfer":[181],"up":[182,195],"9.8X":[184],"less":[185],"than":[187,202],"existing":[188],"systems.":[189],"makes":[191],"run":[194],"1.7X":[197],"faster":[198],"9X":[200],"cheaper":[201],"prior":[203],"solutions.":[204]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
