{"id":"https://openalex.org/W4417403178","doi":"https://doi.org/10.1109/pact65351.2025.00026","title":"DMO-DB: Mitigating the Data Movement Bottlenecks of GPU-Accelerated Relational OLAP","display_name":"DMO-DB: Mitigating the Data Movement Bottlenecks of GPU-Accelerated Relational OLAP","publication_year":2025,"publication_date":"2025-11-03","ids":{"openalex":"https://openalex.org/W4417403178","doi":"https://doi.org/10.1109/pact65351.2025.00026"},"language":null,"primary_location":{"id":"doi:10.1109/pact65351.2025.00026","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact65351.2025.00026","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 34th International Conference on Parallel Architectures and Compilation Techniques (PACT)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102016776","display_name":"Chaemin Lim","orcid":"https://orcid.org/0000-0002-2665-6273"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Chaemin Lim","raw_affiliation_strings":["Yonsei University,Department of Computer Science and Engineering,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University,Department of Computer Science and Engineering,Seoul,South Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101426506","display_name":"Soo-Hyun Lee","orcid":"https://orcid.org/0000-0001-5257-2068"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Suhyun Lee","raw_affiliation_strings":["Yonsei University,Department of Computer Science and Engineering,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University,Department of Computer Science and Engineering,Seoul,South Korea","institution_ids":["https://openalex.org/I193775966"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101690727","display_name":"Jinwoo Choi","orcid":"https://orcid.org/0000-0001-7122-4309"},"institutions":[{"id":"https://openalex.org/I58716616","display_name":"Korea Institute of Science and Technology","ror":"https://ror.org/05kzfa883","country_code":"KR","type":"facility","lineage":["https://openalex.org/I27494661","https://openalex.org/I2801339556","https://openalex.org/I2801339556","https://openalex.org/I4210144908","https://openalex.org/I4387152098","https://openalex.org/I4387152098","https://openalex.org/I58716616"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jinwoo Choi","raw_affiliation_strings":["Korea Institute of Science and Technology,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"Korea Institute of Science and Technology,Seoul,South Korea","institution_ids":["https://openalex.org/I58716616"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109307149","display_name":"Joon\u2010Sung Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I848706","display_name":"Sungkyunkwan University","ror":"https://ror.org/04q78tk20","country_code":"KR","type":"education","lineage":["https://openalex.org/I848706"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Joonsung Kim","raw_affiliation_strings":["Sungkyunkwan University,Department of Semiconductor Systems Engineering,Suwon,South Korea"],"affiliations":[{"raw_affiliation_string":"Sungkyunkwan University,Department of Semiconductor Systems Engineering,Suwon,South Korea","institution_ids":["https://openalex.org/I848706"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100447633","display_name":"Jinho Lee","orcid":"https://orcid.org/0000-0003-4010-6611"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jinho Lee","raw_affiliation_strings":["Seoul National University,Department of Electrical and Computer Engineering,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"Seoul National University,Department of Electrical and Computer Engineering,Seoul,South Korea","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5088551237","display_name":"Youngsok Kim","orcid":"https://orcid.org/0000-0002-1015-9969"},"institutions":[{"id":"https://openalex.org/I193775966","display_name":"Yonsei University","ror":"https://ror.org/01wjejq96","country_code":"KR","type":"education","lineage":["https://openalex.org/I193775966"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Youngsok Kim","raw_affiliation_strings":["Yonsei University,Department of Computer Science and Engineering,Seoul,South Korea"],"affiliations":[{"raw_affiliation_string":"Yonsei University,Department of Computer Science and Engineering,Seoul,South Korea","institution_ids":["https://openalex.org/I193775966"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5102016776"],"corresponding_institution_ids":["https://openalex.org/I193775966"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.48080698,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"172","last_page":"185"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9111999869346619,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10317","display_name":"Advanced Database Systems and Queries","score":0.9111999869346619,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.03550000116229057,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.008999999612569809,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/online-analytical-processing","display_name":"Online analytical processing","score":0.8119999766349792},{"id":"https://openalex.org/keywords/relational-database","display_name":"Relational database","score":0.6966999769210815},{"id":"https://openalex.org/keywords/sql","display_name":"SQL","score":0.6579999923706055},{"id":"https://openalex.org/keywords/cache","display_name":"Cache","score":0.4650999903678894},{"id":"https://openalex.org/keywords/query-optimization","display_name":"Query optimization","score":0.45980000495910645},{"id":"https://openalex.org/keywords/relational-database-management-system","display_name":"Relational database management system","score":0.4180999994277954},{"id":"https://openalex.org/keywords/pci-express","display_name":"PCI Express","score":0.4052000045776367},{"id":"https://openalex.org/keywords/sargable","display_name":"Sargable","score":0.3986000120639801},{"id":"https://openalex.org/keywords/data-warehouse","display_name":"Data warehouse","score":0.39399999380111694},{"id":"https://openalex.org/keywords/data-structure","display_name":"Data structure","score":0.3939000070095062}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8913999795913696},{"id":"https://openalex.org/C201932085","wikidata":"https://www.wikidata.org/wiki/Q642514","display_name":"Online analytical processing","level":3,"score":0.8119999766349792},{"id":"https://openalex.org/C5655090","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database","level":2,"score":0.6966999769210815},{"id":"https://openalex.org/C510870499","wikidata":"https://www.wikidata.org/wiki/Q47607","display_name":"SQL","level":2,"score":0.6579999923706055},{"id":"https://openalex.org/C115537543","wikidata":"https://www.wikidata.org/wiki/Q165596","display_name":"Cache","level":2,"score":0.4650999903678894},{"id":"https://openalex.org/C157692150","wikidata":"https://www.wikidata.org/wiki/Q2919848","display_name":"Query optimization","level":2,"score":0.45980000495910645},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.44269999861717224},{"id":"https://openalex.org/C24394798","wikidata":"https://www.wikidata.org/wiki/Q192588","display_name":"Relational database management system","level":3,"score":0.4180999994277954},{"id":"https://openalex.org/C64270927","wikidata":"https://www.wikidata.org/wiki/Q206924","display_name":"PCI Express","level":3,"score":0.4052000045776367},{"id":"https://openalex.org/C192939062","wikidata":"https://www.wikidata.org/wiki/Q104840822","display_name":"Sargable","level":4,"score":0.3986000120639801},{"id":"https://openalex.org/C135572916","wikidata":"https://www.wikidata.org/wiki/Q193351","display_name":"Data warehouse","level":2,"score":0.39399999380111694},{"id":"https://openalex.org/C162319229","wikidata":"https://www.wikidata.org/wiki/Q175263","display_name":"Data structure","level":2,"score":0.3939000070095062},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.3855000138282776},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.37540000677108765},{"id":"https://openalex.org/C126831891","wikidata":"https://www.wikidata.org/wiki/Q221673","display_name":"Host (biology)","level":2,"score":0.3700999915599823},{"id":"https://openalex.org/C68339613","wikidata":"https://www.wikidata.org/wiki/Q1549489","display_name":"Speedup","level":2,"score":0.3449000120162964},{"id":"https://openalex.org/C192028432","wikidata":"https://www.wikidata.org/wiki/Q845739","display_name":"Query language","level":2,"score":0.33180001378059387},{"id":"https://openalex.org/C189783530","wikidata":"https://www.wikidata.org/wiki/Q352090","display_name":"CPU cache","level":3,"score":0.3244999945163727},{"id":"https://openalex.org/C40207289","wikidata":"https://www.wikidata.org/wiki/Q755662","display_name":"Relational model","level":3,"score":0.3230000138282776},{"id":"https://openalex.org/C74912251","wikidata":"https://www.wikidata.org/wiki/Q6815727","display_name":"Memory footprint","level":2,"score":0.31709998846054077},{"id":"https://openalex.org/C147224247","wikidata":"https://www.wikidata.org/wiki/Q885373","display_name":"Bloom filter","level":2,"score":0.3116999864578247},{"id":"https://openalex.org/C194222762","wikidata":"https://www.wikidata.org/wiki/Q114486","display_name":"Query by Example","level":4,"score":0.3102000057697296},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.30070000886917114},{"id":"https://openalex.org/C7366592","wikidata":"https://www.wikidata.org/wiki/Q1255620","display_name":"Dram","level":2,"score":0.29899999499320984},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.288100004196167},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.2838999927043915},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.2770000100135803},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.2745000123977661},{"id":"https://openalex.org/C123593499","wikidata":"https://www.wikidata.org/wiki/Q6008583","display_name":"In-Memory Processing","level":5,"score":0.27410000562667847},{"id":"https://openalex.org/C46681722","wikidata":"https://www.wikidata.org/wiki/Q4725589","display_name":"Alias","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C49154492","wikidata":"https://www.wikidata.org/wiki/Q5300","display_name":"Central processing unit","level":2,"score":0.2694000005722046},{"id":"https://openalex.org/C191087605","wikidata":"https://www.wikidata.org/wiki/Q1501395","display_name":"Online transaction processing","level":4,"score":0.2676999866962433},{"id":"https://openalex.org/C56288433","wikidata":"https://www.wikidata.org/wiki/Q58673","display_name":"Data manipulation language","level":2,"score":0.2669000029563904},{"id":"https://openalex.org/C52723943","wikidata":"https://www.wikidata.org/wiki/Q1127410","display_name":"Serialization","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26019999384880066},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.25459998846054077},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.25380000472068787},{"id":"https://openalex.org/C150670458","wikidata":"https://www.wikidata.org/wiki/Q4272815","display_name":"Data transformation","level":3,"score":0.25360000133514404}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/pact65351.2025.00026","is_oa":false,"landing_page_url":"https://doi.org/10.1109/pact65351.2025.00026","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 34th International Conference on Parallel Architectures and Compilation Techniques (PACT)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":55,"referenced_works":["https://openalex.org/W1864199185","https://openalex.org/W1987238352","https://openalex.org/W1992558790","https://openalex.org/W1997824438","https://openalex.org/W2000335122","https://openalex.org/W2012449229","https://openalex.org/W2068418796","https://openalex.org/W2085601491","https://openalex.org/W2086977914","https://openalex.org/W2106329447","https://openalex.org/W2106771621","https://openalex.org/W2110975861","https://openalex.org/W2123845384","https://openalex.org/W2136083615","https://openalex.org/W2151822116","https://openalex.org/W2159287299","https://openalex.org/W2159481344","https://openalex.org/W2262100274","https://openalex.org/W2276395270","https://openalex.org/W2342922783","https://openalex.org/W2424351436","https://openalex.org/W2440046523","https://openalex.org/W2548941637","https://openalex.org/W2604606554","https://openalex.org/W2611538725","https://openalex.org/W2767106296","https://openalex.org/W2782087530","https://openalex.org/W2798422034","https://openalex.org/W2907714110","https://openalex.org/W2908321983","https://openalex.org/W2951543943","https://openalex.org/W2953564033","https://openalex.org/W2969414999","https://openalex.org/W3011144431","https://openalex.org/W3023442443","https://openalex.org/W3028661980","https://openalex.org/W3032789239","https://openalex.org/W3106620263","https://openalex.org/W3109106363","https://openalex.org/W3158564519","https://openalex.org/W3173612853","https://openalex.org/W3173778203","https://openalex.org/W3196498014","https://openalex.org/W3209568355","https://openalex.org/W4214681936","https://openalex.org/W4225869830","https://openalex.org/W4281927114","https://openalex.org/W4282554945","https://openalex.org/W4312559100","https://openalex.org/W4366572671","https://openalex.org/W4385270195","https://openalex.org/W4385270282","https://openalex.org/W4391054892","https://openalex.org/W4408060256","https://openalex.org/W4410538551"],"related_works":[],"abstract_inverted_index":{"Graphics":[0],"Processing":[1,19,43],"Units":[2],"(GPUs)":[3],"offer":[4],"high":[5],"computational":[6],"throughput":[7],"and":[8,51,92,107,120,192,269,286],"memory":[9,91,98,125,208],"bandwidth,":[10],"making":[11],"them":[12],"promising":[13],"accelerators":[14],"for":[15],"relational":[16,22,26,145,151,160],"OnLine":[17],"Analytical":[18],"(OLAP).":[20],"GPU-accelerated":[21,57,144],"OLAP":[23,146,152],"executes":[24],"the":[25,40,76,84,89,96,131,170,179,207],"operations":[27,161],"of":[28,39,159,278],"a":[29,36,56,141],"Structured":[30],"Query":[31],"Language":[32],"(SQL)":[33],"query":[34,59],"on":[35,47,166],"GPU":[37,77,97,117,124,213],"instead":[38],"host":[41,90,230],"Central":[42],"Unit":[44],"(CPU).":[45],"Depending":[46],"where":[48],"input":[49,72,85,167,201,239],"columns":[50,73,86,168],"their":[52,204],"values":[53,202,220],"reside":[54,87],"in,":[55],"SQL":[58,154],"execution":[60,261],"can":[61,163],"be":[62,164],"classified":[63],"into":[64,156],"two":[65,180,186],"scenarios:":[66],"1)":[67],"in-GPU,":[68],"in":[69,75,82,88],"which":[70,83,197],"all":[71],"fit":[74],"memory,":[78],"or":[79],"2)":[80],"in-host,":[81],"get":[93],"transferred":[94],"to":[95,177,258],"when":[99],"needed.":[100],"However,":[101],"both":[102],"scenarios":[103],"incur":[104,115],"significant":[105],"intraGPU":[106],"host-to-GPU":[108,133],"data":[109,134,181,215],"movement":[110,182,205],"overheads,":[111],"respectively.":[112],"In-GPU":[113],"executions":[114,128],"excessive":[116],"cache":[118],"misses":[119],"thus":[121],"frequent":[122],"off-chip":[123,224],"accesses.":[126,226],"In-host":[127],"suffer":[129],"from":[130,169],"limited":[132],"transfer":[135,243],"bandwidth.":[136],"This":[137],"paper":[138],"presents":[139],"DMO-DB,":[140],"Data":[142],"Movement-Optimized":[143],"engine.":[147],"Since":[148],"modern":[149],"GPUaccelerated":[150],"decomposes":[153],"queries":[155],"multiple":[157,249],"pipelines-sequences":[158],"that":[162,274],"executed":[165],"same":[171],"table,":[172],"DMO-DB":[173,184,275],"leverages":[174],"inter-pipeline":[175,250],"dependencies":[176,251],"overcome":[178],"bottlenecks.":[183],"introduces":[185],"key":[187],"ideas:":[188],"cache-fit":[189,216,234,255],"bloom":[190,256],"filtering":[191],"Ahead-of-Time":[193],"value":[194],"Discarding":[195],"(AoTD),":[196],"preemptively":[198],"eliminate":[199],"unnecessary":[200,238],"before":[203,221],"across":[206],"hierarchies.":[209],"For":[210,227],"in-GPU":[211,284],"execution,":[212,229],"L1":[214],"filters":[217,235,257],"discard":[218],"non-contributing":[219],"triggering":[222],"costly":[223],"DRAM":[225],"in-host":[228,289],"CPU":[231],"last":[232],"level":[233],"strategically":[236],"prune":[237],"values,":[240],"minimizing":[241],"PCIe":[242],"overhead.":[244],"After":[245],"that,":[246],"AoTD":[247],"exploits":[248],"by":[252],"collecting":[253],"these":[254],"earlier":[259],"pipeline":[260],"stages.":[262],"Our":[263],"evaluation":[264],"using":[265],"NVIDIA":[266],"RTX":[267,271],"A4000":[268],"TITAN":[270],"GPUs":[272],"shows":[273],"achieves":[276],"speedups":[277],"$\\mathbf{1.":[279],"5":[280],"3":[281],"x}$":[282],"over":[283,288],"Crystal-Opt":[285],"6.10x":[287],"HeavyDB.":[290]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-12-16T00:00:00"}
