{"id":"https://openalex.org/W4323343904","doi":"https://doi.org/10.14778/3579075.3579083","title":"FastFlow: Accelerating Deep Learning Model Training with Smart Offloading of Input Data Pipeline","display_name":"FastFlow: Accelerating Deep Learning Model Training with Smart Offloading of Input Data Pipeline","publication_year":2023,"publication_date":"2023-01-01","ids":{"openalex":"https://openalex.org/W4323343904","doi":"https://doi.org/10.14778/3579075.3579083"},"language":"en","primary_location":{"id":"doi:10.14778/3579075.3579083","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3579075.3579083","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5041189187","display_name":"Taegeon Um","orcid":"https://orcid.org/0000-0002-4372-6712"},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Taegeon Um","raw_affiliation_strings":["Samsung Research"],"affiliations":[{"raw_affiliation_string":"Samsung Research","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003011755","display_name":"Byungsoo Oh","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Byungsoo Oh","raw_affiliation_strings":["Samsung Research"],"affiliations":[{"raw_affiliation_string":"Samsung Research","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085810961","display_name":"Byeongchan Seo","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Byeongchan Seo","raw_affiliation_strings":["Samsung Research"],"affiliations":[{"raw_affiliation_string":"Samsung Research","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028087500","display_name":"Minhyeok Kweun","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Minhyeok Kweun","raw_affiliation_strings":["Samsung Research"],"affiliations":[{"raw_affiliation_string":"Samsung Research","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083776993","display_name":"Goeun Kim","orcid":"https://orcid.org/0000-0002-4937-4092"},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Goeun Kim","raw_affiliation_strings":["Samsung Research"],"affiliations":[{"raw_affiliation_string":"Samsung Research","institution_ids":["https://openalex.org/I4210101778"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5039177659","display_name":"Woo-Yeon Lee","orcid":null},"institutions":[{"id":"https://openalex.org/I4210101778","display_name":"Samsung (United States)","ror":"https://ror.org/01bfbvm65","country_code":"US","type":"company","lineage":["https://openalex.org/I2250650973","https://openalex.org/I4210101778"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Woo-Yeon Lee","raw_affiliation_strings":["Samsung Research"],"affiliations":[{"raw_affiliation_string":"Samsung Research","institution_ids":["https://openalex.org/I4210101778"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5041189187"],"corresponding_institution_ids":["https://openalex.org/I4210101778"],"apc_list":null,"apc_paid":null,"fwci":3.4573,"has_fulltext":false,"cited_by_count":29,"citation_normalized_percentile":{"value":0.94150241,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"16","issue":"5","first_page":"1086","last_page":"1099"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10764","display_name":"Privacy-Preserving Technologies in Data","score":0.9969000220298767,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11612","display_name":"Stochastic Gradient Optimization Techniques","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8593045473098755},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.813392162322998},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.7560040950775146},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.7067789435386658},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.5636275410652161},{"id":"https://openalex.org/keywords/pipeline-transport","display_name":"Pipeline transport","score":0.4916861653327942},{"id":"https://openalex.org/keywords/throughput","display_name":"Throughput","score":0.46125614643096924},{"id":"https://openalex.org/keywords/preprocessor","display_name":"Preprocessor","score":0.45680612325668335},{"id":"https://openalex.org/keywords/computation-offloading","display_name":"Computation offloading","score":0.4451931416988373},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4345557391643524},{"id":"https://openalex.org/keywords/coprocessor","display_name":"Coprocessor","score":0.4325815737247467},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.4295508861541748},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.35995036363601685},{"id":"https://openalex.org/keywords/real-time-computing","display_name":"Real-time computing","score":0.33804085850715637},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.21758988499641418},{"id":"https://openalex.org/keywords/edge-computing","display_name":"Edge computing","score":0.14578282833099365},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.13830915093421936}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8593045473098755},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.813392162322998},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.7560040950775146},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.7067789435386658},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.5636275410652161},{"id":"https://openalex.org/C175309249","wikidata":"https://www.wikidata.org/wiki/Q725864","display_name":"Pipeline transport","level":2,"score":0.4916861653327942},{"id":"https://openalex.org/C157764524","wikidata":"https://www.wikidata.org/wiki/Q1383412","display_name":"Throughput","level":3,"score":0.46125614643096924},{"id":"https://openalex.org/C34736171","wikidata":"https://www.wikidata.org/wiki/Q918333","display_name":"Preprocessor","level":2,"score":0.45680612325668335},{"id":"https://openalex.org/C2781041963","wikidata":"https://www.wikidata.org/wiki/Q18348618","display_name":"Computation offloading","level":4,"score":0.4451931416988373},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4345557391643524},{"id":"https://openalex.org/C86111242","wikidata":"https://www.wikidata.org/wiki/Q859595","display_name":"Coprocessor","level":2,"score":0.4325815737247467},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.4295508861541748},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.35995036363601685},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.33804085850715637},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.21758988499641418},{"id":"https://openalex.org/C2778456923","wikidata":"https://www.wikidata.org/wiki/Q5337692","display_name":"Edge computing","level":3,"score":0.14578282833099365},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.13830915093421936},{"id":"https://openalex.org/C87717796","wikidata":"https://www.wikidata.org/wiki/Q146326","display_name":"Environmental engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.14778/3579075.3579083","is_oa":false,"landing_page_url":"https://doi.org/10.14778/3579075.3579083","pdf_url":null,"source":{"id":"https://openalex.org/S4210226185","display_name":"Proceedings of the VLDB Endowment","issn_l":"2150-8097","issn":["2150-8097"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319798","host_organization_name":"Association for Computing Machinery","host_organization_lineage":["https://openalex.org/P4310319798"],"host_organization_lineage_names":["Association for Computing Machinery"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the VLDB Endowment","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.5199999809265137,"id":"https://metadata.un.org/sdg/8","display_name":"Decent work and economic growth"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":15,"referenced_works":["https://openalex.org/W2108598243","https://openalex.org/W2734941459","https://openalex.org/W2763188033","https://openalex.org/W2808631503","https://openalex.org/W3097882114","https://openalex.org/W3104414677","https://openalex.org/W3115267280","https://openalex.org/W3138303811","https://openalex.org/W3152218910","https://openalex.org/W3189562561","https://openalex.org/W3196732841","https://openalex.org/W3198095237","https://openalex.org/W4214753187","https://openalex.org/W4220938834","https://openalex.org/W4281657584"],"related_works":["https://openalex.org/W2359178629","https://openalex.org/W4366459479","https://openalex.org/W2794269381","https://openalex.org/W4313289316","https://openalex.org/W2899307613","https://openalex.org/W4377967120","https://openalex.org/W4310621653","https://openalex.org/W2120735706","https://openalex.org/W117939781","https://openalex.org/W4323343904"],"abstract_inverted_index":{"When":[0],"training":[1,36,40,60,71,122,167],"a":[2,69],"deep":[3],"learning":[4],"(DL)":[5],"model,":[6],"input":[7,47,83],"data":[8,48],"are":[9,18,130],"pre-processed":[10],"on":[11,95,150,158],"CPUs":[12,110],"and":[13,101,108,119,128,190],"transformed":[14],"into":[15,21],"tensors,":[16],"which":[17],"then":[19],"fed":[20],"GPUs":[22,30],"for":[23,46,135],"gradient":[24],"computations":[25],"of":[26,116],"model":[27],"training.":[28],"Expensive":[29],"must":[31],"be":[32],"fully":[33],"utilized":[34],"during":[35],"to":[37,54,85,99,111,137,174,183,196],"accelerate":[38],"the":[39,76,113,121,139,145,166],"speed.":[41],"However,":[42],"intensive":[43],"CPU":[44,55,77,187],"operations":[45],"preprocessing":[49],"(input":[50],"pipeline)":[51],"often":[52],"lead":[53],"bottlenecks;":[56],"correspondingly,":[57],"various":[58,91,159],"DL":[59,70,153],"jobs":[61],"suffer":[62],"from":[63],"GPU":[64,197],"under-utilization.":[65],"We":[66],"propose":[67],"FastFlow,":[68],"system":[72],"that":[73,163],"automatically":[74],"mitigates":[75],"bottleneck":[78],"by":[79,169,178,191],"offloading":[80,92,126,141,188,198],"(scaling":[81],"out)":[82],"pipelines":[84],"remote":[86,109,117],"CPUs.":[87],"FastFlow":[88,164],"carefully":[89],"decides":[90],"decisions":[93],"based":[94],"performance":[96],"metrics":[97],"specific":[98],"applications":[100],"allocated":[102],"resources,":[103],"while":[104],"leveraging":[105],"both":[106],"local":[107],"prevent":[112],"inefficient":[114],"use":[115],"resources":[118],"minimize":[120],"time.":[123],"FastFlow's":[124],"smart":[125,140],"policy":[127],"mechanisms":[129],"seamlessly":[131],"integrated":[132],"with":[133,155,185],"TensorFlow":[134,175,184],"users":[136],"enjoy":[138],"features":[142],"without":[143,176],"modifying":[144],"main":[146],"logic.":[147],"Our":[148],"evaluations":[149],"our":[151],"private":[152],"cloud":[154],"diverse":[156],"workloads":[157],"resource":[160],"environments":[161],"show":[162],"improves":[165],"throughput":[168],"1":[170,179],"~":[171,180,193],"4.34X":[172],"compared":[173,182,195],"offloading,":[177],"4.52X":[181],"manual":[186],"(tf.data.service),":[189],"0.63":[192],"2.06X":[194],"(DALI).":[199]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":11},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
