{"id":"https://openalex.org/W4380669423","doi":"https://doi.org/10.1145/3578338.3593571","title":"SplitRPC: A {Control + Data} Path Splitting RPC Stack for ML Inference Serving","display_name":"SplitRPC: A {Control + Data} Path Splitting RPC Stack for ML Inference Serving","publication_year":2023,"publication_date":"2023-06-13","ids":{"openalex":"https://openalex.org/W4380669423","doi":"https://doi.org/10.1145/3578338.3593571"},"language":"en","primary_location":{"id":"doi:10.1145/3578338.3593571","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3578338.3593571","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Abstract Proceedings of the 2023 ACM SIGMETRICS International Conference on Measurement and Modeling of Computer Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5018757871","display_name":"Adithya Kumar","orcid":"https://orcid.org/0009-0005-3876-0624"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Adithya Kumar","raw_affiliation_strings":["The Pennsylvania State University, University Park, PA, USA"],"affiliations":[{"raw_affiliation_string":"The Pennsylvania State University, University Park, PA, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5033253809","display_name":"Anand Sivasubramaniam","orcid":"https://orcid.org/0000-0001-6173-687X"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Anand Sivasubramaniam","raw_affiliation_strings":["Penn State University, University Park, PA, USA"],"affiliations":[{"raw_affiliation_string":"Penn State University, University Park, PA, USA","institution_ids":["https://openalex.org/I130769515"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5024530225","display_name":"Timothy Zhu","orcid":"https://orcid.org/0000-0001-8394-8953"},"institutions":[{"id":"https://openalex.org/I130769515","display_name":"Pennsylvania State University","ror":"https://ror.org/04p491231","country_code":"US","type":"education","lineage":["https://openalex.org/I130769515"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Timothy Zhu","raw_affiliation_strings":["The Pennsylvania State University, University Park, PA, USA"],"affiliations":[{"raw_affiliation_string":"The Pennsylvania State University, University Park, PA, USA","institution_ids":["https://openalex.org/I130769515"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5018757871"],"corresponding_institution_ids":["https://openalex.org/I130769515"],"apc_list":null,"apc_paid":null,"fwci":0.1997,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.48087756,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":"13","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10714","display_name":"Software-Defined Networks and 5G","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8519871234893799},{"id":"https://openalex.org/keywords/datapath","display_name":"Datapath","score":0.4490984082221985},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.4468232989311218},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.44215071201324463},{"id":"https://openalex.org/keywords/payload","display_name":"Payload (computing)","score":0.42373138666152954},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.3779309391975403},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3528062701225281},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.33521440625190735},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.2098405659198761}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8519871234893799},{"id":"https://openalex.org/C2781198647","wikidata":"https://www.wikidata.org/wiki/Q1633673","display_name":"Datapath","level":2,"score":0.4490984082221985},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.4468232989311218},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.44215071201324463},{"id":"https://openalex.org/C134066672","wikidata":"https://www.wikidata.org/wiki/Q1424639","display_name":"Payload (computing)","level":3,"score":0.42373138666152954},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.3779309391975403},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3528062701225281},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.33521440625190735},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.2098405659198761},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3578338.3593571","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3578338.3593571","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Abstract Proceedings of the 2023 ACM SIGMETRICS International Conference on Measurement and Modeling of Computer Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G877853932","display_name":null,"funder_award_id":"2211018, 1912495, 1909004, 1714389, 1912495, 1629915, 1629129, 1763681","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":1,"referenced_works":["https://openalex.org/W3012088208"],"related_works":["https://openalex.org/W2109699519","https://openalex.org/W2006568360","https://openalex.org/W102726818","https://openalex.org/W4233616027","https://openalex.org/W2059591361","https://openalex.org/W970262775","https://openalex.org/W4244724753","https://openalex.org/W1972081536","https://openalex.org/W2535673728","https://openalex.org/W1831618318"],"abstract_inverted_index":{"The":[0],"growing":[1],"adoption":[2],"of":[3,95,115,140],"hardware":[4],"accelerators":[5],"driven":[6],"by":[7,37],"their":[8,22],"intelligent":[9],"compiler":[10],"and":[11,19,59,92,109,145,188,190,207],"runtime":[12],"system":[13],"counterparts":[14],"has":[15],"democratized":[16],"ML":[17,80,158],"services":[18,56],"precipitously":[20],"reduced":[21],"execution":[23],"times.":[24],"This":[25],"motivates":[26],"us":[27,163],"to":[28,32,87,105,122,127,164,168,176],"shift":[29],"our":[30],"attention":[31],"characterize":[33],"the":[34,38,53,57,90,93,107,120,123,136,166,169,174,198],"overheads":[35],"imposed":[36],"RPC":[39,49,155,199],"mechanism":[40,156],"(`RPC":[41],"tax')":[42],"when":[43],"serving":[44,78],"them":[45],"on":[46,62,184],"accelerators.":[47,97],"Conventional":[48],"implementations":[50],"implicitly":[51],"assume":[52],"host":[54],"CPU":[55,175],"requests,":[58],"we":[60,143],"focus":[61],"expanding":[63],"such":[64],"works":[65],"towards":[66],"accelerator-based":[67],"services.":[68],"While":[69],"SmartNIC":[70],"based":[71],"solutions":[72],"work":[73],"well":[74],"for":[75,112,157],"simple":[76],"applications,":[77],"complex":[79],"models":[81],"requires":[82],"a":[83,149],"more":[84],"nuanced":[85],"view":[86],"optimize":[88,165],"both":[89,185],"data-path":[91],"control/orchestration":[94],"these":[96,132,141],"We":[98,181],"program":[99],"commodity":[100,186],"network":[101],"interface":[102],"cards":[103],"(NICs)":[104],"split":[106],"control":[108,116],"data":[110],"paths":[111,133],"effective":[113,195],"transfer":[114],"while":[117,171,201],"efficiently":[118],"transferring":[119],"payload":[121],"accelerator.":[124],"As":[125],"opposed":[126],"unified":[128],"approaches":[129],"that":[130,192],"bundle":[131],"together,":[134],"limiting":[135],"flexibility":[137],"in":[138,196,205],"each":[139],"paths,":[142],"design":[144],"implement":[146,182],"SplitRPC":[147,161,183,193],"-":[148],"{control":[150],"+":[151],"data}":[152],"path":[153],"optimizing":[154],"inference":[159],"serving.":[160],"allows":[162],"datapath":[167],"accelerator":[170],"simultaneously":[172],"allowing":[173],"maintain":[177],"full":[178],"orchestration":[179],"capabilities.":[180],"NICs":[187],"SmartNICs":[189],"demonstrate":[191],"is":[194],"minimizing":[197],"tax":[200],"providing":[202],"significant":[203],"gains":[204],"throughput":[206],"latency.":[208]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
