{"id":"https://openalex.org/W2323909431","doi":"https://doi.org/10.1145/2872362.2872368","title":"Baymax","display_name":"Baymax","publication_year":2016,"publication_date":"2016-03-25","ids":{"openalex":"https://openalex.org/W2323909431","doi":"https://doi.org/10.1145/2872362.2872368","mag":"2323909431"},"language":"en","primary_location":{"id":"doi:10.1145/2872362.2872368","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2872362.2872368","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-First International Conference on Architectural Support for Programming Languages and Operating Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100377840","display_name":"Quan Chen","orcid":"https://orcid.org/0000-0001-5832-0347"},"institutions":[{"id":"https://openalex.org/I4210140958","display_name":"Ann Arbor Center for Independent Living","ror":"https://ror.org/045pcya52","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210140958"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Quan Chen","raw_affiliation_strings":["Shanghai Jiao Tong University, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I4210140958"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018705589","display_name":"Hailong Yang","orcid":"https://orcid.org/0000-0003-1101-7927"},"institutions":[{"id":"https://openalex.org/I4210140958","display_name":"Ann Arbor Center for Independent Living","ror":"https://ror.org/045pcya52","country_code":"US","type":"nonprofit","lineage":["https://openalex.org/I4210140958"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hailong Yang","raw_affiliation_strings":["Beihang University, Ann Arbor, USA"],"affiliations":[{"raw_affiliation_string":"Beihang University, Ann Arbor, USA","institution_ids":["https://openalex.org/I4210140958"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053236545","display_name":"Jason Mars","orcid":"https://orcid.org/0000-0002-7029-5292"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jason Mars","raw_affiliation_strings":["University of Michigan, Ann Arbor, USA"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5065128438","display_name":"Lingjia Tang","orcid":"https://orcid.org/0000-0002-5609-7775"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lingjia Tang","raw_affiliation_strings":["University of Michigan, Ann Arbor, USA"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, USA","institution_ids":["https://openalex.org/I27837315"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5100377840"],"corresponding_institution_ids":["https://openalex.org/I4210140958"],"apc_list":null,"apc_paid":null,"fwci":15.0609,"has_fulltext":false,"cited_by_count":113,"citation_normalized_percentile":{"value":0.99115741,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"681","last_page":"696"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10273","display_name":"IoT and Edge/Fog Computing","score":0.9990000128746033,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9987000226974487,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8616144061088562},{"id":"https://openalex.org/keywords/pci-express","display_name":"PCI Express","score":0.7123414278030396},{"id":"https://openalex.org/keywords/quality-of-service","display_name":"Quality of service","score":0.6365439891815186},{"id":"https://openalex.org/keywords/workload","display_name":"Workload","score":0.492573082447052},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.4901452958583832},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.48014065623283386},{"id":"https://openalex.org/keywords/bandwidth","display_name":"Bandwidth (computing)","score":0.45325523614883423},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.4355877935886383},{"id":"https://openalex.org/keywords/x86","display_name":"x86","score":0.4203188717365265},{"id":"https://openalex.org/keywords/latency","display_name":"Latency (audio)","score":0.41866326332092285},{"id":"https://openalex.org/keywords/multi-core-processor","display_name":"Multi-core processor","score":0.41673731803894043},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.35625746846199036},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.33609268069267273},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.26180577278137207},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.2572787404060364},{"id":"https://openalex.org/keywords/software","display_name":"Software","score":0.17110824584960938}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8616144061088562},{"id":"https://openalex.org/C64270927","wikidata":"https://www.wikidata.org/wiki/Q206924","display_name":"PCI Express","level":3,"score":0.7123414278030396},{"id":"https://openalex.org/C5119721","wikidata":"https://www.wikidata.org/wiki/Q220501","display_name":"Quality of service","level":2,"score":0.6365439891815186},{"id":"https://openalex.org/C2778476105","wikidata":"https://www.wikidata.org/wiki/Q628539","display_name":"Workload","level":2,"score":0.492573082447052},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.4901452958583832},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.48014065623283386},{"id":"https://openalex.org/C2776257435","wikidata":"https://www.wikidata.org/wiki/Q1576430","display_name":"Bandwidth (computing)","level":2,"score":0.45325523614883423},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.4355877935886383},{"id":"https://openalex.org/C170723468","wikidata":"https://www.wikidata.org/wiki/Q182933","display_name":"x86","level":3,"score":0.4203188717365265},{"id":"https://openalex.org/C82876162","wikidata":"https://www.wikidata.org/wiki/Q17096504","display_name":"Latency (audio)","level":2,"score":0.41866326332092285},{"id":"https://openalex.org/C78766204","wikidata":"https://www.wikidata.org/wiki/Q555032","display_name":"Multi-core processor","level":2,"score":0.41673731803894043},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.35625746846199036},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.33609268069267273},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.26180577278137207},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.2572787404060364},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.17110824584960938},{"id":"https://openalex.org/C76155785","wikidata":"https://www.wikidata.org/wiki/Q418","display_name":"Telecommunications","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/2872362.2872368","is_oa":false,"landing_page_url":"https://doi.org/10.1145/2872362.2872368","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-First International Conference on Architectural Support for Programming Languages and Operating Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4695101022","display_name":null,"funder_award_id":"CNS-CSR-1419243","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W115476871","https://openalex.org/W297966986","https://openalex.org/W833222660","https://openalex.org/W1513326124","https://openalex.org/W1524333225","https://openalex.org/W1667652561","https://openalex.org/W1677409904","https://openalex.org/W1937235839","https://openalex.org/W1971910541","https://openalex.org/W1972971542","https://openalex.org/W1978502921","https://openalex.org/W1979717209","https://openalex.org/W1982063824","https://openalex.org/W1982825626","https://openalex.org/W1984993578","https://openalex.org/W1987403831","https://openalex.org/W1994790794","https://openalex.org/W1997486487","https://openalex.org/W2000438057","https://openalex.org/W2011389593","https://openalex.org/W2017004353","https://openalex.org/W2020172164","https://openalex.org/W2022832305","https://openalex.org/W2023214828","https://openalex.org/W2059638322","https://openalex.org/W2060204338","https://openalex.org/W2068681864","https://openalex.org/W2072652898","https://openalex.org/W2075200534","https://openalex.org/W2079248286","https://openalex.org/W2080592089","https://openalex.org/W2082000934","https://openalex.org/W2085434892","https://openalex.org/W2095908137","https://openalex.org/W2097643185","https://openalex.org/W2098126897","https://openalex.org/W2098921539","https://openalex.org/W2099517310","https://openalex.org/W2102621631","https://openalex.org/W2105528986","https://openalex.org/W2109488193","https://openalex.org/W2112168774","https://openalex.org/W2123892809","https://openalex.org/W2124592110","https://openalex.org/W2125551452","https://openalex.org/W2133156997","https://openalex.org/W2142801765","https://openalex.org/W2144335215","https://openalex.org/W2150139096","https://openalex.org/W2153635508","https://openalex.org/W2156077332","https://openalex.org/W2156885227","https://openalex.org/W2160121678","https://openalex.org/W2169049902","https://openalex.org/W2170764938","https://openalex.org/W2222512263","https://openalex.org/W2308884720","https://openalex.org/W2427881153","https://openalex.org/W2487770199","https://openalex.org/W2616747538","https://openalex.org/W2970040153","https://openalex.org/W3141739369","https://openalex.org/W4234141727","https://openalex.org/W4236267470","https://openalex.org/W4256629673","https://openalex.org/W6668411398","https://openalex.org/W6670560480","https://openalex.org/W6674550445","https://openalex.org/W6678424907","https://openalex.org/W7010394419","https://openalex.org/W7061458307"],"related_works":["https://openalex.org/W1657880117","https://openalex.org/W4385894176","https://openalex.org/W2595172197","https://openalex.org/W2347371119","https://openalex.org/W2612768808","https://openalex.org/W2127970246","https://openalex.org/W2915358162","https://openalex.org/W2096357811","https://openalex.org/W2791952321","https://openalex.org/W2072005592"],"abstract_inverted_index":{"Modern":[0],"warehouse-scale":[1],"computers":[2],"(WSCs)":[3],"are":[4,130],"being":[5],"outfitted":[6],"with":[7],"accelerators":[8,76],"to":[9,49,92,137,166,233],"provide":[10],"the":[11,37,104,120,131,138,153,168,176,205,212,225],"significant":[12],"compute":[13,121,156],"required":[14,169],"by":[15,208,231],"emerging":[16],"intelligent":[17],"personal":[18],"assistant":[19],"(IPA)":[20],"workloads":[21],"such":[22],"as":[23],"voice":[24],"recognition,":[25],"image":[26],"classification,":[27],"and":[28,56,58,85,123,161,174,191],"natural":[29],"language":[30],"processing.":[31],"It":[32],"is":[33,77],"well":[34],"known":[35],"that":[36,116,135,151,202],"diurnal":[38],"user":[39],"access":[40],"pattern":[41],"of":[42,90,141,155,228],"user-facing":[43,142,172,219,229],"services":[44],"provides":[45],"a":[46,87,148,181,195],"strong":[47],"incentive":[48],"co-locate":[50],"applications":[51,73,160,173,193,230],"for":[52,107,119,127,171,217,218],"better":[53],"accelerator":[54,177,206],"utilization":[55,207],"efficiency,":[57],"prior":[59],"work":[60],"has":[61],"focused":[62],"on":[63,66,74,82,194],"enabling":[64],"co-location":[65],"multicore":[67],"processors.":[68],"However,":[69],"interference":[70],"when":[71],"co-locating":[72],"non-preemptive":[75],"fundamentally":[78],"different":[79,159],"than":[80],"contention":[81,126,165],"multi-core":[83],"CPUs":[84],"introduces":[86],"new":[88],"set":[89],"challenges":[91],"reduce":[93],"QoS":[94,108,170],"violation.":[95],"To":[96],"address":[97],"this":[98],"open":[99],"problem,":[100],"we":[101],"first":[102],"identify":[103],"underlying":[105],"causes":[106],"violation":[109],"in":[110],"accelerator-outfitted":[111],"servers.":[112],"Our":[113],"experiments":[114],"show":[115],"queuing":[117],"delay":[118],"resources":[122],"PCI-e":[124,163],"bandwidth":[125,164],"data":[128],"transfer":[129],"main":[132],"two":[133],"factors":[134],"contribute":[136],"long":[139],"tails":[140],"applications.":[143,220],"We":[144],"then":[145],"present":[146],"Baymax,":[147],"runtime":[149],"system":[150],"orchestrates":[152],"execution":[154],"tasks":[157],"from":[158],"mitigates":[162],"deliver":[167],"increase":[175],"utilization.":[178],"Using":[179],"DjiNN,":[180],"deep":[182],"neural":[183],"network":[184],"service,":[185],"Sirius,":[186],"an":[187],"end-to-end":[188],"IPA":[189],"workload,":[190],"traditional":[192],"Nvidia":[196],"K40":[197],"GPU,":[198],"our":[199],"evaluation":[200],"shows":[201],"Baymax":[203,223],"improves":[204],"91.3%":[209],"while":[210],"achieving":[211],"desired":[213],"99%-ile":[214,226],"latency":[215,227],"target":[216],"In":[221],"fact,":[222],"reduces":[224],"up":[232],"195x":[234],"over":[235],"default":[236],"execution.":[237]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":7},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":19},{"year":2019,"cited_by_count":17},{"year":2018,"cited_by_count":12},{"year":2017,"cited_by_count":21},{"year":2016,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2016-06-24T00:00:00"}
