{"id":"https://openalex.org/W4381611549","doi":"https://doi.org/10.1145/3593856.3595912","title":"System Virtualization for Neural Processing Units","display_name":"System Virtualization for Neural Processing Units","publication_year":2023,"publication_date":"2023-06-22","ids":{"openalex":"https://openalex.org/W4381611549","doi":"https://doi.org/10.1145/3593856.3595912"},"language":"en","primary_location":{"id":"doi:10.1145/3593856.3595912","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3593856.3595912","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Workshop on Hot Topics in Operating Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101548931","display_name":"Yuqi Xue","orcid":"https://orcid.org/0009-0002-0363-9486"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Yuqi Xue","raw_affiliation_strings":["University of Illinois Urbana Champaign, Urbana, United States"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana Champaign, Urbana, United States","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032573239","display_name":"Yiqi Liu","orcid":"https://orcid.org/0009-0006-8171-4970"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiqi Liu","raw_affiliation_strings":["University of Illinois Urbana Champaign, Urbana, USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana Champaign, Urbana, USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5005380910","display_name":"Jian Huang","orcid":"https://orcid.org/0000-0002-1125-671X"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jian Huang","raw_affiliation_strings":["University of Illinois Urbana Champaign, Urbana, United States"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana Champaign, Urbana, United States","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5101548931"],"corresponding_institution_ids":["https://openalex.org/I157725225"],"apc_list":null,"apc_paid":null,"fwci":3.3198,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.9283755,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"80","last_page":"86"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10502","display_name":"Advanced Memory and Neural Computing","score":0.9980000257492065,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/virtualization","display_name":"Virtualization","score":0.8402982354164124},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8339816331863403},{"id":"https://openalex.org/keywords/cloud-computing","display_name":"Cloud computing","score":0.6680232286453247},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.574970543384552},{"id":"https://openalex.org/keywords/application-virtualization","display_name":"Application virtualization","score":0.5473090410232544},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.544446587562561},{"id":"https://openalex.org/keywords/temporal-isolation-among-virtual-machines","display_name":"Temporal isolation among virtual machines","score":0.543339192867279},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5074488520622253},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4914637804031372},{"id":"https://openalex.org/keywords/full-virtualization","display_name":"Full virtualization","score":0.4790312349796295},{"id":"https://openalex.org/keywords/isolation","display_name":"Isolation (microbiology)","score":0.4593982398509979},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.4086177945137024},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.10846883058547974}],"concepts":[{"id":"https://openalex.org/C513985346","wikidata":"https://www.wikidata.org/wiki/Q270471","display_name":"Virtualization","level":3,"score":0.8402982354164124},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8339816331863403},{"id":"https://openalex.org/C79974875","wikidata":"https://www.wikidata.org/wiki/Q483639","display_name":"Cloud computing","level":2,"score":0.6680232286453247},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.574970543384552},{"id":"https://openalex.org/C13062989","wikidata":"https://www.wikidata.org/wiki/Q651531","display_name":"Application virtualization","level":5,"score":0.5473090410232544},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.544446587562561},{"id":"https://openalex.org/C142355369","wikidata":"https://www.wikidata.org/wiki/Q7698919","display_name":"Temporal isolation among virtual machines","level":4,"score":0.543339192867279},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5074488520622253},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4914637804031372},{"id":"https://openalex.org/C47878483","wikidata":"https://www.wikidata.org/wiki/Q848333","display_name":"Full virtualization","level":4,"score":0.4790312349796295},{"id":"https://openalex.org/C2775941552","wikidata":"https://www.wikidata.org/wiki/Q25212305","display_name":"Isolation (microbiology)","level":2,"score":0.4593982398509979},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.4086177945137024},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.10846883058547974},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C89423630","wikidata":"https://www.wikidata.org/wiki/Q7193","display_name":"Microbiology","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3593856.3595912","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3593856.3595912","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 19th Workshop on Hot Topics in Operating Systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1171700966","display_name":null,"funder_award_id":"NSF CAREER","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G164177236","display_name":"SPX: Collaborative Research: Scaling the Software-Defined Data Center with Network-Storage Stack Co-Design","funder_award_id":"1919044","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G2460662635","display_name":null,"funder_award_id":"2144796","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G6671297155","display_name":null,"funder_award_id":"CAREER","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G678292349","display_name":null,"funder_award_id":"CCF-1919044","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":8,"referenced_works":["https://openalex.org/W2100926301","https://openalex.org/W2150139096","https://openalex.org/W2152839228","https://openalex.org/W2156077332","https://openalex.org/W2323909431","https://openalex.org/W2604514113","https://openalex.org/W3011280959","https://openalex.org/W4380881153"],"related_works":["https://openalex.org/W2021257679","https://openalex.org/W2134071009","https://openalex.org/W1902822905","https://openalex.org/W2096801503","https://openalex.org/W2133508824","https://openalex.org/W1483119918","https://openalex.org/W2156826906","https://openalex.org/W2376957770","https://openalex.org/W2022726031","https://openalex.org/W1952450835"],"abstract_inverted_index":{"Modern":[0],"cloud":[1,42],"platforms":[2,43],"have":[3],"been":[4],"employing":[5],"hardware":[6,73],"accelerators":[7],"such":[8],"as":[9],"neural":[10],"processing":[11],"units":[12],"(NPUs)":[13],"to":[14,28,112],"meet":[15],"the":[16,29,35,62,69,105,114],"increasing":[17],"demand":[18],"for":[19,22,66,124],"computing":[20],"resources":[21],"AI-based":[23],"application":[24,55],"services.":[25,56],"However,":[26],"due":[27],"lack":[30],"of":[31,38],"system":[32,63],"virtualization":[33,64,79,95],"support,":[34],"current":[36],"way":[37],"using":[39],"NPUs":[40,67],"in":[41],"suffers":[44],"from":[45],"either":[46],"low":[47],"resource":[48,97,115],"utilization":[49],"or":[50],"poor":[51],"isolation":[52,123],"between":[53],"multi-tenant":[54],"In":[57],"this":[58,101],"paper,":[59],"we":[60],"investigate":[61],"techniques":[65],"across":[68],"entire":[70],"software":[71],"and":[72,75,96,103,109,121],"stack,":[74],"present":[76],"our":[77],"NPU":[78,87,94],"solution":[80],"named":[81,89],"NeuCloud.":[82],"We":[83,99],"propose":[84],"a":[85],"flexible":[86],"abstraction":[88,102],"vNPU":[90,106,125],"that":[91],"allows":[92],"fine-grained":[93],"management.":[98],"leverage":[100],"design":[104],"allocation,":[107],"mapping,":[108],"scheduling":[110],"policies":[111],"maximize":[113],"utilization,":[116],"while":[117],"achieving":[118],"both":[119],"performance":[120],"security":[122],"instances":[126],"at":[127],"runtime.":[128]},"counts_by_year":[{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
