{"id":"https://openalex.org/W3189983613","doi":"https://doi.org/10.1109/mm.2021.3097287","title":"Datacenter-Scale Analysis and Optimization of GPU Machine Learning Workloads","display_name":"Datacenter-Scale Analysis and Optimization of GPU Machine Learning Workloads","publication_year":2021,"publication_date":"2021-08-24","ids":{"openalex":"https://openalex.org/W3189983613","doi":"https://doi.org/10.1109/mm.2021.3097287","mag":"3189983613"},"language":"en","primary_location":{"id":"doi:10.1109/mm.2021.3097287","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mm.2021.3097287","pdf_url":null,"source":{"id":"https://openalex.org/S59697426","display_name":"IEEE Micro","issn_l":"0272-1732","issn":["0272-1732","1937-4143"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Micro","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5065258502","display_name":"Lukasz Wesolowski","orcid":"https://orcid.org/0000-0002-8377-9691"},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]},{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Lukasz Wesolowski","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005070359","display_name":"Bilge Acun","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]},{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bilge Acun","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5019208852","display_name":"Valentin Andrei","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]},{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Valentin Andrei","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112689277","display_name":"Adnan Aziz","orcid":"https://orcid.org/0009-0003-5855-6861"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]},{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Adnan Aziz","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5006064073","display_name":"Gisle Dankel","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]},{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Gisle Dankel","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5059629600","display_name":"Chris Gregg","orcid":"https://orcid.org/0000-0003-1856-2661"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]},{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]},{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Christopher Gregg","raw_affiliation_strings":["Stanford University, Stanford, CA, USA","Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Stanford University, Stanford, CA, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100948767","display_name":"Xiaoqiao Meng","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]},{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiaoqiao Meng","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085892095","display_name":"Cyril Meurillon","orcid":null},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]},{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Cyril Meurillon","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049554375","display_name":"Denis Sheahan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]},{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Denis Sheahan","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101550588","display_name":"Lei Tian","orcid":"https://orcid.org/0000-0001-7052-0907"},"institutions":[{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]},{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lei Tian","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101920284","display_name":"Janet Yang","orcid":"https://orcid.org/0000-0002-4237-7493"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Janet Yang","raw_affiliation_strings":["Carnegie Mellon University, Pittsburgh, PA, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, Pittsburgh, PA, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013419180","display_name":"Peifeng Yu","orcid":"https://orcid.org/0000-0001-7001-6647"},"institutions":[{"id":"https://openalex.org/I27837315","display_name":"University of Michigan\u2013Ann Arbor","ror":"https://ror.org/00jmfr291","country_code":"US","type":"education","lineage":["https://openalex.org/I27837315"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Peifeng Yu","raw_affiliation_strings":["University of Michigan, Ann Arbor, MI, USA"],"affiliations":[{"raw_affiliation_string":"University of Michigan, Ann Arbor, MI, USA","institution_ids":["https://openalex.org/I27837315"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5046756907","display_name":"Kim Hazelwood","orcid":"https://orcid.org/0000-0002-2713-8507"},"institutions":[{"id":"https://openalex.org/I4210114444","display_name":"Meta (United States)","ror":"https://ror.org/01zbnvs85","country_code":"US","type":"company","lineage":["https://openalex.org/I4210114444"]},{"id":"https://openalex.org/I4210099336","display_name":"Menlo School","ror":"https://ror.org/01240pn49","country_code":"US","type":"education","lineage":["https://openalex.org/I4210099336"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Kim Hazelwood","raw_affiliation_strings":["Facebook, Inc., Menlo Park, CA, USA"],"affiliations":[{"raw_affiliation_string":"Facebook, Inc., Menlo Park, CA, USA","institution_ids":["https://openalex.org/I4210114444","https://openalex.org/I4210099336"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5065258502"],"corresponding_institution_ids":["https://openalex.org/I4210099336","https://openalex.org/I4210114444"],"apc_list":null,"apc_paid":null,"fwci":1.7018,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.87539425,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":93,"max":99},"biblio":{"volume":"41","issue":"5","first_page":"101","last_page":"112"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11181","display_name":"Advanced Data Storage Technologies","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12761","display_name":"Data Stream Mining Techniques","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8966110944747925},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.8205322027206421},{"id":"https://openalex.org/keywords/software-deployment","display_name":"Software deployment","score":0.7156770825386047},{"id":"https://openalex.org/keywords/server","display_name":"Server","score":0.6984015703201294},{"id":"https://openalex.org/keywords/profiling","display_name":"Profiling (computer programming)","score":0.6265614032745361},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.5897039175033569},{"id":"https://openalex.org/keywords/stack","display_name":"Stack (abstract data type)","score":0.4473690390586853},{"id":"https://openalex.org/keywords/operating-system","display_name":"Operating system","score":0.37697091698646545},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.27823883295059204}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8966110944747925},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.8205322027206421},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.7156770825386047},{"id":"https://openalex.org/C93996380","wikidata":"https://www.wikidata.org/wiki/Q44127","display_name":"Server","level":2,"score":0.6984015703201294},{"id":"https://openalex.org/C187191949","wikidata":"https://www.wikidata.org/wiki/Q1138496","display_name":"Profiling (computer programming)","level":2,"score":0.6265614032745361},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5897039175033569},{"id":"https://openalex.org/C9395851","wikidata":"https://www.wikidata.org/wiki/Q177929","display_name":"Stack (abstract data type)","level":2,"score":0.4473690390586853},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.37697091698646545},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.27823883295059204}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mm.2021.3097287","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mm.2021.3097287","pdf_url":null,"source":{"id":"https://openalex.org/S59697426","display_name":"IEEE Micro","issn_l":"0272-1732","issn":["0272-1732","1937-4143"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Micro","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2604291737","https://openalex.org/W2606722458","https://openalex.org/W2612387305","https://openalex.org/W2963403751","https://openalex.org/W2970971581","https://openalex.org/W4295312788","https://openalex.org/W6736205984","https://openalex.org/W6758283263","https://openalex.org/W6766978945"],"related_works":["https://openalex.org/W2348361596","https://openalex.org/W1165680166","https://openalex.org/W2465593037","https://openalex.org/W2591061639","https://openalex.org/W1570191694","https://openalex.org/W2385119568","https://openalex.org/W2027457585","https://openalex.org/W2081035100","https://openalex.org/W2021850411","https://openalex.org/W4379620231"],"abstract_inverted_index":{"In":[0],"this":[1],"article,":[2],"we":[3],"present":[4,74],"a":[5,12],"system":[6,27,98],"to":[7,47,90],"collectively":[8],"optimize":[9],"efficiency":[10,33,54,110],"in":[11,112],"very":[13],"large":[14],"scale":[15],"deployment":[16],"of":[17,77,87],"GPU":[18,114],"servers":[19],"for":[20,35,63,70,106],"machine":[21],"learning":[22],"workloads":[23],"at":[24],"Facebook.":[25],"Our":[26],"1)":[28],"measures":[29],"and":[30,59,65,80,103,108],"stores":[31],"system-wide":[32],"metrics":[34],"every":[36],"executed":[37],"workflow;":[38],"2)":[39],"aggregates":[40],"data":[41],"from":[42],"across":[43],"the":[44,78,85,88,100],"execution":[45],"stack":[46,79],"identify":[48],"optimization":[49],"opportunities":[50],"that":[51],"maximize":[52],"fleet-wide":[53],"improvements;":[55],"3)":[56],"provides":[57],"periodic":[58],"on-demand":[60],"whole-system":[61],"profiling":[62],"workflows;":[64],"4)":[66],"automatically":[67],"analyzes":[68],"traces":[69],"common":[71],"antipatterns.":[72],"We":[73],"each":[75],"component":[76],"show":[81],"case":[82],"studies":[83],"demonstrating":[84],"use":[86],"tools":[89],"significantly":[91],"improve":[92],"performance.":[93],"To":[94],"our":[95,97],"knowledge,":[96],"is":[99],"most":[101],"complete":[102],"effective":[104],"solution":[105],"identifying":[107],"addressing":[109],"problems":[111],"datacenter-scale":[113],"deployments.":[115]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":4},{"year":2021,"cited_by_count":2}],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2025-10-10T00:00:00"}
