{"id":"https://openalex.org/W4380874786","doi":"https://doi.org/10.1145/3579371.3589350","title":"TPU v4: An Optically Reconfigurable Supercomputer for Machine Learning with Hardware Support for Embeddings","display_name":"TPU v4: An Optically Reconfigurable Supercomputer for Machine Learning with Hardware Support for Embeddings","publication_year":2023,"publication_date":"2023-06-16","ids":{"openalex":"https://openalex.org/W4380874786","doi":"https://doi.org/10.1145/3579371.3589350"},"language":"en","primary_location":{"id":"doi:10.1145/3579371.3589350","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3579371.3589350","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3579371.3589350","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 50th Annual International Symposium on Computer Architecture","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3579371.3589350","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050207942","display_name":"Norman P. Jouppi","orcid":"https://orcid.org/0000-0003-1765-1929"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Norm Jouppi","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085787384","display_name":"George Thomas Kurian","orcid":"https://orcid.org/0000-0002-3478-518X"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"George Kurian","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100765709","display_name":"Sheng Li","orcid":"https://orcid.org/0000-0003-1068-5261"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sheng Li","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051149049","display_name":"Peter Ma","orcid":"https://orcid.org/0000-0002-7264-1443"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Peter Ma","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009578714","display_name":"Rahul Nagarajan","orcid":"https://orcid.org/0009-0001-2146-8687"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rahul Nagarajan","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016524466","display_name":"Lifeng Nai","orcid":"https://orcid.org/0000-0002-8801-9384"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Lifeng Nai","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037285672","display_name":"Nishant Patil","orcid":"https://orcid.org/0000-0001-6620-0038"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nishant Patil","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103255393","display_name":"Suvinay Subramanian","orcid":"https://orcid.org/0000-0002-8715-8964"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Suvinay Subramanian","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074688105","display_name":"Andy Swing","orcid":"https://orcid.org/0009-0009-7039-8812"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Andy Swing","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010571977","display_name":"Brian Towles","orcid":"https://orcid.org/0009-0000-9409-7285"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Brian Towles","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035427716","display_name":"Cliff Young","orcid":"https://orcid.org/0000-0003-2172-1651"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Clifford Young","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102871836","display_name":"Xiang Zhou","orcid":"https://orcid.org/0000-0003-0121-6527"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiang Zhou","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103236132","display_name":"Zongwei Zhou","orcid":"https://orcid.org/0000-0002-4991-8424"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zongwei Zhou","raw_affiliation_strings":["Google, Mountain View, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077202069","display_name":"David A. Patterson","orcid":"https://orcid.org/0000-0003-0902-7093"},"institutions":[{"id":"https://openalex.org/I1291425158","display_name":"Google (United States)","ror":"https://ror.org/00njsd438","country_code":"US","type":"company","lineage":["https://openalex.org/I1291425158","https://openalex.org/I4210128969"]},{"id":"https://openalex.org/I95457486","display_name":"University of California, Berkeley","ror":"https://ror.org/01an7q238","country_code":"US","type":"education","lineage":["https://openalex.org/I95457486"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"David A Patterson","raw_affiliation_strings":["Google, Mountain View, CA, USA","University of California, Berkeley, CA, USA","Google, Mountain View, CA, USA University of California, Berkeley, CA, USA"],"affiliations":[{"raw_affiliation_string":"Google, Mountain View, CA, USA","institution_ids":["https://openalex.org/I1291425158"]},{"raw_affiliation_string":"University of California, Berkeley, CA, USA","institution_ids":["https://openalex.org/I95457486"]},{"raw_affiliation_string":"Google, Mountain View, CA, USA University of California, Berkeley, CA, USA","institution_ids":["https://openalex.org/I1291425158","https://openalex.org/I95457486"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5050207942"],"corresponding_institution_ids":["https://openalex.org/I1291425158"],"apc_list":null,"apc_paid":null,"fwci":181.0658,"has_fulltext":true,"cited_by_count":403,"citation_normalized_percentile":{"value":0.9999691,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"14"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.9987999796867371,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10829","display_name":"Interconnection Networks and Systems","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/supercomputer","display_name":"Supercomputer","score":0.817832887172699},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7524441480636597},{"id":"https://openalex.org/keywords/dataflow","display_name":"Dataflow","score":0.7242490649223328},{"id":"https://openalex.org/keywords/infiniband","display_name":"InfiniBand","score":0.5065876245498657},{"id":"https://openalex.org/keywords/pci-express","display_name":"PCI Express","score":0.47432276606559753},{"id":"https://openalex.org/keywords/modularity","display_name":"Modularity (biology)","score":0.4229433238506317},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.4105619490146637},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3280872106552124},{"id":"https://openalex.org/keywords/field-programmable-gate-array","display_name":"Field-programmable gate array","score":0.1072763204574585}],"concepts":[{"id":"https://openalex.org/C83283714","wikidata":"https://www.wikidata.org/wiki/Q121117","display_name":"Supercomputer","level":2,"score":0.817832887172699},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7524441480636597},{"id":"https://openalex.org/C96324660","wikidata":"https://www.wikidata.org/wiki/Q205446","display_name":"Dataflow","level":2,"score":0.7242490649223328},{"id":"https://openalex.org/C2781030343","wikidata":"https://www.wikidata.org/wiki/Q922437","display_name":"InfiniBand","level":2,"score":0.5065876245498657},{"id":"https://openalex.org/C64270927","wikidata":"https://www.wikidata.org/wiki/Q206924","display_name":"PCI Express","level":3,"score":0.47432276606559753},{"id":"https://openalex.org/C2779478453","wikidata":"https://www.wikidata.org/wiki/Q6889748","display_name":"Modularity (biology)","level":2,"score":0.4229433238506317},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.4105619490146637},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3280872106552124},{"id":"https://openalex.org/C42935608","wikidata":"https://www.wikidata.org/wiki/Q190411","display_name":"Field-programmable gate array","level":2,"score":0.1072763204574585},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C54355233","wikidata":"https://www.wikidata.org/wiki/Q7162","display_name":"Genetics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3579371.3589350","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3579371.3589350","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3579371.3589350","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 50th Annual International Symposium on Computer Architecture","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3579371.3589350","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3579371.3589350","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3579371.3589350","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 50th Annual International Symposium on Computer Architecture","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Affordable and clean energy","score":0.6600000262260437,"id":"https://metadata.un.org/sdg/7"}],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4380874786.pdf","grobid_xml":"https://content.openalex.org/works/W4380874786.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W105472389","https://openalex.org/W1501077214","https://openalex.org/W1999085092","https://openalex.org/W2002555321","https://openalex.org/W2028263411","https://openalex.org/W2060204338","https://openalex.org/W2082887106","https://openalex.org/W2097561580","https://openalex.org/W2134839001","https://openalex.org/W2156275124","https://openalex.org/W2156838963","https://openalex.org/W2169731856","https://openalex.org/W2898781725","https://openalex.org/W3007855629","https://openalex.org/W3030163527","https://openalex.org/W3036878841","https://openalex.org/W3127736057","https://openalex.org/W3214897310","https://openalex.org/W4206561618","https://openalex.org/W4212973913","https://openalex.org/W4237249260","https://openalex.org/W4254255272","https://openalex.org/W4283704460","https://openalex.org/W4386730099","https://openalex.org/W6600109629","https://openalex.org/W6600297362","https://openalex.org/W6603649181","https://openalex.org/W6675465559"],"related_works":["https://openalex.org/W2040819538","https://openalex.org/W1966974913","https://openalex.org/W2966835246","https://openalex.org/W2937592512","https://openalex.org/W619618554","https://openalex.org/W1597650818","https://openalex.org/W2132218766","https://openalex.org/W3046837943","https://openalex.org/W1970502298","https://openalex.org/W2008781517"],"abstract_inverted_index":{"In":[0],"response":[1],"to":[2,42,154],"innovations":[3],"in":[4,213],"machine":[5],"learning":[6],"(ML)":[7],"models,":[8],"production":[9],"workloads":[10],"changed":[11],"radically":[12],"and":[13,25,51,67,72,81,109,121,136,147,177,181,205],"rapidly.":[14],"TPU":[15,87,114,117,127,190],"v4":[16,88,115,128],"is":[17,130,169,178],"the":[18,173,187,193],"fifth":[19],"Google":[20,199],"domain":[21],"specific":[22],"architecture":[23],"(DSA)":[24],"its":[26,39],"third":[27],"supercomputer":[28,129],"for":[29],"such":[30],"ML":[31],"models.":[32],"Optical":[33],"circuit":[34],"switches":[35],"(OCSes)":[36],"dynamically":[37],"reconfigure":[38],"interconnect":[40],"topology":[41,60],"improve":[43],"scale,":[44],"availability,":[45],"utilization,":[46],"modularity,":[47],"deployment,":[48],"security,":[49],"power,":[50,66],"performance;":[52],"users":[53],"can":[54],"pick":[55],"a":[56,150],"twisted":[57],"3D":[58],"torus":[59],"if":[61],"desired.":[62],"Much":[63],"cheaper,":[64],"lower":[65],"faster":[68,140,171,180],"than":[69,172,186,210],"Infiniband,":[70],"OCSes":[71],"underlying":[73],"optical":[74],"components":[75],"are":[76],"<5%":[77],"of":[78,83,106,159,161,198],"system":[79,84],"cost":[80],"<3%":[82],"power.":[85,110],"Each":[86],"includes":[89],"SparseCores,":[90],"dataflow":[91],"processors":[92],"that":[93,96],"accelerate":[94],"models":[95],"rely":[97],"on":[98],"embeddings":[99],"by":[100,119,124],"5x--7x":[101],"yet":[102],"use":[103,201],"only":[104],"5%":[105],"die":[107],"area":[108],"Deployed":[111],"since":[112],"2020,":[113],"outperforms":[116],"v3":[118],"2.1x":[120],"improves":[122],"performance/Watt":[123],"2.7x.":[125],"The":[126],"4x":[131],"larger":[132],"at":[133,156],"4096":[134],"chips":[135],"thus":[137],"nearly":[138],"10x":[139],"overall,":[141],"which":[142],"along":[143],"with":[144],"OCS":[145],"flexibility":[146],"availability":[148],"allows":[149],"large":[151],"language":[152],"model":[153],"train":[155],"an":[157],"average":[158],"~60%":[160],"peak":[162],"FLOPS/second.":[163],"For":[164],"similar":[165],"sized":[166],"systems,":[167],"it":[168],"~4.3x--4.5x":[170],"Graphcore":[174],"IPU":[175],"Bow":[176],"1.2x--1.7x":[179],"uses":[182],"1.3x--1.9x":[183],"less":[184,203,208],"power":[185],"Nvidia":[188],"A100.":[189],"v4s":[191],"inside":[192],"energy-optimized":[194],"warehouse":[195],"scale":[196],"computers":[197],"Cloud":[200],"~2--6x":[202],"energy":[204],"produce":[206],"~20x":[207],"CO2e":[209],"contemporary":[211],"DSAs":[212],"typical":[214],"on-premise":[215],"data":[216],"centers.":[217]},"counts_by_year":[{"year":2026,"cited_by_count":33},{"year":2025,"cited_by_count":209},{"year":2024,"cited_by_count":130},{"year":2023,"cited_by_count":29},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":1}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
