{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,11]],"date-time":"2026-03-11T01:55:26Z","timestamp":1773194126416,"version":"3.50.1"},"reference-count":47,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,6,1]],"date-time":"2021-06-01T00:00:00Z","timestamp":1622505600000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,6]]},"DOI":"10.1109\/isca52012.2021.00010","type":"proceedings-article","created":{"date-parts":[[2021,8,4]],"date-time":"2021-08-04T20:58:26Z","timestamp":1628110706000},"page":"1-14","source":"Crossref","is-referenced-by-count":295,"title":["Ten Lessons From Three Generations Shaped Google\u2019s TPUv4i : Industrial Product"],"prefix":"10.1109","author":[{"given":"Norman P.","family":"Jouppi","sequence":"first","affiliation":[]},{"given":"Doe","family":"Hyun Yoon","sequence":"additional","affiliation":[]},{"given":"Matthew","family":"Ashcraft","sequence":"additional","affiliation":[]},{"given":"Mark","family":"Gottscho","sequence":"additional","affiliation":[]},{"given":"Thomas B.","family":"Jablin","sequence":"additional","affiliation":[]},{"given":"George","family":"Kurian","sequence":"additional","affiliation":[]},{"given":"James","family":"Laudon","sequence":"additional","affiliation":[]},{"given":"Sheng","family":"Li","sequence":"additional","affiliation":[]},{"given":"Peter","family":"Ma","sequence":"additional","affiliation":[]},{"given":"Xiaoyu","family":"Ma","sequence":"additional","affiliation":[]},{"given":"Thomas","family":"Norrie","sequence":"additional","affiliation":[]},{"given":"Nishant","family":"Patil","sequence":"additional","affiliation":[]},{"given":"Sushma","family":"Prasad","sequence":"additional","affiliation":[]},{"given":"Cliff","family":"Young","sequence":"additional","affiliation":[]},{"given":"Zongwei","family":"Zhou","sequence":"additional","affiliation":[]},{"given":"David","family":"Patterson","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","author":"schmuelling","year":"0","journal-title":"NVIDIA MLPerf Inference System Under Test (SUT) performance tuning guide"},{"key":"ref38","author":"romero","year":"2019","journal-title":"Infaas A model-less inference serving system"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1145\/3132847.3132914"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1145\/3123939.3124545"},{"key":"ref31","year":"2020","journal-title":"NVIDIA T4 70W Low Profile PCIe GPU Accelerator PB-09256-001_v05"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2021.3058217"},{"key":"ref37","author":"patterson","year":"0","journal-title":"Embench&#x2122; A Modern Benchmark for Embedded Computing"},{"key":"ref36","author":"patel","year":"2019","journal-title":"Deep Learning Inferencing with Mipsology using Xilinx ALVEO&#x2122; on Dell EMC Infrastructure"},{"key":"ref35","author":"park","year":"2018","journal-title":"Deep learning inference in facebook data centers Characterization performance optimizations and hardware implications"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01225-0_36"},{"key":"ref10","year":"2020","journal-title":"Goya&#x2122; Inference Platform White Paper"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1145\/3306346.3322948"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2012.71"},{"key":"ref12","article-title":"Habana Wins Cigar for AI Inference","author":"gwennap","year":"2019","journal-title":"Microprocessor Report"},{"key":"ref13","author":"harmon","year":"2019","journal-title":"NVIDIA Tesla T4 AI Inferencing GPU Benchmarks and Review"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1145\/3282307"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/5.920580"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC.2014.6757323"},{"key":"ref17","author":"hruska","year":"2019","journal-title":"Intel Details Its Nervana Inference and Training AI Cards"},{"key":"ref18","year":"2020","journal-title":"Image"},{"key":"ref19","author":"jia","year":"2019","journal-title":"Dissecting the NVidia Turing T4 GPU via Microbenchmarking"},{"key":"ref28","year":"2020","journal-title":"Mlperf training v0 7 results"},{"key":"ref4","article-title":"Intel 10nm Spring Hill NNP-I Inference Chip","volume":"31","author":"cutress","year":"2019","journal-title":"Hot Chips"},{"key":"ref27","year":"0","journal-title":"MLPerf Inference 0 7 details"},{"key":"ref3","article-title":"Google Turning Its Lucrative Web Search Over to AI Machines","author":"clark","year":"2015","journal-title":"Bloomberg Technology"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/2408776.2408794"},{"key":"ref29","year":"0","journal-title":"All results 1\/8\/2021 All results 1\/8\/2021 Figure 2 Train-05-4 Train-0 5-20 Train-0 5-21 Table 6 Inf-0 5-25 Inf-0 5-21 Inf-0 5-33 Inf-0 7-119 Inf-0 5-31"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3361682"},{"key":"ref8","author":"fisher","year":"2005","journal-title":"Embedded Computing A VLIW Approach to Architecture Compilers and Tools"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3362743.3362964"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.2200\/S00874ED3V01Y201809CAC046"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/HPCA.2019.00023"},{"key":"ref1","year":"0","journal-title":"Google breaks AI performance records in MLPerf with world&#x2019;s fastest training supercomputer"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1145\/1498765.1498785"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/HCS49909.2020.9220619"},{"key":"ref45","year":"0","journal-title":"Technology node"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3154484"},{"key":"ref47","article-title":"Problems Facing Analog and In -Memory Computing","author":"zimmer","year":"2020","journal-title":"UC Berkeley"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/3079856.3080246"},{"key":"ref42","author":"smith","year":"2020","journal-title":"Micron Spills on GDDR6X"},{"key":"ref24","author":"kalamkar","year":"2019","journal-title":"A study of BFLOAT16 for Deep Learning Training"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1038\/nature24270"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/3360307"},{"key":"ref44","first-page":"1","article-title":"Spring Hill (NNP-I 1000) Intel&#x2019;s data center inference chip","author":"wechsler","year":"2019","journal-title":"2019 IEEE Hot Chips 31 Symposium"},{"key":"ref26","year":"0","journal-title":"TN-ED-03 GDDR6 The Next-Generation Graphics DRAM"},{"key":"ref43","author":"stojanovi?","year":"2012","journal-title":"Designing VLSI Interconnects with Monolithically Integrated Silicon-Photonics"},{"key":"ref25","author":"knuth","year":"2008","journal-title":"Interview With Donald Knuth"}],"event":{"name":"2021 ACM\/IEEE 48th Annual International Symposium on Computer Architecture (ISCA)","location":"Valencia, Spain","start":{"date-parts":[[2021,6,14]]},"end":{"date-parts":[[2021,6,18]]}},"container-title":["2021 ACM\/IEEE 48th Annual International Symposium on Computer Architecture (ISCA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9499716\/9499722\/09499913.pdf?arnumber=9499913","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,7,9]],"date-time":"2022-07-09T02:19:22Z","timestamp":1657333162000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9499913\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,6]]},"references-count":47,"URL":"https:\/\/doi.org\/10.1109\/isca52012.2021.00010","relation":{},"subject":[],"published":{"date-parts":[[2021,6]]}}}