{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,19]],"date-time":"2026-04-19T22:45:57Z","timestamp":1776638757587,"version":"3.51.2"},"reference-count":139,"publisher":"IEEE","license":[{"start":{"date-parts":[[2021,9,20]],"date-time":"2021-09-20T00:00:00Z","timestamp":1632096000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2021,9,20]],"date-time":"2021-09-20T00:00:00Z","timestamp":1632096000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2021,9,20]],"date-time":"2021-09-20T00:00:00Z","timestamp":1632096000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,9,20]]},"DOI":"10.1109\/hpec49654.2021.9622867","type":"proceedings-article","created":{"date-parts":[[2021,12,1]],"date-time":"2021-12-01T20:57:36Z","timestamp":1638392256000},"page":"1-9","source":"Crossref","is-referenced-by-count":85,"title":["AI Accelerator Survey and Trends"],"prefix":"10.1109","author":[{"given":"Albert","family":"Reuther","sequence":"first","affiliation":[]},{"given":"Peter","family":"Michaleas","sequence":"additional","affiliation":[]},{"given":"Michael","family":"Jones","sequence":"additional","affiliation":[]},{"given":"Vijay","family":"Gadepally","sequence":"additional","affiliation":[]},{"given":"Siddharth","family":"Samsi","sequence":"additional","affiliation":[]},{"given":"Jeremy","family":"Kepner","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","article-title":"Blaize Ignites Edge-AI Performance","author":"demler","year":"2020","journal-title":"Tech Rep the Linley Group"},{"key":"ref38","article-title":"Bitmain SoC Brings AI to the Edge","author":"wheeler","year":"2019"},{"key":"ref33","article-title":"AMD Announces Radeon Instinct MI60 & MI50 Accelerators Powered By 7nm Vega","author":"smith","year":"2018"},{"key":"ref32","article-title":"Taking a Deeper Look at AMD Radeon Instinct GPUs for Deep Learning","year":"2017"},{"key":"ref31","article-title":"Deep dive into Amazon Inferentia: A custom-built chip to enhance ML and AI","author":"evangelist","year":"2020"},{"key":"ref30","article-title":"AWS Inferentia Machine Learning Processor","author":"hamilton","year":"2018"},{"key":"ref37","article-title":"Baidu Creates Kunlun Silicon for AI","author":"duckett","year":"2018"},{"key":"ref36","article-title":"Baidu Accelerator Rises in AI","author":"merritt","year":"2018"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC42613.2021.9366056"},{"key":"ref34","article-title":"Arm Ethos is for Ubiquitous AI At the Edge &#x2014; WikiChip Fuse","author":"schor","year":"2020"},{"key":"ref28","article-title":"Alibaba&#x2019;s New AI Chip Can Process Nearly 80K Images Per Second","author":"peng","year":"2019"},{"key":"ref27","article-title":"Startup Accelerates AI at the Sensor","author":"merritt","year":"2019"},{"key":"ref29","article-title":"Indo-US startup preps agent-based AI processor","author":"clarke","year":"2018"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3309551"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-18338-7_12"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.51593\/20190014"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1145\/3154484"},{"key":"ref23","article-title":"ImageNet Classification with Deep Convolutional Neural Networks","volume":"25","author":"krizhevsky","year":"2012","journal-title":"Neural Information Processing Systems"},{"key":"ref101","article-title":"Preferred Networks: A 500 W Custom PCIe Card using 3000 mm2 Silicon","author":"cutress","year":"2019"},{"key":"ref26","article-title":"aiWare3 Hardware IP Helps Drive Autonomous Vehicles To Production","year":"2018"},{"key":"ref100","article-title":"MN-Core","year":"2020"},{"key":"ref25","article-title":"FPGA acceleration card delivers on bandwidth, speed, and flexibility","author":"roos","year":"2019"},{"key":"ref50","article-title":"Tearing Apart Google&#x2019;s TPU 3.0 AI Coprocessor","author":"teich","year":"2018"},{"key":"ref51","first-page":"1","article-title":"Ten Lessons From Three Generations Shaped Google&#x2019;s TPUv4i","author":"jouppi","year":"2021","journal-title":"2021 ACM\/IEEE 48th Annual International Symposium on Computer Architecture (ISCA)"},{"key":"ref59","article-title":"Gyrfalcon Unveils Fourth AI Accelerator Chip &#x2014; EE Times","author":"ward-foxton","year":"2019"},{"key":"ref58","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00023"},{"key":"ref57","article-title":"Groq Shares Recipe for TSP Nodes, Systems","author":"hemsoth","year":"2020"},{"key":"ref56","article-title":"GAP9 for ML at the Edge EEJournal","author":"turley","year":"2020"},{"key":"ref55","article-title":"GAP application processors - GreenWaves Technologies","year":"2020"},{"key":"ref54","article-title":"Dell DSS8440 Graphcore IPU Server","year":"2020","journal-title":"Graphcore Tech Rep"},{"key":"ref53","article-title":"Preliminary IPU Benchmarks","author":"lacey","year":"2017"},{"key":"ref52","article-title":"Groq Rocks Neural Networks","author":"gwennap","year":"2020","journal-title":"Micropro-cessor Report Tech Rep"},{"key":"ref40","article-title":"Chinese AI Chip Maker Cambricon Unveils New Cloud-Based Smart Chip China Money Network","author":"wu","year":"2018"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1126\/science.aam9744"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC.2014.6757323"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3282307"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3430936"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC.2019.8662396"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1145\/3360307"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1145\/3361682"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC43674.2020.9286149"},{"key":"ref46","article-title":"Globalfoundries aids launch of Chinese AI startup","author":"clarke","year":"2019"},{"key":"ref45","article-title":"Cornami Achieves Unprecedented Performance at Lowest Power Dissipation for Deep Neural Networks","year":"2019"},{"key":"ref48","article-title":"Edge TPU","year":"2019"},{"key":"ref47","article-title":"Performance Estimation and Benchmarks for Real-World Edge Inference Applications","author":"mehta","year":"2020","journal-title":"Linley Spring Processor Conference"},{"key":"ref42","article-title":"Kendryte Embeds AI for Surveillance","author":"gwennap","year":"2019"},{"key":"ref41","article-title":"Cambricon, Maker of Hauwei&#x2019;s Kirin NPU IP, Build a Big AI Chip and PCIe Card","author":"cutress","year":"2018"},{"key":"ref44","article-title":"Cerebras Doubles AI Performance with Second-Gen 7nm Wafer Scale Engine","author":"trader","year":"2021"},{"key":"ref43","article-title":"Introducing the Cerebras CS-1, the Industry&#x2019;s Fastest Artificial Intelligence Computer - Cerebras","author":"hock","year":"2019"},{"key":"ref127","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2016.2616357"},{"key":"ref126","first-page":"1","article-title":"Eyeriss: A Spatial Architecture for Energy-Efficient Dataflow for Convolutional Neural Networks","author":"chen","year":"2018","journal-title":"IEEE Micro"},{"key":"ref125","article-title":"Centaur Adds AI to Server Processor: First x86 SoC to Integrate Deep-Learning Accelerator","author":"gwennap","year":"2019","journal-title":"Tech Rep the Linley Group"},{"key":"ref124","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00013"},{"key":"ref73","article-title":"New Movidius Myriad X VPU Packs a Custom Neural Compute Engine","author":"hruska","year":"2017"},{"key":"ref72","article-title":"Intel FPGA Architecture Focuses on Deep Learning Inference","author":"hemsoth","year":"2018"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.1145\/3093337.3037702"},{"key":"ref71","doi-asserted-by":"publisher","DOI":"10.1109\/FPL.2018.00077"},{"key":"ref128","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA.2016.30"},{"key":"ref70","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2015.2474396"},{"key":"ref76","article-title":"Intel Xeon Platinum 8280","year":"2020"},{"key":"ref130","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-019-1424-8"},{"key":"ref77","article-title":"Kalray&#x2019;s MPPA&#x00AE; Manycore Processor: At the Heart of Intelligent Systems","author":"dupont de dinechin","year":"0","journal-title":"IEEE International New Circuits and Systems Conference (NEWCAS)"},{"key":"ref74","article-title":"Intel&#x2019;s Xeon Cascade Lake vs. NVIDIA Turing: An Analysis in AI","author":"de gelas","year":"2019"},{"key":"ref75","article-title":"Intel Xeon Platinum 8180","year":"2020"},{"key":"ref133","doi-asserted-by":"publisher","DOI":"10.1109\/ACSSC.2014.7094761"},{"key":"ref134","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2011.5981829"},{"key":"ref131","doi-asserted-by":"publisher","DOI":"10.1145\/2996864"},{"key":"ref78","article-title":"NXP, Kalray demo Coolidge parallel processor in &#x2019;BlueBox&#x2019;","author":"clarke","year":"2020"},{"key":"ref132","first-page":"1","article-title":"Epiphany-V: A 1024 processor 64-bit RISC System-On-Chip","author":"olofsson","year":"2016"},{"key":"ref79","article-title":"Kneron&#x2019;s Next-Gen Edge AI Chip Gets $40m Boost","author":"ward-foxton","year":"2020"},{"key":"ref136","article-title":"Convnet Burden","author":"albanie","year":"2019"},{"key":"ref135","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00045"},{"key":"ref138","article-title":"NVIDIA Tesla T4 AI Inferencing GPU Benchmarks and Review","author":"harmon","year":"2019"},{"key":"ref137","doi-asserted-by":"publisher","DOI":"10.1145\/1498765.1498785"},{"key":"ref60","article-title":"SolidRun, Gyrfalcon Develop Arm-based Edge Optimized AI Inference Server","year":"2020"},{"key":"ref139","article-title":"Virtual Conference Delivers Real Chips","author":"krewell","year":"2020"},{"key":"ref62","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2020.2975185"},{"key":"ref61","article-title":"Habana Offers Gaudi for AI Training","author":"gwennap","year":"2019","journal-title":"Technical report Microprocessor Report"},{"key":"ref63","article-title":"Habana Wins Cigar for AI Inference","author":"gwennap","year":"2019"},{"key":"ref64","article-title":"Details of Hailo AI Edge Accelerator Emerge","author":"ward-foxton","year":"2019"},{"key":"ref65","article-title":"Horizon Robotics Journey2 Automotive AI Processor Series","year":"2020"},{"key":"ref66","article-title":"Ascend 310 AI Processor","year":"2020"},{"key":"ref67","article-title":"Ascend 910 AI Processor","year":"2020"},{"key":"ref68","article-title":"IBM Finds Killer App for TrueNorth Neuromorphic Chip","author":"feldman","year":"2016"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MCSE.2017.29"},{"key":"ref69","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1604850113"},{"key":"ref1","article-title":"AI Enabling Technologies","author":"gadepally","year":"2019","journal-title":"MIT Lincoln Lab Lexington MA Rep"},{"key":"ref109","article-title":"Tenstorrent Scales AI Performance: Architecture Leads in Data-Center Power Efficiency","author":"gwennap","year":"2020","journal-title":"Technical report Microprocessor Report"},{"key":"ref95","article-title":"Defining AI Innovation with NVIDIA DGX A100","author":"campa","year":"2020"},{"key":"ref108","article-title":"Startup Rolls AI Chips for Audio","author":"merritt","year":"2018"},{"key":"ref94","article-title":"NVIDIA&#x2019;s DGX-2: Sixteen Tesla V100s, 30TB of NVMe, Only $400K","author":"cutress","year":"2018"},{"key":"ref107","article-title":"Tech Heavyweights Back AI Chip Startup","author":"mcgrath","year":"2018"},{"key":"ref93","article-title":"Nvidia Infuses DGX-1 with Volta, Eight V100s in a Single Chassis","author":"alcorn","year":"2017"},{"key":"ref106","article-title":"Machine Learning Moves to the Edge","author":"gwennap","year":"2020","journal-title":"Technical report Microprocessor Report"},{"key":"ref92","article-title":"NVIDIA Tesla V100 Tensor Core GPU","year":"2019"},{"key":"ref105","article-title":"Rockchip Released Its First AI Processor RK3399Pro NPU Performance Up to 2.4TOPs","year":"2018"},{"key":"ref91","article-title":"NVIDIA Turing Architecture In-Depth","author":"kilgariff","year":"2018"},{"key":"ref104","article-title":"Qualcomm Targets AI Inferencing in the Cloud &#x2014; EE Times","author":"mcgrath","year":"2019"},{"key":"ref90","article-title":"16GB NVIDIA Tesla V100 Gets Reprieve; Remains in Production","author":"smith","year":"2018"},{"key":"ref103","article-title":"Qualcomm Cloud AI 100 Promises Impressive Performance per Watt for Near-Edge AI","author":"ward-foxton","year":"2020"},{"key":"ref102","article-title":"Quadric Edge Supercomputer","author":"firu","year":"2019","journal-title":"Quadric Tech Rep"},{"key":"ref111","article-title":"FSD Chip - Tesla","year":"2020"},{"key":"ref112","article-title":"TI&#x2019;s First Automotive SoC with an AI Accelerator Launches","author":"ward-foxton","year":"2021"},{"key":"ref110","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2020.2975764"},{"key":"ref98","article-title":"Perceive Exits Stealth With Super Efficient Machine Learning Chip For Smarter Devices","author":"mcgregor","year":"2020"},{"key":"ref99","article-title":"The 2,048-core PEZY-SC2 sets a Green500 record","author":"schor","year":"2017"},{"key":"ref96","article-title":"NVIDIA Jetson TX2 Delivers Twice the Intelligence to the Edge","author":"franklin","year":"2017"},{"key":"ref97","article-title":"NVIDIA Gives Jetson AGX Xavier a Trim, Announces Nano-Sized Jetson Xavier NX","author":"smith","year":"2019"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2019.8916327"},{"key":"ref11","article-title":"An Analysis of Deep Neural Network Models for Practical Applications","author":"canziani","year":"2016"},{"key":"ref12","article-title":"Intel Benchmarks Neuromorphic Chip Against AI Accelerators","author":"ward-foxton","year":"2020"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1117\/12.205116"},{"key":"ref14","article-title":"Neural Networks in Hardware: A Survey","author":"liao","year":"2001","journal-title":"Department of Computer Science University of California Tech Rep"},{"key":"ref15","doi-asserted-by":"crossref","first-page":"239","DOI":"10.1016\/j.neucom.2010.03.021","article-title":"Artificial neural networks in hardware: A survey of two decades of progress","volume":"74","author":"misra","year":"2010","journal-title":"Neurocomputing"},{"key":"ref118","article-title":"Enflame Stokes AI Acceleration","author":"wheeler","year":"2021"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2017.2761740"},{"key":"ref82","article-title":"Mythic Resizes its AI Chip","author":"ward-foxton","year":"2021"},{"key":"ref117","article-title":"XMOS adapts Xcore into AIoT crossover processor&#x2019; &#x2014; EE Times","author":"ward-foxton","year":"2020"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.2200\/S01004ED1V01Y202004CAC050"},{"key":"ref81","article-title":"Drilling Into Microsoft&#x2019;s BrainWave Soft Deep Learning Chip","author":"morgan","year":"2017"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1117\/12.2529407"},{"key":"ref84","article-title":"Mythic @ Hot Chips 2018 - Mythic - Medium","author":"fick","year":"2018"},{"key":"ref119","article-title":"Mobileye&#x2019;s New EyeQ5: How Open is Open?","year":"2018"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.eng.2020.01.007"},{"key":"ref83","article-title":"A Mythic Approach to Deep Learning Inference","author":"hemsoth","year":"2018"},{"key":"ref114","article-title":"TI Jacinto Accelerates Level 3 ADAS","author":"demler","year":"2020"},{"key":"ref113","article-title":"TDA4VM Jacinto Processors for ADAS and Autonomous Vehicles","year":"2021","journal-title":"Texas Instruments Tech Rep"},{"key":"ref116","article-title":"Untether Delivers At-Memory AI","author":"gwennap","year":"2020","journal-title":"Tech Rep the Linley Group"},{"key":"ref80","article-title":"Kneron Attracts Strategic Investors &#x2014; EE Times","author":"ward-foxton","year":"2021"},{"key":"ref115","article-title":"Samsung, Toshiba Detail AI Chips","author":"merritt","year":"2019"},{"key":"ref120","article-title":"Introducing 2nd Generation IPU Systems for AI at Scale","author":"toon","year":"2020"},{"key":"ref89","article-title":"NVIDIA Tesla P100","year":"0"},{"key":"ref121","article-title":"Graphcore Unveils New GC200 Chip and the Expandable M2000 IPU Machine That Runs on Them","author":"lunden","year":"2020"},{"key":"ref122","article-title":"Latest MLPerf Results","author":"russell","year":"2021"},{"key":"ref123","article-title":"SambaNova Emerges From Stealth With Record-Breaking AI System","author":"ward-foxton","year":"2020"},{"key":"ref85","article-title":"NovuMind: An Early Entrant in AI Silicon","author":"freund","year":"2019","journal-title":"Moor Insights & Strategy Tech Rep"},{"key":"ref86","article-title":"NovuMind&#x2019;s AI Chip Sparks Controversy","author":"yoshida","year":"2018"},{"key":"ref87","article-title":"NVIDIA Ampere Architecture In-Depth","author":"krashinsky","year":"2020"},{"key":"ref88","article-title":"Nvidia Rounds Out","author":"morgan","year":"2021","journal-title":"Ampere\" Lineup With Two New Accelerators \""}],"event":{"name":"2021 IEEE High Performance Extreme Computing Conference (HPEC)","location":"Waltham, MA, USA","start":{"date-parts":[[2021,9,20]]},"end":{"date-parts":[[2021,9,24]]}},"container-title":["2021 IEEE High Performance Extreme Computing Conference (HPEC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9622740\/9622741\/09622867.pdf?arnumber=9622867","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,5,10]],"date-time":"2022-05-10T16:53:50Z","timestamp":1652201630000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9622867\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,9,20]]},"references-count":139,"URL":"https:\/\/doi.org\/10.1109\/hpec49654.2021.9622867","relation":{},"subject":[],"published":{"date-parts":[[2021,9,20]]}}}