{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,9]],"date-time":"2026-03-09T01:17:17Z","timestamp":1773019037537,"version":"3.50.1"},"reference-count":135,"publisher":"IEEE","license":[{"start":{"date-parts":[[2020,9,22]],"date-time":"2020-09-22T00:00:00Z","timestamp":1600732800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2020,9,22]],"date-time":"2020-09-22T00:00:00Z","timestamp":1600732800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2020,9,22]],"date-time":"2020-09-22T00:00:00Z","timestamp":1600732800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2020,9,22]]},"DOI":"10.1109\/hpec43674.2020.9286149","type":"proceedings-article","created":{"date-parts":[[2020,12,22]],"date-time":"2020-12-22T21:07:15Z","timestamp":1608671235000},"page":"1-12","source":"Crossref","is-referenced-by-count":126,"title":["Survey of Machine Learning Accelerators"],"prefix":"10.1109","author":[{"given":"Albert","family":"Reuther","sequence":"first","affiliation":[]},{"given":"Peter","family":"Michaleas","sequence":"additional","affiliation":[]},{"given":"Michael","family":"Jones","sequence":"additional","affiliation":[]},{"given":"Vijay","family":"Gadepally","sequence":"additional","affiliation":[]},{"given":"Siddharth","family":"Samsi","sequence":"additional","affiliation":[]},{"given":"Jeremy","family":"Kepner","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1145\/2996864"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.1109\/JSSC.2016.2616357"},{"key":"ref33","author":"albanie","year":"2019","journal-title":"Convnet Burden"},{"key":"ref32","first-page":"1737","article-title":"Deep Learning with Limited Numerical Precision","author":"gupta","year":"2015","journal-title":"Proceedings of the 32Nd International Conference on International Conference on Machine Learning - Volume 37 ser ICML'15 JMLR org"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1145\/3154484"},{"key":"ref30","article-title":"ImageNet Classification with Deep Convolutional Neural Networks","volume":"25","author":"krizhevsky","year":"2012","journal-title":"Neural Information Processing Systems"},{"key":"ref37","first-page":"1","article-title":"Eyeriss: A Spatial Architecture for Energy-Efficient Dataflow for Convolutional Neural Networks","author":"chen","year":"2018","journal-title":"IEEE Micro"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/3093337.3037702"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA.2016.30"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2011.5981829"},{"key":"ref28","author":"khan","year":"2020","journal-title":"AI Chips What They Are and Why They Matter"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1145\/3309551"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-18338-7_12"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1371\/journal.pone.0085175"},{"key":"ref22","author":"liao","year":"2001","journal-title":"Neural Networks in Hardware A Survey"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1117\/12.205116"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.2200\/S01004ED1V01Y202004CAC050"},{"key":"ref23","doi-asserted-by":"crossref","first-page":"239","DOI":"10.1016\/j.neucom.2010.03.021","article-title":"Artificial neural networks in hardware: A survey of two decades of progress","volume":"74","author":"misra","year":"2010","journal-title":"Neurocomputing"},{"key":"ref101","year":"2020","journal-title":"Ascend 910 AI Processor"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1016\/j.eng.2020.01.007"},{"key":"ref100","doi-asserted-by":"publisher","DOI":"10.1109\/ISCA45697.2020.00023"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1117\/12.2529407"},{"key":"ref50","author":"ward-foxton","year":"2020","journal-title":"Kneron's Next-Gen Edge AI Chip Gets $40m Boost"},{"key":"ref51","author":"merritt","year":"2019","journal-title":"Startup Accelerates AI at the Sensor"},{"key":"ref59","author":"yoshida","year":"2018","journal-title":"NovuMind's AI Chip Sparks Controversy"},{"key":"ref58","author":"wheeler","year":"2019","journal-title":"Bitmain SoC Brings AI to the Edge"},{"key":"ref57","author":"schor","year":"2020","journal-title":"Arm Ethos is for Ubiquitous AI At the Edge - WikiChip Fuse"},{"key":"ref56","author":"ward-foxton","year":"2020","journal-title":"XMOS adapts Xcore into AIoT crossover processor&#x2019; - EE Times"},{"key":"ref55","author":"mcgregor","year":"2020","journal-title":"Perceive Exits Stealth With Super Efficient Machine Learning Chip For Smarter Devices"},{"key":"ref54","author":"hemsoth","year":"2018","journal-title":"A Mythic Approach to Deep Learning Inference"},{"key":"ref53","author":"fick","year":"2018","journal-title":"Mythic Hot Chips 2018 - Mythic - Medium"},{"key":"ref52","author":"mcgrath","year":"2018","journal-title":"Tech Heavyweights Back AI Chip Startup"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2014.58"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3282307"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/ISSCC.2014.6757323"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/HPEC.2019.8916327"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3361682"},{"key":"ref8","first-page":"1","article-title":"A survey of FPGA-based accelerators for convolutional neural networks","author":"mittal","year":"2018","journal-title":"Neural Computing and Applications"},{"key":"ref49","year":"2020","journal-title":"GAP application processors - Green Waves Technologies"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/s11704-016-6159-1"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1016\/j.sysarc.2019.01.007"},{"key":"ref46","year":"2019","journal-title":"Edge TPU"},{"key":"ref45","author":"hruska","year":"2017","journal-title":"New Movidius Myriad X VPU Packs a Custom Neural Compute Engine"},{"key":"ref48","author":"turley","year":"2020","journal-title":"GAP9 for ML at the Edge EEJournal"},{"key":"ref47","year":"2018","journal-title":"Rockchip Released Its First AI Processor RK3399Pro NPU Performance up to 2 4TOPs"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1145\/2786763.2694358"},{"key":"ref41","doi-asserted-by":"crossref","first-page":"92","DOI":"10.1145\/2872887.2750389","article-title":"ShiDianNao: Shifting vision processing closer to the sensor","volume":"43","author":"du","year":"2015","journal-title":"ACM SIGARCH Computer Architecture News"},{"key":"ref44","author":"feldman","year":"2016","journal-title":"IBM Finds Killer App for TrueNorth Neuromorphic Chip"},{"key":"ref43","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2015.2474396"},{"key":"ref127","author":"feldman","year":"2018","journal-title":"Photonic Computing Company Takes Aim at Artificial Intelligence"},{"key":"ref126","author":"feldman","year":"2019","journal-title":"The Silicon Photonics Key to Building Better Neural Networks"},{"key":"ref125","author":"dunietz","year":"2017","journal-title":"Light-Powered Computers Brighten AI's Future"},{"key":"ref124","author":"hemsoth","year":"2018","journal-title":"First Wave of Spiking Neural Network Hardware Hits"},{"key":"ref73","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2020.2975764"},{"key":"ref72","year":"2020","journal-title":"FSD Chip - Tesla"},{"key":"ref71","author":"firu","year":"2019","journal-title":"Quadric Edge Supercomputer"},{"key":"ref129","doi-asserted-by":"publisher","DOI":"10.1038\/nphoton.2017.93"},{"key":"ref128","year":"2020","journal-title":"Photonic Computing for Massively Parallel AI"},{"key":"ref70","author":"hruska","year":"2018","journal-title":"Nvidia&#x2019;s Jetson Xavier Stuffs Volta Performance Into Tiny Form Factor"},{"key":"ref76","author":"schor","year":"2017","journal-title":"The 2 048-core PEZY-SC2 sets a Green500 record - WikiChip Fuse"},{"key":"ref77","author":"gwennap","year":"2020","journal-title":"Tenstorrent Scales AI Performance Architecture Leads in Data-Center Power Efficiency"},{"key":"ref130","author":"clarke","year":"2019","journal-title":"Startup reveals prototype optical AI processor says report"},{"key":"ref74","author":"merritt","year":"2019","journal-title":"Samsung Toshiba Detail AI Chips"},{"key":"ref75","author":"de gelas","year":"2019","journal-title":"Intel's Xeon Cascade Lake vs NVIDIA Turing An Analysis in AI"},{"key":"ref133","author":"giles","year":"2019","journal-title":"Bill Gates just backed a chip startup that uses light to turbocharge AI"},{"key":"ref134","author":"freund","year":"2020","journal-title":"Intel Lays Out Strategy For AI It's Habana"},{"key":"ref78","author":"hemsoth","year":"2018","journal-title":"Intel FPGA Architecture Focuses on Deep Learning Inference"},{"key":"ref131","author":"feldman","year":"2018","journal-title":"Optalysys Claims AI Breakthrough Using Optical Processing Technology"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/FPL.2018.00077"},{"key":"ref132","author":"feldman","year":"2018","journal-title":"Optical Computing Startup Demos Training of Neural Networks"},{"key":"ref135","author":"clarke","year":"2016","journal-title":"Military startup aims large with neural processor chip"},{"key":"ref60","author":"freund","year":"2019","journal-title":"NovuMind An Early Entrant in AI Silicon"},{"key":"ref62","year":"2018","journal-title":"aiWare3 Hardware IP Helps Drive Autonomous Vehicles To Production"},{"key":"ref61","author":"ward-foxton","year":"2019","journal-title":"Gyrfalcon Unveils Fourth AI Accelerator Chip - EE Times"},{"key":"ref63","author":"clarke","year":"2018","journal-title":"Indo-US startup preps agent-based AI processor"},{"key":"ref64","author":"ward-foxton","year":"2019","journal-title":"Details of Hailo AI Edge Accelerator Emerge"},{"key":"ref65","year":"2020","journal-title":"Horizon Robotics Journey2 Automotive AI Processor Series"},{"key":"ref66","year":"2020","journal-title":"Ascend 310 AI Processor"},{"key":"ref67","article-title":"Kalray's MPPA&#x00AE; Manycore Processor: At the Heart of Intelligent Systems","author":"de dinechin","year":"2019","journal-title":"IEEE International New Circuits and Systems Conference (NEWCAS)"},{"key":"ref68","author":"clarke","year":"2020","journal-title":"NXP Kalray demo Coolidge parallel processor in &#x2018;BlueBox&#x2019;"},{"key":"ref69","author":"franklin","year":"2017","journal-title":"NVIDIA Jetson TX2 Delivers Twice the Intelligence to the Edge"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MCSE.2017.29"},{"key":"ref1","author":"gadepally","year":"2019","journal-title":"AI Enabling Technologies"},{"key":"ref95","author":"duckett","year":"2018","journal-title":"Baidu creates kunlun silicon for ai"},{"key":"ref109","year":"2020","journal-title":"Dell DSS8440 Graphcore IPU Server"},{"key":"ref94","author":"merritt","year":"2018","journal-title":"Baidu Accelerator Rises in AI"},{"key":"ref108","author":"campa","year":"2020","journal-title":"Defining AI Innovation with NVIDIA DGX A100"},{"key":"ref107","author":"cutress","year":"2018","journal-title":"NVIDIA&#x2019;s DGX-2 Sixteen Tesla V100s 30TB of NVMe Only $400K"},{"key":"ref93","author":"evangelist","year":"2020","journal-title":"Deep dive into Amazon Inferentia A custom-built chip to enhance ML and AI"},{"key":"ref106","author":"alcorn","year":"2017","journal-title":"Nvidia Infuses DGX-1 with Volta Eight V100s in a Single Chassis"},{"key":"ref92","author":"hamilton","year":"2018","journal-title":"AWS Inferentia Machine Learning Processor"},{"key":"ref105","author":"hock","year":"2019","journal-title":"Introducing the Cerebras CS-1 the Industry's Fastest Artificial Intelligence Computer - Cerebras"},{"key":"ref91","author":"peng","year":"2019","journal-title":"Alibaba's New AI Chip Can Process Nearly 80K Images Per Second"},{"key":"ref104","author":"gwennap","year":"2019","journal-title":"Habana Offers Gaudi for AI Training"},{"key":"ref90","author":"smith","year":"2018","journal-title":"AMD Announces Radeon Instinct MI60 & MI50 Accelerators Powered By 7nm Vega"},{"key":"ref103","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2020.2975185"},{"key":"ref102","author":"gwennap","year":"2019","journal-title":"Habana Wins Cigar for AI Inference"},{"key":"ref111","year":"2020","journal-title":"SolidRun Gyrfalcon Develop Arm-based Edge Optimized AI Inference Server"},{"key":"ref112","author":"mcgrath","year":"2019","journal-title":"Qualcomm Targets AI Inferencing in the Cloud - EE Times"},{"key":"ref110","author":"lacey","year":"2020","journal-title":"Updated Graphcore IPU benchmarks"},{"key":"ref98","author":"lacey","year":"2017","journal-title":"Preliminary IPU Benchmarks"},{"key":"ref99","author":"gwennap","year":"2020","journal-title":"Groq Rocks Neural Networks"},{"key":"ref96","author":"cutress","year":"2018","journal-title":"Cambricon Maker of Hauwei's Kirin NPU IP Build a Big AI Chip and PCIe Card"},{"key":"ref97","author":"teich","year":"2018","journal-title":"Tearing Apart Google&#x2019;s TPU 3 0 AI Coprocessor"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3289185"},{"key":"ref11","author":"canziani","year":"2016","journal-title":"An analysis of deep neural network models for practical applications"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2017.2761740"},{"key":"ref13","article-title":"Mixed precision training","author":"narang","year":"2018","journal-title":"Proc of ICLR (Vancouver Canada)"},{"key":"ref14","author":"schuman","year":"2017","journal-title":"A survey of neuromorphic computing and neural networks in hardware"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1126\/science.1254642"},{"key":"ref82","article-title":"Performance Estimation and Benchmarks for Real-World Edge Inference Applications","author":"mehta","year":"2020","journal-title":"Linley Spring Processor Conference"},{"key":"ref118","year":"2018","journal-title":"Baidu Backs Neuromorphic IC Developer"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1073\/pnas.1604850113"},{"key":"ref81","year":"2019","journal-title":"Cornami Achieves Unprecedented Performance at Lowest Power Dissipation for Deep Neural Networks"},{"key":"ref117","author":"moore","year":"2020","journal-title":"Low-Power AI Startup Eta Compute Delivers First Commercial Chips - IEEE Spectrum"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2008.4634199"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/IISWC.2017.8167769"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/MC.2018.157113521"},{"key":"ref83","author":"morgan","year":"2017","journal-title":"Drilling Into Microsoft's BrainWave Soft Deep Learning Chip"},{"key":"ref119","author":"clarke","year":"2018","journal-title":"AI chip startup offers new edge computing solution"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1038\/s41586-019-1424-8"},{"key":"ref114","year":"2019","journal-title":"Enflame Technology Announces CloudBlazer with DTU Chip on GLOBALFOUNDRIES 12LP FinFET Platform for Data Center Training"},{"key":"ref113","author":"yoshida","year":"2019","journal-title":"Blaize Fires up GSP for AI Processing"},{"key":"ref80","author":"roos","year":"2019","journal-title":"FPGA acceleration card delivers on bandwidth speed and flexibility"},{"key":"ref116","year":"2020","journal-title":"BrainChip Showcases Vision and Learning Capabilities of its Akida Neural Processing IP and Device at tinyML Summit 2020"},{"key":"ref115","author":"gwennap","year":"2018","journal-title":"Esperanto Maxes Out RISC-V High-End Maxion CPU Raises RISC-V Performance Bar"},{"key":"ref89","year":"2017","journal-title":"Taking a Deeper Look at AMD Radeon Instinct GPUs for Deep Learning"},{"key":"ref120","first-page":"15.4.1","article-title":"A 68 Parallel Row Access Neuromorphic Core with 22K Multi-Level Synapses Based on Logic-Compatible Embedded Flash Memory Technology","volume":"2018 decem","author":"kim","year":"2019","journal-title":"Technical Digest - International Electron Devices Meeting IEDM"},{"key":"ref121","author":"dahad","year":"2019","journal-title":"Startup Launches Its First Low Latency Edge AI Chip"},{"key":"ref122","author":"clarke","year":"2020","journal-title":"GrAI Matter research gives rise to AI processor for the edge"},{"key":"ref123","first-page":"1","article-title":"Cell Culture, Transport and Investigation","author":"agabi","year":"2016"},{"key":"ref85","year":"2019","journal-title":"NVIDIA Tesla V100 Tensor Core GPU"},{"key":"ref86","author":"smith","year":"2018","journal-title":"16GB NVIDIA Tesla V100 Gets Reprieve Remains in Production"},{"key":"ref87","author":"kilgariff","year":"2018","journal-title":"NVIDIA Turing Architecture In-Depth"},{"key":"ref88","author":"krashinsky","year":"2020","journal-title":"NVIDIA Ampere Architecture In-Depth"}],"event":{"name":"2020 IEEE High Performance Extreme Computing Conference (HPEC)","location":"Waltham, MA, USA","start":{"date-parts":[[2020,9,22]]},"end":{"date-parts":[[2020,9,24]]}},"container-title":["2020 IEEE High Performance Extreme Computing Conference (HPEC)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9285977\/9286137\/09286149.pdf?arnumber=9286149","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,6,27]],"date-time":"2022-06-27T15:54:48Z","timestamp":1656345288000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9286149\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2020,9,22]]},"references-count":135,"URL":"https:\/\/doi.org\/10.1109\/hpec43674.2020.9286149","relation":{},"subject":[],"published":{"date-parts":[[2020,9,22]]}}}