{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,13]],"date-time":"2025-10-13T15:35:49Z","timestamp":1760369749540,"version":"3.37.3"},"reference-count":22,"publisher":"IEEE","funder":[{"DOI":"10.13039\/501100003246","name":"NWO","doi-asserted-by":"publisher","award":["P3"],"award-info":[{"award-number":["P3"]}],"id":[{"id":"10.13039\/501100003246","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2021,2,1]]},"DOI":"10.23919\/date51398.2021.9473984","type":"proceedings-article","created":{"date-parts":[[2021,8,24]],"date-time":"2021-08-24T22:11:46Z","timestamp":1629843106000},"page":"120-123","source":"Crossref","is-referenced-by-count":6,"title":["Efficient Tensor Cores support in TVM for Low-Latency Deep learning"],"prefix":"10.23919","author":[{"given":"Wei","family":"Sun","sequence":"first","affiliation":[]},{"given":"Savvas","family":"Sioutas","sequence":"additional","affiliation":[]},{"given":"Sander","family":"Stuijk","sequence":"additional","affiliation":[]},{"given":"Andrew","family":"Nelson","sequence":"additional","affiliation":[]},{"given":"Henk","family":"Corporaal","sequence":"additional","affiliation":[]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"journal-title":"Squeezenet Alexnet-level accuracy with 50x fewer parameters and< 0 5 mb model size","year":"2016","author":"iandola","key":"ref11"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2019.2918851"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.435"},{"key":"ref14","article-title":"Deep Learning","author":"lecun","year":"0","journal-title":"Nature (2015)"},{"journal-title":"The deep learning compiler A comprehensive survey","year":"2020","author":"li","key":"ref15"},{"key":"ref16","article-title":"Optimizing CNN Model Inference on CPUs","author":"liu","year":"0","journal-title":"USENIX ATC &#x2018;19 Renton WA USA"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/IPDPSW.2018.00091"},{"journal-title":"Fast training of convolutional networks through ffts","year":"2013","author":"mathieu","key":"ref18"},{"journal-title":"Optimization of CNNs on Tensor Core","year":"0","key":"ref19"},{"key":"ref4","article-title":"Learning to Optimize Tensor Programs","author":"chen","year":"2018","journal-title":"NIPS 18"},{"journal-title":"Automatic kernel generation for Volta tensor cores","year":"2020","author":"bhaskaracharya","key":"ref3"},{"key":"ref6","article-title":"MEC: Memory-Efficient Convolution for Deep Neural Network","author":"cho","year":"2017","journal-title":"ICML'17 Sydney NSW Australia"},{"journal-title":"TVM An automated end-to-end optimizing compiler for deep learning","year":"2018","author":"chen","key":"ref5"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1145\/3211346.3211354"},{"journal-title":"The indirect convolution algorithm","year":"2019","author":"dukhan","key":"ref7"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/MICRO.2016.7783725"},{"key":"ref1","first-page":"265","article-title":"TensorFlow: A System for Large-Scale Machine Learning","author":"abadi","year":"2016","journal-title":"OSDI '16"},{"journal-title":"Fireiron A scheduling language for high-performance linear algebra on gpus","year":"2020","author":"hagedorn","key":"ref9"},{"key":"ref20","article-title":"PyTorch: An Imperative Style, High-Performance Deep Learning Library","author":"paszke","year":"2019","journal-title":"Advances in Neural IInformation Processing Systems"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3378678.3391880"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1145\/2491956.2462176"}],"event":{"name":"2021 Design, Automation & Test in Europe Conference & Exhibition (DATE)","start":{"date-parts":[[2021,2,1]]},"location":"Grenoble, France","end":{"date-parts":[[2021,2,5]]}},"container-title":["2021 Design, Automation &amp; Test in Europe Conference &amp; Exhibition (DATE)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9473901\/9473226\/09473984.pdf?arnumber=9473984","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,1,28]],"date-time":"2022-01-28T23:37:44Z","timestamp":1643413064000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9473984\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2021,2,1]]},"references-count":22,"URL":"https:\/\/doi.org\/10.23919\/date51398.2021.9473984","relation":{},"subject":[],"published":{"date-parts":[[2021,2,1]]}}}