{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2024,9,8]],"date-time":"2024-09-08T11:22:01Z","timestamp":1725794521223},"reference-count":35,"publisher":"IEEE","license":[{"start":{"date-parts":[[2023,6,4]],"date-time":"2023-06-04T00:00:00Z","timestamp":1685836800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2023,6,4]],"date-time":"2023-06-04T00:00:00Z","timestamp":1685836800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023,6,4]]},"DOI":"10.1109\/iv55152.2023.10186809","type":"proceedings-article","created":{"date-parts":[[2023,7,27]],"date-time":"2023-07-27T17:20:05Z","timestamp":1690478405000},"page":"1-8","source":"Crossref","is-referenced-by-count":1,"title":["Augmenting Legacy Networks for Flexible Inference"],"prefix":"10.1109","author":[{"given":"Jason","family":"Clemons","sequence":"first","affiliation":[{"name":"NVIDIA"}]},{"given":"Iuri","family":"Frosio","sequence":"additional","affiliation":[{"name":"NVIDIA"}]},{"given":"Maying","family":"Shen","sequence":"additional","affiliation":[{"name":"NVIDIA"}]},{"given":"Jose M.","family":"Alvarez","sequence":"additional","affiliation":[{"name":"NVIDIA"}]},{"given":"Stephen W.","family":"Keckler","sequence":"additional","affiliation":[{"name":"NVIDIA"}]}],"member":"263","reference":[{"key":"ref13","article-title":"Accelerate cnns from three dimensions: A comprehensive pruning framework","author":"wang","year":"2021","journal-title":"ICML"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01166"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.01152"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00293"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1007\/s11263-019-01190-4"},{"key":"ref14","article-title":"Outrageously large neural networks: The sparsely-gated mixture-of-experts layer","author":"shazeer","year":"2017","journal-title":"ICLRE"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.155"},{"key":"ref33","article-title":"PyTorch: An Imperative Style, High-Performance Deep Learning Library","author":"paszke","year":"2019","journal-title":"NeurIPS"},{"key":"ref10","article-title":"Learning the number of neurons in deep networks","author":"alvarez","year":"2016","journal-title":"NeurIPS"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref2","article-title":"Once for all: Train one network and specialize it for efficient deployment","author":"cai","year":"2020","journal-title":"ICLRE"},{"key":"ref1","article-title":"Slimmable neural networks","author":"yu","year":"2019","journal-title":"ICLRE"},{"key":"ref17","article-title":"Multi-scale dense networks for resource efficient image classification","author":"huang","year":"2018","journal-title":"ICLRE"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01261-8_25"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33013812"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2016.7900006"},{"key":"ref24","article-title":"Network slimming by slimmable networks: Towards one-shot architecture search for channel numbers","author":"yu","year":"2019","journal-title":"CoRR"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58536-5_38"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01249-6_18"},{"key":"ref25","article-title":"Structural pruning via latency-saliency knapsack","author":"shen","year":"2022","journal-title":"Advances in neural information processing systems"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR42600.2020.01318"},{"key":"ref22","article-title":"Snip: Single-shot network pruning based on connection sensitivity","author":"lee","year":"2018","journal-title":"CoRR"},{"key":"ref21","article-title":"Trained ternary quantization","author":"zhu","year":"2017","journal-title":"ICLRE"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01068"},{"key":"ref27","article-title":"Bert loses patience: Fast and robust inference with early exit","author":"zhou","year":"2020","journal-title":"NeurIPS"},{"key":"ref29","article-title":"Dynamic neural networks: A survey","author":"han","year":"2021","journal-title":"IEEE Trans PAMI"},{"key":"ref8","article-title":"Residual connections encourage iterative inference","author":"jastrzebski","year":"2018","journal-title":"ICLRE"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_39"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.207"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/JSTSP.2020.2979669"},{"year":"0","key":"ref3","article-title":"NVIDIA DRIVE"},{"key":"ref6","article-title":"Identity mappings in deep residual networks","author":"he","year":"2016","journal-title":"ECCV"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01352"}],"event":{"name":"2023 IEEE Intelligent Vehicles Symposium (IV)","start":{"date-parts":[[2023,6,4]]},"location":"Anchorage, AK, USA","end":{"date-parts":[[2023,6,7]]}},"container-title":["2023 IEEE Intelligent Vehicles Symposium (IV)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/10186382\/10186383\/10186809.pdf?arnumber=10186809","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2023,8,14]],"date-time":"2023-08-14T17:36:30Z","timestamp":1692034590000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/10186809\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,6,4]]},"references-count":35,"URL":"https:\/\/doi.org\/10.1109\/iv55152.2023.10186809","relation":{},"subject":[],"published":{"date-parts":[[2023,6,4]]}}}