{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,6,12]],"date-time":"2026-06-12T01:03:32Z","timestamp":1781226212916,"version":"3.54.1"},"reference-count":28,"publisher":"IEEE","license":[{"start":{"date-parts":[[2022,5,23]],"date-time":"2022-05-23T00:00:00Z","timestamp":1653264000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2022,5,23]],"date-time":"2022-05-23T00:00:00Z","timestamp":1653264000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2022,5,23]]},"DOI":"10.1109\/icra46639.2022.9812320","type":"proceedings-article","created":{"date-parts":[[2022,7,12]],"date-time":"2022-07-12T19:36:40Z","timestamp":1657654600000},"page":"7492-7498","source":"Crossref","is-referenced-by-count":7,"title":["RAPID-RL: A Reconfigurable Architecture with Preemptive-Exits for Efficient Deep-Reinforcement Learning"],"prefix":"10.1109","author":[{"given":"Adarsh Kumar","family":"Kosta","sequence":"first","affiliation":[{"name":"Purdue University,West Lafayette,IN,USA,47907"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Malik Aqeel","family":"Anwar","sequence":"additional","affiliation":[{"name":"Georgia Institute of Technology,Atlanta,GA,USA,30332"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Priyadarshini","family":"Panda","sequence":"additional","affiliation":[{"name":"Yale University,New Haven,CT,USA,06520"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Arijit","family":"Raychowdhury","sequence":"additional","affiliation":[{"name":"Georgia Institute of Technology,Atlanta,GA,USA,30332"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Kaushik","family":"Roy","sequence":"additional","affiliation":[{"name":"Purdue University,West Lafayette,IN,USA,47907"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2020.2971172"},{"key":"ref11","doi-asserted-by":"crossref","first-page":"279","DOI":"10.1007\/BF00992698","article-title":"Q-learning","volume":"8","author":"watkins","year":"1992","journal-title":"Machine Learning"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1090\/S0002-9904-1954-09848-8"},{"key":"ref13","author":"hessel","year":"2017","journal-title":"Rainbow Combining Improvements in Deep Reinforcement Learning"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v30i1.10295"},{"key":"ref15","article-title":"Dueling network architectures for deep reinforcement learning","author":"wang","year":"2015","journal-title":"ArXiv Preprint"},{"key":"ref16","article-title":"Prioritized experi-ence replay","author":"schaul","year":"2016","journal-title":"4th International Conference on Learning Representations ICLR 2016"},{"key":"ref17","author":"sutton","year":"2018","journal-title":"Reinforcement Learning An Introduction"},{"key":"ref18","author":"bellemare","year":"2017","journal-title":"A distributional per-spective on reinforcement learning"},{"key":"ref19","article-title":"Noisy networks for exploration","author":"fortunato","year":"2018","journal-title":"Proceedings of the International Conference on Representation Learning (ICLR 2018)"},{"key":"ref28","article-title":"Airsim: High-fidelity visual and physical simulation for autonomous vehicles","author":"shah","year":"2017","journal-title":"Field and Service Robotics"},{"key":"ref4","doi-asserted-by":"crossref","first-page":"354","DOI":"10.1038\/nature24270","article-title":"Mastering the game of go without human knowledge","volume":"550","author":"silver","year":"2017","journal-title":"Nature"},{"key":"ref27","year":"0","journal-title":"Unreal engine 4 22 1"},{"key":"ref3","article-title":"Playing atari with deep reinforcement learning","author":"mnih","year":"2013","journal-title":"ArXiv Preprint"},{"key":"ref6","article-title":"Deep compression: Compressing deep neural networks with pruning, trained quantization and huffman coding","author":"han","year":"2015","journal-title":"ArXiv Preprint"},{"key":"ref5","first-page":"1135","article-title":"Learning both weights and connections for efficient neural network","author":"han","year":"2015","journal-title":"Advances in neural information processing systems"},{"key":"ref8","article-title":"Under-standing neural networks through deep visualization","author":"yosinski","year":"2015","journal-title":"ArXiv Preprint"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2017.2761740"},{"key":"ref2","first-page":"1889","article-title":"Trust region policy optimization","volume":"37","author":"schulman","year":"0","journal-title":"Proceedings of The 32nd International Conference on Machine Learning"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.3850\/9783981537079_0819"},{"key":"ref1","doi-asserted-by":"crossref","first-page":"529","DOI":"10.1038\/nature14236","article-title":"Human-level control through deep reinforcement learning","volume":"518","author":"mnih","year":"2015","journal-title":"Nature"},{"key":"ref20","article-title":"Binarized neural networks: Training deep neural networks with weights and activations constrained to+ 1or-1","author":"courbariaux","year":"2016","journal-title":"ArXiv Preprint"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1145\/3007192"},{"key":"ref21","first-page":"525","article-title":"Xnor-net: Imagenet classification using binary convolutional neural networks","author":"rastegari","year":"2016","journal-title":"European Conference on Computer Vision"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS.2017.226"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2016.7900006"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/JETCAS.2019.2932285"},{"key":"ref25","article-title":"The arcade learning environment: An evaluation platform for general agents (extended abstract)","author":"bellemare","year":"2015","journal-title":"IJCAI"}],"event":{"name":"2022 IEEE International Conference on Robotics and Automation (ICRA)","location":"Philadelphia, PA, USA","start":{"date-parts":[[2022,5,23]]},"end":{"date-parts":[[2022,5,27]]}},"container-title":["2022 International Conference on Robotics and Automation (ICRA)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx7\/9811522\/9811357\/09812320.pdf?arnumber=9812320","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2022,11,3]],"date-time":"2022-11-03T23:06:32Z","timestamp":1667516792000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/9812320\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2022,5,23]]},"references-count":28,"URL":"https:\/\/doi.org\/10.1109\/icra46639.2022.9812320","relation":{},"subject":[],"published":{"date-parts":[[2022,5,23]]}}}