{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,3,28]],"date-time":"2026-03-28T17:08:30Z","timestamp":1774717710303,"version":"3.50.1"},"reference-count":44,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T00:00:00Z","timestamp":1747008000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,5,12]],"date-time":"2025-05-12T00:00:00Z","timestamp":1747008000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/100000001","name":"National Science Foundation (NSF)","doi-asserted-by":"publisher","award":["CNS-1943338"],"award-info":[{"award-number":["CNS-1943338"]}],"id":[{"id":"10.13039\/100000001","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,5,12]]},"DOI":"10.1109\/noms57970.2025.11073623","type":"proceedings-article","created":{"date-parts":[[2025,7,15]],"date-time":"2025-07-15T17:40:26Z","timestamp":1752601226000},"page":"1-9","source":"Crossref","is-referenced-by-count":9,"title":["Infer-EDGE: Dynamic DNN Inference Optimization in Just-in-Time Edge-AI Implementations"],"prefix":"10.1109","author":[{"given":"Motahare","family":"Mounesan","sequence":"first","affiliation":[{"name":"City University of New York,USA"}]},{"given":"Xiaojie","family":"Zhang","sequence":"additional","affiliation":[{"name":"Hunan First Normal University,China"}]},{"given":"Saptarshi","family":"Debroy","sequence":"additional","affiliation":[{"name":"City University of New York,USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.1109\/JPROC.2022.3226481"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.1109\/ICPR.2016.7900006"},{"key":"ref3","doi-asserted-by":"publisher","DOI":"10.1109\/MM.2020.3012391"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1109\/ICC40277.2020.9149012"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3093337.3037698"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1145\/3527155"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.23919\/CNSM62983.2024.10814523"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2020.2981338"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/WoWMoM57956.2023.00015"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.1145\/3583740.3626616"},{"issue":"4","key":"ref11","doi-asserted-by":"crossref","DOI":"10.3390\/jlpea12040057","article-title":"Ocelli: Efficient processing-in-pixel array enabling edge inference of ternary neural networks","volume":"12","author":"Tabrizchi","year":"2022","journal-title":"Journal of Low Power Electronics and Applications"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2946140"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3589639"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/WoWMoM54355.2022.00032"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1145\/3093337.3037698"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TWC.2019.2946140"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1145\/3372224.3419194"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2018.2858384"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.23919\/DATE.2017.7927211"},{"key":"ref20","article-title":"Neural architecture search with reinforcement learning","author":"Zoph","year":"2016","journal-title":"arXiv preprint"},{"key":"ref21","article-title":"A survey on deep neural network compression: Challenges, overview, and solutions","author":"Mishra","year":"2020","journal-title":"arXiv preprint"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/JIOT.2023.3243266"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1002\/ett.4485"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2021.3068255"},{"key":"ref25","doi-asserted-by":"crossref","DOI":"10.1109\/CCGrid59990.2024.00045","article-title":"Scheduling with Fully Compressible Tasks: Application to Deep Learning Inference with Neural Network Compression","volume-title":"CCGRID 2024 \u2013 24th IEEE\/ACM international Symposium on Cluster, Cloud and Internet Computing","author":"da Silva Barros"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/ISCC50000.2020.9219647"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/ICDCS57875.2023.00009"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2021.3068255"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1002\/ett.4485"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1109\/WoWMoM57956.2023.00034"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.1109\/ICFEC61590.2024.00016"},{"key":"ref32","doi-asserted-by":"publisher","DOI":"10.1109\/IC2E61754.2024.00024"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/WCNC57260.2024.10571207"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1109\/TII.2020.3017573"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/TCOMM.2022.3229033"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.3389\/fnins.2019.00095"},{"key":"ref37","article-title":"Resnet in resnet: Generalizing residual architectures","author":"Targ","year":"2016","journal-title":"arXiv preprint"},{"key":"ref38","article-title":"Densenet: Implementing efficient convnet descriptor pyramids","author":"Iandola","year":"2014","journal-title":"arXiv preprint"},{"key":"ref39","volume-title":"Infer-edge","author":"Mounesan"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1038\/s41467-017-02411-5"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1109\/CCGrid51090.2021.00059"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/SEC62691.2024.00047"},{"key":"ref43","article-title":"Actor-critic algorithms","volume":"12","author":"Konda","year":"1999","journal-title":"Advances in neural information processing systems"},{"key":"ref44","first-page":"1928","article-title":"Asynchronous methods for deep reinforcement learning","volume-title":"International conference on machine learning","author":"Mnih","year":"2016"}],"event":{"name":"NOMS 2025-2025 IEEE Network Operations and Management Symposium","location":"Honolulu, HI, USA","start":{"date-parts":[[2025,5,12]]},"end":{"date-parts":[[2025,5,16]]}},"container-title":["NOMS 2025-2025 IEEE Network Operations and Management Symposium"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11073532\/11073571\/11073623.pdf?arnumber=11073623","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,7,16]],"date-time":"2025-07-16T05:34:20Z","timestamp":1752644060000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11073623\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,5,12]]},"references-count":44,"URL":"https:\/\/doi.org\/10.1109\/noms57970.2025.11073623","relation":{},"subject":[],"published":{"date-parts":[[2025,5,12]]}}}