{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,13]],"date-time":"2026-01-13T05:20:20Z","timestamp":1768281620279,"version":"3.49.0"},"reference-count":85,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","license":[{"start":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T00:00:00Z","timestamp":1767225600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by\/4.0\/legalcode"}],"funder":[{"DOI":"10.13039\/501100003662","name":"Korea Planning and Evaluation Institute of Industrial Technology (KEIT) Grant funded by Korean Government (MOTIE)","doi-asserted-by":"publisher","award":["RS-2024-00432265"],"award-info":[{"award-number":["RS-2024-00432265"]}],"id":[{"id":"10.13039\/501100003662","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Access"],"published-print":{"date-parts":[[2026]]},"DOI":"10.1109\/access.2025.3650071","type":"journal-article","created":{"date-parts":[[2026,1,1]],"date-time":"2026-01-01T18:38:09Z","timestamp":1767292689000},"page":"3040-3061","source":"Crossref","is-referenced-by-count":0,"title":["CB-DistillGrad: Class-Balanced Distillation and Gradient Conflict Resolution for Low Power Edge AI Applications"],"prefix":"10.1109","volume":"14","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-1153-9305","authenticated-orcid":false,"given":"Sai","family":"Manohar Vemuri","sequence":"first","affiliation":[{"name":"Department of Electrical and Computer Engineering, Illinois Institute of Technology, Chicago, IL, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-6144-9900","authenticated-orcid":false,"given":"Achyuth","family":"Gundrapally","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Illinois Institute of Technology, Chicago, IL, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5225-5580","authenticated-orcid":false,"given":"Zhengyu","family":"Xia","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Illinois Institute of Technology, Chicago, IL, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8833-0319","authenticated-orcid":false,"given":"Joohee","family":"Kim","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Illinois Institute of Technology, Chicago, IL, USA"}]},{"given":"Kyuwon","family":"Ken Choi","sequence":"additional","affiliation":[{"name":"Department of Electrical and Computer Engineering, Illinois Institute of Technology, Chicago, IL, USA"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.5244\/C.30.87"},{"key":"ref2","article-title":"Deep residual learning for image recognition","author":"He","year":"2015","journal-title":"arXiv:1512.03385"},{"key":"ref3","article-title":"Very deep convolutional networks for large-scale image recognition","author":"Simonyan","year":"2014","journal-title":"arXiv:1409.1556"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.1145\/3065386"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1109\/iccv.2015.169"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/jproc.2022.3226481"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.1016\/j.eswa.2021.114602"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1109\/tpami.2023.3290594"},{"key":"ref9","article-title":"EfficientNet: Rethinking model scaling for convolutional neural networks","author":"Tan","year":"2019","journal-title":"arXiv:1905.11946"},{"key":"ref10","article-title":"MobileNets: Efficient convolutional neural networks for mobile vision applications","author":"Howard","year":"2017","journal-title":"arXiv:1704.04861"},{"key":"ref11","first-page":"1135","article-title":"Learning both weights and connections for efficient neural networks","volume-title":"Proc. NeurIPS","volume":"28","author":"Han"},{"key":"ref12","article-title":"Quantization and training of neural networks for efficient integer-arithmetic-only inference","author":"Jacob","year":"2017","journal-title":"arXiv:1712.05877"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1145\/3007787.3001163"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.48550\/arXiv.1503.02531"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/icpr48806.2021.9413016"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1145\/1150402.1150464"},{"key":"ref17","article-title":"FitNets: Hints for thin deep nets","author":"Romero","year":"2014","journal-title":"arXiv:1412.6550"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1145\/2847263.2847265"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1016\/j.sysarc.2018.12.008"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1145\/3174243.3174959"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/tcsii.2018.2865896"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/FPL.2016.7577308"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1145\/2749469.2750389"},{"key":"ref24","doi-asserted-by":"publisher","DOI":"10.1109\/isca.2016.40"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/micro.2014.58"},{"key":"ref26","article-title":"EfficientNetV2: Smaller models and faster training","volume-title":"Proc. ICML","author":"Tan"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2018.00745"},{"key":"ref28","article-title":"Transferring knowledge to smaller network with class-distance loss","volume-title":"Proc. Int. Conf. Learn. Represent.","author":"Kim"},{"key":"ref29","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.1145\/3065386"},{"key":"ref31","article-title":"Language models are few-shot learners","author":"Brown","year":"2020","journal-title":"arXiv:2005.14165"},{"key":"ref32","article-title":"PaLM: Scaling language modeling with pathways","author":"Chowdhery","year":"2022","journal-title":"arXiv:2204.02311"},{"key":"ref33","article-title":"Gemini: A family of highly capable multimodal models","author":"Team","year":"2023","journal-title":"arXiv:2312.11805"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.3390\/philosophies7010004"},{"key":"ref35","article-title":"The rising costs of training frontier AI models","author":"Cottier","year":"2024","journal-title":"arXiv:2405.21015"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.3390\/math13111878"},{"key":"ref37","article-title":"Cognitive edge computing: A comprehensive survey on optimizing large models and AI agents for pervasive deployment","author":"Wang","year":"2025","journal-title":"arXiv:2501.03265"},{"key":"ref38","article-title":"MnasNet: Platform-aware neural architecture search for mobile","author":"Tan","year":"2018","journal-title":"arXiv:1807.11626"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/cvpr.2018.00716"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01264-9_8"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1602.07360"},{"key":"ref42","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW.2018.00215"},{"key":"ref43","article-title":"EfficientDet: Scalable and efficient object detection","author":"Tan","year":"2019","journal-title":"arXiv:1911.09070"},{"key":"ref44","article-title":"Rethinking bottleneck structure for efficient mobile network design","author":"Daquan","year":"2020","journal-title":"arXiv:2007.02269"},{"key":"ref45","article-title":"Can CNNs be more robust than transformers?","author":"Wang","year":"2022","journal-title":"arXiv:2206.03452"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.3390\/sym14122524"},{"key":"ref47","doi-asserted-by":"publisher","DOI":"10.1109\/icc42927.2021.9500744"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1109\/IGSC51522.2020.9290868"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i04.5963"},{"key":"ref50","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-emnlp.385"},{"key":"ref51","doi-asserted-by":"publisher","DOI":"10.1109\/iccv.2019.00489"},{"key":"ref52","article-title":"Simple yet effective semi-supervised knowledge distillation from vision-language models via dual-head optimization","author":"Kang","year":"2025","journal-title":"arXiv:2505.07675"},{"key":"ref53","article-title":"Synthetic adaptive guided embeddings (SAGE): A novel knowledge distillation method","author":"Olcay Polat","year":"2025","journal-title":"arXiv:2508.14783"},{"key":"ref54","article-title":"Biased teacher, balanced student","author":"Kim","year":"2025","journal-title":"arXiv:2506.18496"},{"key":"ref55","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v39i21.34400"},{"key":"ref56","article-title":"Paying more attention to attention: Improving the performance of convolutional neural networks via attention transfer","author":"Zagoruyko","year":"2017","journal-title":"arXiv:1612.03928"},{"key":"ref57","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00409"},{"key":"ref58","article-title":"Born again neural networks","author":"Furlanello","year":"2018","journal-title":"arXiv:1805.04770"},{"key":"ref59","article-title":"Balanced knowledge distillation for long-tailed learning","author":"Zhang","year":"2021","journal-title":"arXiv:2104.10510"},{"key":"ref60","article-title":"Like what you like: Knowledge distill via neuron selectivity transfer","volume-title":"Proc. ICCV","author":"Huang"},{"key":"ref61","article-title":"Contrastive representation distillation","volume-title":"Proc. ICLR","author":"Tian"},{"key":"ref62","article-title":"EA-KD: Entropy-based adaptive knowledge distillation","author":"Su","year":"2023","journal-title":"arXiv:2311.13621"},{"key":"ref63","article-title":"Learn from balance: Rectifying knowledge transfer for long-tailed scenarios","author":"Huang","year":"2024","journal-title":"arXiv:2409.07694"},{"key":"ref64","article-title":"QKD: Quantization-aware knowledge distillation","author":"Kim","year":"2019","journal-title":"arXiv:1911.12491"},{"key":"ref65","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-96-0972-7_24"},{"key":"ref66","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2019.00949"},{"key":"ref67","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.324"},{"key":"ref68","article-title":"Searching for activation functions","volume-title":"Proc. ICLR","author":"Ramachandran"},{"key":"ref69","article-title":"MobileNetV3: Searching for mobile networks","volume-title":"Proc. ICCV","author":"Sandler"},{"key":"ref70","article-title":"Tailored temperature scaling for knowledge distillation in long-tailed recognition","volume-title":"Proc. AAAI","author":"Chen"},{"key":"ref71","first-page":"2335","article-title":"Dynamic temperature knowledge distillation","volume-title":"Proc. 31st Int. Joint Conf. Artif. Intell. (IJCAI)","author":"Wei"},{"key":"ref72","doi-asserted-by":"publisher","DOI":"10.1109\/tits.2023.3264588"},{"key":"ref73","volume-title":"Learning multiple layers of features from tiny images","author":"Krizhevsky","year":"2009"},{"key":"ref74","volume-title":"Tensil: Open Source Machine Learning Accelerators","year":"2022"},{"key":"ref75","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00497"},{"key":"ref76","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01165"},{"key":"ref77","article-title":"Gradient surgery for multi-task learning","author":"Yu","year":"2020","journal-title":"arXiv:2001.06782"},{"key":"ref78","article-title":"Xception: Deep learning with depthwise separable convolutions","author":"Chollet","year":"2016","journal-title":"arXiv:1610.02357"},{"key":"ref79","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00474"},{"key":"ref80","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2025.3635121"},{"key":"ref81","doi-asserted-by":"publisher","DOI":"10.1109\/tai.2024.3394797"},{"key":"ref82","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19803-8_5"},{"key":"ref83","article-title":"MobileViT: Light-weight, general-purpose, and mobile-friendly vision transformer","author":"Mehta","year":"2021","journal-title":"arXiv:2110.02178"},{"key":"ref84","doi-asserted-by":"publisher","DOI":"10.1109\/cyber59472.2023.10256482"},{"key":"ref85","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"}],"container-title":["IEEE Access"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/6287639\/11323511\/11321299.pdf?arnumber=11321299","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,12]],"date-time":"2026-01-12T22:02:49Z","timestamp":1768255369000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11321299\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026]]},"references-count":85,"URL":"https:\/\/doi.org\/10.1109\/access.2025.3650071","relation":{},"ISSN":["2169-3536"],"issn-type":[{"value":"2169-3536","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026]]}}}