{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T18:44:26Z","timestamp":1763750666868,"version":"3.45.0"},"reference-count":46,"publisher":"IEEE","license":[{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2025,10,26]],"date-time":"2025-10-26T00:00:00Z","timestamp":1761436800000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,26]]},"DOI":"10.1109\/iccad66269.2025.11240988","type":"proceedings-article","created":{"date-parts":[[2025,11,20]],"date-time":"2025-11-20T18:39:34Z","timestamp":1763663974000},"page":"1-9","source":"Crossref","is-referenced-by-count":0,"title":["Perturbation-efficient Zeroth-order Optimization for Hardware-friendly On-device Training"],"prefix":"10.1109","author":[{"given":"Qitao","family":"Tan","sequence":"first","affiliation":[{"name":"University of Georgia"}]},{"given":"Sung-En","family":"Chang","sequence":"additional","affiliation":[{"name":"Northeastern University"}]},{"given":"Rui","family":"Xia","sequence":"additional","affiliation":[{"name":"University of Pennsylvania"}]},{"given":"Huidong","family":"Ji","sequence":"additional","affiliation":[{"name":"Fudan University"}]},{"given":"Chence","family":"Yang","sequence":"additional","affiliation":[{"name":"University of Georgia"}]},{"given":"Ci","family":"Zhang","sequence":"additional","affiliation":[{"name":"University of Georgia"}]},{"given":"Jun","family":"Liu","sequence":"additional","affiliation":[{"name":"Northeastern University"}]},{"given":"Zheng","family":"Zhan","sequence":"additional","affiliation":[{"name":"Northeastern University"}]},{"given":"Zhenman","family":"Fang","sequence":"additional","affiliation":[{"name":"Simon Fraser University"}]},{"given":"Zhuo","family":"Zou","sequence":"additional","affiliation":[{"name":"Fudan University"}]},{"given":"Yanzhi","family":"Wang","sequence":"additional","affiliation":[{"name":"Northeastern University"}]},{"given":"Jin","family":"Lu","sequence":"additional","affiliation":[{"name":"University of Georgia"}]},{"given":"Geng","family":"Yuan","sequence":"additional","affiliation":[{"name":"University of Georgia"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-long.568"},{"key":"ref2","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-emnlp.563"},{"key":"ref3","article-title":"The second pascal recognising textual entailment challenge","volume-title":"Proceedings of the second PASCAL challenges workshop on recognising textual entailment","volume":"1","author":"Bar-Haim"},{"article-title":"The Fifth PASCAL Recognizing Textual Entailment Challenge","volume-title":"TAC","author":"Bentivogli","key":"ref4"},{"article-title":"BoolQ: Exploring the surprising difficulty of natural yes\/no questions","year":"2019","author":"Clark","key":"ref5"},{"key":"ref6","doi-asserted-by":"publisher","DOI":"10.1109\/ReConFig.2009.11"},{"key":"ref7","doi-asserted-by":"publisher","DOI":"10.23919\/DATE58400.2024.10546516"},{"key":"ref8","doi-asserted-by":"publisher","DOI":"10.1007\/11736790_9"},{"key":"ref9","first-page":"30318","article-title":"Gpt3. int8 (): 8-bit matrix multiplication for transformers at scale","volume":"35","author":"Dettmers","year":"2022","journal-title":"Advances in neural information processing systems"},{"article-title":"Model agnostic contrastive explanations for structured data","year":"2019","author":"Dhurandhar","key":"ref10"},{"key":"ref11","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.01127"},{"key":"ref12","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2021.acl-long.295"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.3115\/1654536.1654538"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v35i9.16928"},{"article-title":"Lora: Low-rank adaptation of large language models","year":"2021","author":"Hu","key":"ref15"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/SOCC.2017.8226056"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TC.2006.81"},{"article-title":"The winograd schema challenge","volume-title":"Thirteenth international conference on the principles of knowledge representation and reasoning","author":"Levesque","key":"ref18"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/tits.2024.3457815"},{"key":"ref20","article-title":"Zeroth-order stochastic variance reduction for nonconvex optimization","volume":"31","author":"Liu","year":"2018","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref21","article-title":"RoBERTa: A Robustly Optimized BERT Pretraining Approach","volume-title":"CoRR","author":"Liu","year":"2019"},{"article-title":"Sparse mezo: Less parameters for better performance in zeroth-order llm fine-tuning","year":"2024","author":"Liu","key":"ref22"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TCAD.2019.2897634"},{"key":"ref24","article-title":"Fine-tuning language models with just forward passes","author":"Malladi","year":"2023","journal-title":"Nerips"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN.2017.7966324"},{"article-title":"WiC: the word-in-context dataset for evaluating context-sensitive meaning representations","year":"2018","author":"Pilehvar","key":"ref26"},{"key":"ref27","doi-asserted-by":"publisher","DOI":"10.1109\/dac18072.2020.9218652"},{"article-title":"Choice of plausible alternatives: An evaluation of commonsense causal reasoning","volume-title":"2011 AAAI spring symposium series","author":"Roemmele","key":"ref28"},{"key":"ref29","article-title":"Learning to Guide Random Search","volume-title":"CoRR","author":"Sener","year":"2020"},{"key":"ref30","article-title":"An optimal algorithm for bandit and zero-order convex optimization with two-point feedback","author":"Shamir","year":"2017","journal-title":"Journal of Machine Learning Research"},{"key":"ref31","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/D13-1170"},{"article-title":"Harmony in Divergence: Towards Fast, Accurate, and Memory-efficient Zeroth-order LLM Fine-tuning","year":"2025","author":"Tan","key":"ref32"},{"key":"ref33","doi-asserted-by":"publisher","DOI":"10.1109\/FCCM.2014.47"},{"key":"ref34","doi-asserted-by":"publisher","DOI":"10.1145\/2629607"},{"article-title":"Certified Zeroth-order Black-Box Defense with Robust UNet Denoiser","year":"2023","author":"Verma","key":"ref35"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1145\/345508.345577"},{"key":"ref37","first-page":"12868","article-title":"Zarts: On zero-order optimization for neural architecture search","volume":"35","author":"Wang","year":"2022","journal-title":"Advances in Neural Information Processing Systems"},{"key":"ref38","doi-asserted-by":"publisher","DOI":"10.2307\/2331939"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.1109\/bigdata50022.2020.9378171"},{"key":"ref40","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-19775-8_3"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/3626202.3637562"},{"article-title":"Opt: Open pre-trained transformer language models","year":"2022","author":"Zhang","key":"ref42"},{"article-title":"Revisiting zeroth-order optimization for memory-efficient llm fine-tuning: A benchmark","year":"2024","author":"Zhang","key":"ref43"},{"article-title":"Dynamic sparse no training: Training-free fine-tuning for sparse llms","year":"2023","author":"Zhang","key":"ref44"},{"article-title":"Second-order fine-tuning without pain for llms: A hessian informed zeroth-order optimizer","year":"2024","author":"Zhao","key":"ref45"},{"key":"ref46","first-page":"233","article-title":"ROLLER: Fast and Efficient Tensor Compilation for Deep Learning","volume-title":"16th USENIX Symposium on Operating Systems Design and Implementation (OSDI 22)","author":"Zhu"}],"event":{"name":"2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)","start":{"date-parts":[[2025,10,26]]},"location":"Munich, Germany","end":{"date-parts":[[2025,10,30]]}},"container-title":["2025 IEEE\/ACM International Conference On Computer Aided Design (ICCAD)"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/11240608\/11240621\/11240988.pdf?arnumber=11240988","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,11,21]],"date-time":"2025-11-21T18:39:39Z","timestamp":1763750379000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11240988\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,26]]},"references-count":46,"URL":"https:\/\/doi.org\/10.1109\/iccad66269.2025.11240988","relation":{},"subject":[],"published":{"date-parts":[[2025,10,26]]}}}