{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,1]],"date-time":"2026-07-01T16:29:34Z","timestamp":1782923374186,"version":"3.54.5"},"reference-count":51,"publisher":"Institute of Electrical and Electronics Engineers (IEEE)","issue":"6","license":[{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/ieeexplore.ieee.org\/Xplorehelp\/downloads\/license-information\/IEEE.html"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-029"},{"start":{"date-parts":[[2026,6,1]],"date-time":"2026-06-01T00:00:00Z","timestamp":1780272000000},"content-version":"stm-asf","delay-in-days":0,"URL":"https:\/\/doi.org\/10.15223\/policy-037"}],"funder":[{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62088102"],"award-info":[{"award-number":["62088102"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62302381"],"award-info":[{"award-number":["62302381"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["52441602"],"award-info":[{"award-number":["52441602"]}],"id":[{"id":"10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":["IEEE Trans. Circuits Syst. I"],"published-print":{"date-parts":[[2026,6]]},"DOI":"10.1109\/tcsi.2025.3638831","type":"journal-article","created":{"date-parts":[[2025,12,11]],"date-time":"2025-12-11T18:48:33Z","timestamp":1765478913000},"page":"4124-4137","source":"Crossref","is-referenced-by-count":1,"title":["FP2: A 2-bit Floating-Point Format for Edge-AI Inference and Fine-Tuning"],"prefix":"10.1109","volume":"73","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-0326-2999","authenticated-orcid":false,"given":"Qiwei","family":"Dang","sequence":"first","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Chengyu","family":"Ma","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Haiduo","family":"Huang","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7331-0830","authenticated-orcid":false,"given":"Gelin","family":"Fu","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-7761-2551","authenticated-orcid":false,"given":"Zhiwang","family":"Huo","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"given":"Guoming","family":"Yang","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3401-8239","authenticated-orcid":false,"given":"Pengchen","family":"Zong","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-2520-3731","authenticated-orcid":false,"given":"Tian","family":"Xia","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7001-2125","authenticated-orcid":false,"given":"Wenzhe","family":"Zhao","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1163-2014","authenticated-orcid":false,"given":"Pengju","family":"Ren","sequence":"additional","affiliation":[{"name":"National Key Laboratory of Human&#x2013;Machine Hybrid Augmented Intelligence, the National Engineering Research Center of Visual Information and Applications, and the Institute of Artificial Intelligence and Robotics, Xi&#x2019;an Jiaotong University, Xi&#x2019;an, Shaanxi, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"263","reference":[{"key":"ref1","doi-asserted-by":"publisher","DOI":"10.48550\/ARXIV.1706.03762"},{"key":"ref2","article-title":"An image is worth 16\u00d716 words: Transformers for image recognition at scale","author":"Dosovitskiy","year":"2020","journal-title":"arXiv:2010.11929"},{"key":"ref3","first-page":"1","article-title":"Arbitor: A numerically accurate hardware emulation tool for DNN accelerators","volume-title":"Proc. USENIX Annu. Tech. Conf.","author":"Jiang"},{"key":"ref4","doi-asserted-by":"publisher","DOI":"10.23919\/DATE.2017.7927224"},{"key":"ref5","doi-asserted-by":"publisher","DOI":"10.1145\/3079856.3080246"},{"key":"ref6","article-title":"FP8 formats for deep learning","author":"Micikevicius","year":"2022","journal-title":"arXiv:2209.05433"},{"key":"ref7","first-page":"14651","article-title":"FP8 quantization: The power of the exponent","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Kuzmin"},{"key":"ref8","first-page":"10271","article-title":"Pushing the limits of narrow precision inferencing at cloud scale with Microsoft floating point","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","volume":"33","author":"Rouhani"},{"key":"ref9","doi-asserted-by":"publisher","DOI":"10.1109\/HCS61935.2024.10665247"},{"key":"ref10","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.39"},{"key":"ref11","article-title":"FP8-LM: Training FP8 large language models","author":"Peng","year":"2023","journal-title":"arXiv:2310.18313"},{"key":"ref12","article-title":"LLaMA: Open and efficient foundation language models","author":"Touvron","year":"2023","journal-title":"arXiv:2302.13971"},{"key":"ref13","doi-asserted-by":"publisher","DOI":"10.1109\/JCC62314.2024.00017"},{"key":"ref14","doi-asserted-by":"publisher","DOI":"10.1109\/ICME57554.2024.10688089"},{"key":"ref15","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2023.3298882"},{"key":"ref16","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2023.3326329"},{"key":"ref17","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2024.3427681"},{"key":"ref18","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2024.3524307"},{"key":"ref19","doi-asserted-by":"publisher","DOI":"10.1109\/CICC63670.2025.10983180"},{"key":"ref20","doi-asserted-by":"publisher","DOI":"10.1109\/isscc42615.2023.10067837"},{"key":"ref21","doi-asserted-by":"publisher","DOI":"10.1109\/MDAT.2021.3120330"},{"key":"ref22","doi-asserted-by":"publisher","DOI":"10.1109\/isscc49657.2024.10454367"},{"key":"ref23","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2023.3338378"},{"issue":"1","key":"ref24","article-title":"BFloat16: The secret to high performance on cloud TPUs","volume":"4","author":"Wang","year":"2020","journal-title":"Google Cloud Blog"},{"key":"ref25","doi-asserted-by":"publisher","DOI":"10.1145\/3579371.3589351"},{"key":"ref26","doi-asserted-by":"publisher","DOI":"10.1109\/TCSI.2023.3300657"},{"key":"ref27","article-title":"Microscaling data formats for deep learning","author":"Darvish Rouhani","year":"2023","journal-title":"arXiv:2310.10537"},{"key":"ref28","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46493-0_32"},{"key":"ref29","article-title":"Ternary weight networks","author":"Li","year":"2016","journal-title":"arXiv:1605.04711"},{"key":"ref30","doi-asserted-by":"publisher","DOI":"10.23919\/DATE58400.2024.10546652"},{"key":"ref31","article-title":"Additive powers-of-two quantization: An efficient non-uniform discretization for neural networks","author":"Li","year":"2019","journal-title":"arXiv:1909.13144"},{"key":"ref32","article-title":"BitNet: Scaling 1-bit transformers for large language models","author":"Wang","year":"2023","journal-title":"arXiv:2310.11453"},{"key":"ref33","article-title":"The era of 1-bit LLMs: All large language models are in 1.58 bits","author":"Ma","year":"2024","journal-title":"arXiv:2402.17764"},{"issue":"6","key":"ref34","first-page":"84","article-title":"Learning multiple layers of features from tiny images","volume-title":"Commun. ACM","volume":"60","author":"Krizhevsky","year":"2009"},{"key":"ref35","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2009.5206848"},{"key":"ref36","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"ref37","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01167"},{"key":"ref38","article-title":"The Llama 3 herd of models","author":"Grattafiori","year":"2024","journal-title":"arXiv:2407.21783"},{"key":"ref39","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1472"},{"key":"ref40","first-page":"552","article-title":"The Winograd schema challenge","volume-title":"Proc. KR","author":"Levesque"},{"key":"ref41","doi-asserted-by":"publisher","DOI":"10.1145\/3474381"},{"key":"ref42","first-page":"3123","article-title":"BinaryConnect: Training deep neural networks with binary weights during propagations","volume-title":"Proc. Adv. Neural Inf. Process. Syst.","author":"Courbariaux"},{"key":"ref43","article-title":"Binarized neural networks: Training deep neural networks with weights and activations constrained to + or -","author":"Courbariaux","year":"2016","journal-title":"arXiv:1602.02830"},{"key":"ref44","article-title":"DoReFa-Net: Training low bitwidth convolutional neural networks with low bitwidth gradients","author":"Zhou","year":"2016","journal-title":"arXiv:1606.06160"},{"key":"ref45","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.emnlp-main.467"},{"key":"ref46","doi-asserted-by":"publisher","DOI":"10.1109\/TEC.1962.5219391"},{"key":"ref47","article-title":"Rethinking the value of network pruning","author":"Liu","year":"2018","journal-title":"arXiv:1810.05270"},{"key":"ref48","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20083-0_23"},{"key":"ref49","doi-asserted-by":"publisher","DOI":"10.1109\/IJCNN52387.2021.9534248"},{"key":"ref50","volume-title":"Zynq Dpu V3.2 Production Guide (PG338)","year":"2020"},{"key":"ref51","volume-title":"Designware Library-Datapath and Building Block IP, P-2019.03- DWBB 201903.0","year":"2019"}],"container-title":["IEEE Transactions on Circuits and Systems I: Regular Papers"],"original-title":[],"link":[{"URL":"http:\/\/xplorestaging.ieee.org\/ielx8\/8919\/11541279\/11297762.pdf?arnumber=11297762","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,6,2]],"date-time":"2026-06-02T20:10:09Z","timestamp":1780431009000},"score":1,"resource":{"primary":{"URL":"https:\/\/ieeexplore.ieee.org\/document\/11297762\/"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2026,6]]},"references-count":51,"journal-issue":{"issue":"6"},"URL":"https:\/\/doi.org\/10.1109\/tcsi.2025.3638831","relation":{},"ISSN":["1549-8328","1558-0806"],"issn-type":[{"value":"1549-8328","type":"print"},{"value":"1558-0806","type":"electronic"}],"subject":[],"published":{"date-parts":[[2026,6]]}}}