{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,27]],"date-time":"2025-03-27T08:33:24Z","timestamp":1743064404184,"version":"3.40.3"},"publisher-location":"Cham","reference-count":32,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031250811"},{"type":"electronic","value":"9783031250828"}],"license":[{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2023,1,1]],"date-time":"2023-01-01T00:00:00Z","timestamp":1672531200000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2023]]},"DOI":"10.1007\/978-3-031-25082-8_8","type":"book-chapter","created":{"date-parts":[[2023,2,11]],"date-time":"2023-02-11T09:12:42Z","timestamp":1676106762000},"page":"115-129","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":4,"title":["QFT: Post-training Quantization via\u00a0Fast Joint Finetuning of\u00a0All Degrees of\u00a0Freedom"],"prefix":"10.1007","author":[{"given":"Alex","family":"Finkelstein","sequence":"first","affiliation":[]},{"given":"Ella","family":"Fuchs","sequence":"additional","affiliation":[]},{"given":"Idan","family":"Tal","sequence":"additional","affiliation":[]},{"given":"Mark","family":"Grobman","sequence":"additional","affiliation":[]},{"given":"Niv","family":"Vosco","sequence":"additional","affiliation":[]},{"given":"Eldad","family":"Meller","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2023,2,12]]},"reference":[{"key":"8_CR1","doi-asserted-by":"crossref","unstructured":"Jacob, B., et al.: Quantization and training of neural networks for efficient integer-arithmetic-only inference. CoRR abs\/1712.05877 (2017)","DOI":"10.1109\/CVPR.2018.00286"},{"key":"8_CR2","unstructured":"Krishnamoorthi, R.: Quantizing deep convolutional networks for efficient inference: a whitepaper. CoRR abs\/1806.08342 (2018)"},{"key":"8_CR3","unstructured":"Nagel, M., Fournarakis, M., Amjad, R.A., Bondarenko, Y., van Baalen, M., Blankevoort, T.: A white paper on neural network quantization. CoRR abs\/2106.08295 (2021)"},{"key":"8_CR4","unstructured":"Wu, H., Judd, P., Zhang, X., Isaev, M., Micikevicius, P.: Integer quantization for deep learning inference: principles and empirical evaluation. CoRR abs\/2004.09602 (2020)"},{"key":"8_CR5","doi-asserted-by":"crossref","unstructured":"Kozlov, A., Lazarevich, I., Shamporov, V., Lyalyushkin, N., Gorbachev, Y.: Neural network compression framework for fast model inference. CoRR abs\/2002.08679 (2020)","DOI":"10.1007\/978-3-030-80129-8_17"},{"key":"8_CR6","doi-asserted-by":"crossref","unstructured":"Gholami, A., Kim, S., Dong, Z., Yao, Z., Mahoney, M.W., Keutzer, K.: A survey of quantization methods for efficient neural network inference. CoRR abs\/2103.13630 (2021)","DOI":"10.1201\/9781003162810-13"},{"key":"8_CR7","unstructured":"Meller, E., Finkelstein, A., Almog, U., Grobman, M.: Same, same but different - recovering neural network quantization error through weight factorization. CoRR abs\/1902.01917 (2019)"},{"key":"8_CR8","doi-asserted-by":"crossref","unstructured":"Nagel, M., van Baalen, M., Blankevoort, T., Welling, M.: Data-free quantization through weight equalization and bias correction. In: 2019 IEEE\/CVF International Conference on Computer Vision, ICCV 2019, pp. 1325\u20131334. Seoul, Korea (South), 27 October - 2 November 2019. IEEE (2019)","DOI":"10.1109\/ICCV.2019.00141"},{"key":"8_CR9","unstructured":"Li, Y., et al.: MQBench: towards reproducible and deployable model quantization benchmark. In: Vanschoren, J., Yeung, S., (eds.): Proceedings of the Neural Information Processing Systems Track on Datasets and Benchmarks, vol. 1 (2021)"},{"key":"8_CR10","unstructured":"Bengio, Y., L\u00e9onard, N., Courville, A.C.: Estimating or propagating gradients through stochastic neurons for conditional computation. CoRR abs\/1308.3432 (2013)"},{"key":"8_CR11","unstructured":"Hubara, I., Courbariaux, M., Soudry, D., El-Yaniv, R., Bengio, Y.: Binarized neural networks. In: Lee, D.D., Sugiyama, M., von Luxburg, U., Guyon, I., Garnett, R., (eds.): Advances in Neural Information Processing Systems 29: Annual Conference on Neural Information Processing Systems 2016, pp. 4107\u20134115, 5-10 December 2016, Barcelona, Spain (2016)"},{"key":"8_CR12","doi-asserted-by":"crossref","unstructured":"McKinstry, J.L., et al.: Discovering low-precision networks close to full-precision networks for efficient embedded inference. CoRR abs\/1809.04191 (2018)","DOI":"10.1109\/EMC2-NIPS53020.2019.00009"},{"key":"8_CR13","doi-asserted-by":"crossref","unstructured":"Liu, Z.G., Mattina, M.: Learning low-precision neural networks without straight-through estimator(ste). CoRR abs\/1903.01061 (2019)","DOI":"10.24963\/ijcai.2019\/425"},{"key":"8_CR14","unstructured":"Nagel, M., Amjad, R.A., van Baalen, M., Louizos, C., Blankevoort, T.: Up or down? adaptive rounding for post-training quantization. In: Proceedings of the 37th International Conference on Machine Learning, ICML 2020, pp. 7197\u20137206, 13-18 July 2020, Virtual Event. Volume 119 of Proceedings of Machine Learning Research, PMLR (2020)"},{"key":"8_CR15","unstructured":"Choi, J., Wang, Z., Venkataramani, S., Chuang, P.I., Srinivasan, V., Gopalakrishnan, K.: PACT: parameterized clipping activation for quantized neural networks. CoRR abs\/1805.06085 (2018)"},{"key":"8_CR16","unstructured":"Esser, S.K., McKinstry, J.L., Bablani, D., Appuswamy, R., Modha, D.S.: Learned step size quantization. In: 8th International Conference on Learning Representations, ICLR 2020, Addis Ababa, Ethiopia, April 26\u201330 (2020), OpenReview.net (2020)"},{"key":"8_CR17","unstructured":"Jain, S.R., Gural, A., Wu, M., Dick, C.: Trained quantization thresholds for accurate and efficient fixed-point inference of deep neural networks. In: Dhillon, I.S., Papailiopoulos, D.S., Sze, V., (eds.): Proceedings of Machine Learning and Systems 2020, MLSys 2020, Austin, TX, USA, 2\u20134 March 2020, mlsys.org (2020)"},{"key":"8_CR18","unstructured":"Banner, R., Nahshan, Y., Hoffer, E., Soudry, D.: ACIQ: analytical clipping for integer quantization of neural networks. CoRR abs\/1810.05723 (2018)"},{"key":"8_CR19","unstructured":"Finkelstein, A., Almog, U., Grobman, M.: Fighting quantization bias with bias. CoRR abs\/1906.03193 (2019)"},{"key":"8_CR20","doi-asserted-by":"crossref","unstructured":"Choukroun, Y., Kravchik, E., Yang, F., Kisilev, P.: Low-bit quantization of neural networks for efficient inference. In: 2019 IEEE\/CVF International Conference on Computer Vision Workshops, ICCV Workshops 2019, pp. 3009\u20133018. Seoul, Korea (South), 27-28 October 2019. IEEE (2019)","DOI":"10.1109\/ICCVW.2019.00363"},{"key":"8_CR21","unstructured":"Hubara, I., Nahshan, Y., Hanani, Y., Banner, R., Soudry, D.: Improving post training neural quantization: layer-wise calibration and integer programming. CoRR abs\/2006.10518 (2020)"},{"key":"8_CR22","unstructured":"Li, Y., et al.: BRECQ: pushing the limit of post-training quantization by block reconstruction. In: 9th International Conference on Learning Representations, ICLR 2021, Virtual Event, Austria, 3\u20137 May 2021. OpenReview.net (2021)"},{"key":"8_CR23","unstructured":"Hinton, G.E., Vinyals, O., Dean, J.: Distilling the knowledge in a neural network. CoRR abs\/1503.02531 (2015)"},{"key":"8_CR24","unstructured":"Mishra, A.K., Marr, D.: Apprentice: using knowledge distillation techniques to improve low-precision network accuracy. In: 6th International Conference on Learning Representations, ICLR 2018, Vancouver, BC, Canada, 30 April - 3 May 2018. Conference Track Proceedings, OpenReview.net (2018)"},{"key":"8_CR25","unstructured":"Polino, A., Pascanu, R., Alistarh, D.: Model compression via distillation and quantization. In: 6th International Conference on Learning Representations, ICLR 2018, Vancouver, BC, Canada, 30 April - 3 May 2018. Conference Track Proceedings, OpenReview.net (2018)"},{"key":"8_CR26","doi-asserted-by":"crossref","unstructured":"Zhuang, B., Shen, C., Tan, M., Liu, L., Reid, I.: Towards effective low-bitwidth convolutional neural networks. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) (2018)","DOI":"10.1109\/CVPR.2018.00826"},{"issue":"3","key":"8_CR27","doi-asserted-by":"publisher","first-page":"211","DOI":"10.1007\/s11263-015-0816-y","volume":"115","author":"O Russakovsky","year":"2015","unstructured":"Russakovsky, O., et al.: Imagenet large scale visual recognition challenge. Int. J. Comput. Vis. 115(3), 211\u2013252 (2015)","journal-title":"Int. J. Comput. Vis."},{"key":"8_CR28","doi-asserted-by":"crossref","unstructured":"He, K., Zhang, X., Ren, S., Sun, J.: Deep residual learning for image recognition. In: 2016 IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2016, pp. 770\u2013778. Las Vegas, NV, USA, 27-30 June 2016. IEEE Computer Society (2016)","DOI":"10.1109\/CVPR.2016.90"},{"key":"8_CR29","doi-asserted-by":"crossref","unstructured":"Radosavovic, I., Kosaraju, R.P., Girshick, R.B., He, K., Doll\u00e1r, P.: Designing network design spaces. In: 2020 IEEE\/CVF Conference on Computer Vision and Pattern Recognition, CVPR 2020, pp. 10425\u201310433. Seattle, WA, USA, 13\u201319 June 2020. Computer Vision Foundation \/ IEEE (2020)","DOI":"10.1109\/CVPR42600.2020.01044"},{"key":"8_CR30","doi-asserted-by":"crossref","unstructured":"Tan, M., et al.: MnasNet: platform-aware neural architecture search for mobile. In: IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2019, pp. 2820\u20132828. Long Beach, CA, USA, 16\u201320 June 2019. Computer Vision Foundation \/ IEEE (2019)","DOI":"10.1109\/CVPR.2019.00293"},{"key":"8_CR31","doi-asserted-by":"crossref","unstructured":"Sandler, M., Howard, A.G., Zhu, M., Zhmoginov, A., Chen, L.: Mobilenetv 2: Inverted residuals and linear bottlenecks. In: 2018 IEEE Conference on Computer Vision and Pattern Recognition, CVPR 2018, pp. 4510\u20134520. Salt Lake City, UT, USA, 18\u201322 June 2018. Computer Vision Foundation \/ IEEE Computer Society (2018)","DOI":"10.1109\/CVPR.2018.00474"},{"key":"8_CR32","unstructured":"Gluska, S., Grobman, M.: Exploring neural networks quantization via layer-wise quantization analysis. CoRR abs\/2012.08420 (2020)"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2022 Workshops"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-25082-8_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,3,7]],"date-time":"2024-03-07T13:03:03Z","timestamp":1709816583000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-25082-8_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023]]},"ISBN":["9783031250811","9783031250828"],"references-count":32,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-25082-8_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2023]]},"assertion":[{"value":"12 February 2023","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Tel Aviv","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Israel","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2022","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"23 October 2022","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"27 October 2022","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"17","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2022","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2022.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Double-blind","order":1,"name":"type","label":"Type","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"CMT","order":2,"name":"conference_management_system","label":"Conference Management System","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"5804","order":3,"name":"number_of_submissions_sent_for_review","label":"Number of Submissions Sent for Review","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"1645","order":4,"name":"number_of_full_papers_accepted","label":"Number of Full Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"0","order":5,"name":"number_of_short_papers_accepted","label":"Number of Short Papers Accepted","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"28% - The value is computed by the equation \"Number of Full Papers Accepted \/ Number of Submissions Sent for Review * 100\" and then rounded to a whole number.","order":6,"name":"acceptance_rate_of_full_papers","label":"Acceptance Rate of Full Papers","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.21","order":7,"name":"average_number_of_reviews_per_paper","label":"Average Number of Reviews per Paper","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"3.91","order":8,"name":"average_number_of_papers_per_reviewer","label":"Average Number of Papers per Reviewer","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"Yes","order":9,"name":"external_reviewers_involved","label":"External Reviewers Involved","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}},{"value":"From the workshops, 367 reviewed full papers have been selected for publication","order":10,"name":"additional_info_on_review_process","label":"Additional Info on Review Process","group":{"name":"ConfEventPeerReviewInformation","label":"Peer Review Information (provided by the conference organizers)"}}]}}