{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,3,28]],"date-time":"2025-03-28T02:53:32Z","timestamp":1743130412769,"version":"3.40.3"},"publisher-location":"Cham","reference-count":32,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783031736605"},{"type":"electronic","value":"9783031736612"}],"license":[{"start":{"date-parts":[[2024,11,10]],"date-time":"2024-11-10T00:00:00Z","timestamp":1731196800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2024,11,10]],"date-time":"2024-11-10T00:00:00Z","timestamp":1731196800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025]]},"DOI":"10.1007\/978-3-031-73661-2_13","type":"book-chapter","created":{"date-parts":[[2024,11,9]],"date-time":"2024-11-09T11:08:21Z","timestamp":1731150501000},"page":"230-246","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["POCA: Post-training Quantization with\u00a0Temporal Alignment for\u00a0Codec Avatars"],"prefix":"10.1007","author":[{"given":"Jian","family":"Meng","sequence":"first","affiliation":[]},{"given":"Yuecheng","family":"Li","sequence":"additional","affiliation":[]},{"given":"Chenghui","family":"Li","sequence":"additional","affiliation":[]},{"given":"Syed Shakib","family":"Sarwar","sequence":"additional","affiliation":[]},{"given":"Dilin","family":"Wang","sequence":"additional","affiliation":[]},{"given":"Jae-sun","family":"Seo","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2024,11,10]]},"reference":[{"key":"13_CR1","first-page":"348","volume":"1","author":"J Choi","year":"2019","unstructured":"Choi, J., Venkataramani, S., Srinivasan, V.V., Gopalakrishnan, K., Wang, Z., Chuang, P.: Accurate and efficient 2-bit quantized neural networks. Proc. Mach. Learn. Syst. 1, 348\u2013359 (2019)","journal-title":"Proc. Mach. Learn. Syst."},{"key":"13_CR2","unstructured":"Esser, S.K., McKinstry, J.L., Bablani, D., Appuswamy, R., Modha, D.S.: Learned step size quantization. In: International Conference on Learning Representations (ICLR) (2020)"},{"key":"13_CR3","doi-asserted-by":"crossref","unstructured":"Fu, Y., et al.: Auto-card: efficient and robust codec avatar driving for real-time mobile telepresence. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2023)","DOI":"10.1109\/CVPR52729.2023.02015"},{"key":"13_CR4","unstructured":"Gorbachev, Y., Fedorov, M., Slavutin, I., Tugarev, A., Fatekhov, M., Tarkan, Y.: Openvino deep learning workbench: comprehensive analysis and tuning of neural networks inference. In: Proceedings of the IEEE\/CVF International Conference on Computer Vision Workshops (CVPR-W) (2019)"},{"key":"13_CR5","doi-asserted-by":"crossref","unstructured":"Han, Y., Yang, S., Wang, W., Liu, J.: From design draft to real attire: unaligned fashion image translation. In: Proceedings of the 28th ACM International Conference on Multimedia, pp. 1533-1541 (2020)","DOI":"10.1145\/3394171.3413953"},{"key":"13_CR6","unstructured":"Kingma, D.P., Welling, M.: Auto-encoding variational bayes. arXiv preprint arXiv:1312.6114 (2013)"},{"key":"13_CR7","doi-asserted-by":"crossref","unstructured":"Le, H., et al.: Mobilecodec: neural inter-frame video compression on mobile devices. In: Proceedings of the 13th ACM Multimedia Systems Conference, pp. 324\u2013330 (2022)","DOI":"10.1145\/3524273.3532906"},{"key":"13_CR8","doi-asserted-by":"crossref","unstructured":"Ledig, C., et\u00a0al.: Photo-realistic single image super-resolution using a generative adversarial network. In: Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition, pp. 4681\u20134690 (2017)","DOI":"10.1109\/CVPR.2017.19"},{"issue":"8","key":"13_CR9","first-page":"2","volume":"1","author":"JP Lewis","year":"2014","unstructured":"Lewis, J.P., Anjyo, K., Rhee, T., Zhang, M., Pighin, F.H., Deng, Z.: Practice and theory of blendshape facial models. Eurograph. (State Rep.) 1(8), 2 (2014)","journal-title":"Eurograph. (State Rep.)"},{"key":"13_CR10","unstructured":"Li, Y., Dong, X., Wang, W.: Additive powers-of-two quantization: an efficient non-uniform discretization for neural networks. In: International Conference on Learning Representations (ICLR) (2020)"},{"key":"13_CR11","unstructured":"Li, Y., et al.: BRECQ: pushing the limit of post-training quantization by block reconstruction. In: International Conference on Learning Representations (ICLR) (2021)"},{"key":"13_CR12","doi-asserted-by":"crossref","unstructured":"Liu, Y., Yang, H., Dong, Z., Keutzer, K., Du, L., Zhang, S.: Noisyquant: noisy bias-enhanced post-training activation quantization for vision transformers. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2023)","DOI":"10.1109\/CVPR52729.2023.01946"},{"key":"13_CR13","doi-asserted-by":"crossref","unstructured":"Liu, Z., Cheng, K.T., Huang, D., Xing, E.P., Shen, Z.: Nonuniform-to-uniform quantization: Towards accurate quantization via generalized straight-through estimation. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2022)","DOI":"10.1109\/CVPR52688.2022.00489"},{"key":"13_CR14","doi-asserted-by":"crossref","unstructured":"Lombardi, S., Saragih, J., Simon, T., Sheikh, Y.: Deep appearance models for face rendering. ACM Trans. Graph. (ToG) (2018)","DOI":"10.1145\/3197517.3201401"},{"key":"13_CR15","doi-asserted-by":"crossref","unstructured":"Ma, S., et al.: Pixel codec avatars. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2021)","DOI":"10.1109\/CVPR46437.2021.00013"},{"key":"13_CR16","doi-asserted-by":"crossref","unstructured":"Mantiuk, R.K., et al.: FovVideoVDP: a visible difference predictor for wide field-of-view video. ACM Trans. Graph. (TOG) (2021)","DOI":"10.1145\/3476576.3476595"},{"issue":"1","key":"13_CR17","doi-asserted-by":"publisher","first-page":"99","DOI":"10.1145\/3503250","volume":"65","author":"B Mildenhall","year":"2021","unstructured":"Mildenhall, B., Srinivasan, P.P., Tancik, M., Barron, J.T., Ramamoorthi, R., Ng, R.: NeRF: representing scenes as neural radiance fields for view synthesis. Commun. ACM 65(1), 99\u2013106 (2021)","journal-title":"Commun. ACM"},{"key":"13_CR18","unstructured":"Nagel, M., Amjad, R.A., Van\u00a0Baalen, M., Louizos, C., Blankevoort, T.: Up or down? adaptive rounding for post-training quantization. In: International Conference on Machine Learning (ICML) (2020)"},{"key":"13_CR19","series-title":"Lecture Notes in Computer Science","doi-asserted-by":"publisher","first-page":"430","DOI":"10.1007\/978-3-030-58539-6_26","volume-title":"Computer Vision \u2013 ECCV 2020","author":"E Park","year":"2020","unstructured":"Park, E., Yoo, S.: PROFIT: a novel training method for sub-4-bit MobileNet models. In: Vedaldi, A., Bischof, H., Brox, T., Frahm, J.-M. (eds.) ECCV 2020. LNCS, vol. 12351, pp. 430\u2013446. Springer, Cham (2020). https:\/\/doi.org\/10.1007\/978-3-030-58539-6_26"},{"key":"13_CR20","unstructured":"Paszke, A., et al.: Pytorch: an imperative style, high-performance deep learning library. In: Advances in Neural Information Processing Systems (NeurIPS) (2019)"},{"key":"13_CR21","doi-asserted-by":"crossref","unstructured":"van Rozendaal, T., et\u00a0al.: Mobilenvc: real-time 1080p neural video compression on a mobile device. In: Proceedings of the IEEE\/CVF Winter Conference on Applications of Computer Vision, pp. 4323\u20134333 (2024)","DOI":"10.1109\/WACV57701.2024.00427"},{"key":"13_CR22","doi-asserted-by":"crossref","unstructured":"Saito, S., Schwartz, G., Simon, T., Li, J., Nam, G.: Relightable gaussian codec avatars. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition, pp. 130\u2013141 (2024)","DOI":"10.1109\/CVPR52733.2024.00021"},{"key":"13_CR23","doi-asserted-by":"crossref","unstructured":"Schwartz, G., et al.: The eyes have it: an integrated eye and face model for photorealistic facial animation. ACM Trans. Graph. (TOG) (2020)","DOI":"10.1145\/3386569.3392493"},{"key":"13_CR24","unstructured":"Siddegowda, S., Fournarakis, M., Nagel, M., Blankevoort, T., Patel, C., Khobare, A.: Neural network quantization with AI model efficiency toolkit (AIMET). arXiv preprint arXiv:2201.08442 (2022)"},{"key":"13_CR25","doi-asserted-by":"crossref","unstructured":"Tu, Z., Hu, J., Chen, H., Wang, Y.: Toward accurate post-training quantization for image super resolution. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2023)","DOI":"10.1109\/CVPR52729.2023.00567"},{"key":"13_CR26","doi-asserted-by":"crossref","unstructured":"Wang, Z., Wu, Z., Lu, J., Zhou, J.: Bidet: an efficient binarized object detector. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2020)","DOI":"10.1109\/CVPR42600.2020.00212"},{"key":"13_CR27","doi-asserted-by":"crossref","unstructured":"Wei, S.E., et al.: VR facial animation via multiview image translation. ACM Trans. Graph. (TOG) (2019)","DOI":"10.1145\/3306346.3323030"},{"key":"13_CR28","unstructured":"Wei, X., Gong, R., Li, Y., Liu, X., Yu, F.: QDrop: randomly dropping quantization for extremely low-bit post-training quantization. In: International Conference on Learning Representations (ICLR) (2022)"},{"key":"13_CR29","doi-asserted-by":"publisher","unstructured":"Wuu, C.H., et al.: Multiface: a dataset for neural face rendering. In: arXiv (2022). https:\/\/doi.org\/10.48550\/ARXIV.2207.11243, https:\/\/arxiv.org\/abs\/2207.11243","DOI":"10.48550\/ARXIV.2207.11243"},{"key":"13_CR30","unstructured":"Xiao, G., Lin, J., Seznec, M., Wu, H., Demouth, J., Han, S.: Smoothquant: accurate and efficient post-training quantization for large language models. In: International Conference on Machine Learning (ICML) (2023)"},{"key":"13_CR31","doi-asserted-by":"crossref","unstructured":"Yin, H., Gong, Y., Qiu, G.: Side window filtering. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2019)","DOI":"10.1109\/CVPR.2019.00896"},{"key":"13_CR32","doi-asserted-by":"crossref","unstructured":"Zhang, Y., Zhang, Z., Lew, L.: Pokebnn: A binary pursuit of lightweight accuracy. In: Proceedings of the IEEE\/CVF Conference on Computer Vision and Pattern Recognition (CVPR) (2022)","DOI":"10.1109\/CVPR52688.2022.01215"}],"container-title":["Lecture Notes in Computer Science","Computer Vision \u2013 ECCV 2024"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-031-73661-2_13","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2024,11,9]],"date-time":"2024-11-09T12:05:48Z","timestamp":1731153948000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-031-73661-2_13"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,11,10]]},"ISBN":["9783031736605","9783031736612"],"references-count":32,"URL":"https:\/\/doi.org\/10.1007\/978-3-031-73661-2_13","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2024,11,10]]},"assertion":[{"value":"10 November 2024","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"ECCV","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"European Conference on Computer Vision","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Milan","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Italy","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2024","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"29 September 2024","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"4 October 2024","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"18","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"eccv2024","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/eccv2024.ecva.net\/","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}