{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:10:03Z","timestamp":1755821403292,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":53,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,26]],"date-time":"2023-10-26T00:00:00Z","timestamp":1698278400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Research Foundation of Korea (NRF)","award":["2022R1A2C1011013"],"award-info":[{"award-number":["2022R1A2C1011013"]}]},{"name":"Institute of Information & Communications Technology Planning & Evaluation (IITP)","award":["2021-0-02068"],"award-info":[{"award-number":["2021-0-02068"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,26]]},"DOI":"10.1145\/3581783.3612525","type":"proceedings-article","created":{"date-parts":[[2023,10,27]],"date-time":"2023-10-27T07:26:54Z","timestamp":1698391614000},"page":"4816-4827","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Globally-Robust Instance Identification and Locally-Accurate Keypoint Alignment for Multi-Person Pose Estimation"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-3053-8317","authenticated-orcid":false,"given":"Fangzheng","family":"Tian","sequence":"first","affiliation":[{"name":"Jeonbuk National University, Jeonju , Republic of Korea"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-5887-5606","authenticated-orcid":false,"given":"Sungchan","family":"Kim","sequence":"additional","affiliation":[{"name":"Jeonbuk National University, Jeonju , Republic of Korea"}]}],"member":"320","published-online":{"date-parts":[[2023,10,27]]},"reference":[{"doi-asserted-by":"publisher","key":"e_1_3_2_1_1_1","DOI":"10.1109\/ICCV48922.2021.01164"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_2_1","DOI":"10.1109\/CVPR.2017.143"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_3_1","DOI":"10.1109\/CVPR.2018.00742"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_4_1","DOI":"10.1109\/CVPR42600.2020.00543"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_5_1","DOI":"10.1109\/CVPR.2017.601"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_6_1","DOI":"10.1109\/ICCV.2019.00667"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_7_1","DOI":"10.1109\/ICCV.2017.256"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_8_1","DOI":"10.1109\/CVPR46437.2021.01444"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_9_1","DOI":"10.1109\/ICCV.2017.322"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_10_1","DOI":"10.1109\/CVPR42600.2020.00574"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_11_1","DOI":"10.1007\/978-3-319-46466-4_3"},{"key":"e_1_3_2_1_12_1","volume-title":"PoseTrans: A Simple Yet Effective Pose Transformation Augmentation for Human Pose Estimation. In European Conference on Computer Vision. Springer, 643--659","author":"Jiang Wentao","year":"2022","unstructured":"Wentao Jiang, Sheng Jin, Wentao Liu, Chen Qian, Ping Luo, and Si Liu. 2022. PoseTrans: A Simple Yet Effective Pose Transformation Augmentation for Human Pose Estimation. In European Conference on Computer Vision. Springer, 643--659."},{"key":"e_1_3_2_1_13_1","volume-title":"Proceedings, Part VII 16","author":"Jin Sheng","year":"2020","unstructured":"Sheng Jin, Wentao Liu, Enze Xie, Wenhai Wang, Chen Qian, Wanli Ouyang, and Ping Luo. 2020. Differentiable hierarchical graph grouping for multi-person pose estimation. In Computer Vision-ECCV 2020: 16th European Conference, Glasgow, UK, August 23--28, 2020, Proceedings, Part VII 16. Springer, 718--734."},{"key":"e_1_3_2_1_14_1","volume-title":"Self-Constrained Inference Optimization on Structural Groups for Human Pose Estimation. In European Conference on Computer Vision. Springer, 729--745","author":"Kan Zhehan","year":"2022","unstructured":"Zhehan Kan, Shuoshuo Chen, Zeng Li, and Zhihai He. 2022. Self-Constrained Inference Optimization on Structural Groups for Human Pose Estimation. In European Conference on Computer Vision. Springer, 729--745."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_15_1","DOI":"10.1007\/978-3-030-01252-6_26"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_16_1","DOI":"10.1109\/CVPR.2019.01112"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_17_1","DOI":"10.1109\/CVPR46437.2021.00198"},{"key":"e_1_3_2_1_18_1","volume-title":"SimCC: A Simple Coordinate Classification Perspective for Human Pose Estimation. In European Conference on Computer Vision. Springer, 89--106","author":"Li Yanjie","year":"2022","unstructured":"Yanjie Li, Sen Yang, Peidong Liu, Shoukui Zhang, Yunxiao Wang, Zhicheng Wang, Wankou Yang, and Shu-Tao Xia. 2022. SimCC: A Simple Coordinate Classification Perspective for Human Pose Estimation. In European Conference on Computer Vision. Springer, 89--106."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_19_1","DOI":"10.1109\/ICCV48922.2021.01112"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_20_1","DOI":"10.1109\/ICCV.2017.324"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_21_1","DOI":"10.1007\/978-3-319-10602-1_48"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_22_1","DOI":"10.1109\/CVPR46437.2021.01306"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_23_1","DOI":"10.1007\/978-3-031-20065-6_25"},{"key":"e_1_3_2_1_24_1","volume-title":"Poseur: Direct human pose regression with transformers. In European Conference on Computer Vision","author":"Mao Weian","year":"2022","unstructured":"Weian Mao, Yongtao Ge, Chunhua Shen, Zhi Tian, Xinlong Wang, Zhibin Wang, and Anton van den Hengel. 2022. Poseur: Direct human pose regression with transformers. In European Conference on Computer Vision. Springer, 72--88."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_25_1","DOI":"10.1109\/CVPR46437.2021.00892"},{"volume-title":"Mixed Precision Training. In International Conference on Learning Representations.","author":"Micikevicius Paulius","unstructured":"Paulius Micikevicius, Sharan Narang, Jonah Alben, Gregory Diamos, Erich Elsen, David Garcia, Boris Ginsburg, Michael Houston, Oleksii Kuchaiev, Ganesh Venkatesh, et al. [n.,d.]. Mixed Precision Training. In International Conference on Learning Representations.","key":"e_1_3_2_1_26_1"},{"key":"e_1_3_2_1_27_1","volume-title":"Associative embedding: End-to-end learning for joint detection and grouping. Advances in neural information processing systems","author":"Newell Alejandro","year":"2017","unstructured":"Alejandro Newell, Zhiao Huang, and Jia Deng. 2017. Associative embedding: End-to-end learning for joint detection and grouping. Advances in neural information processing systems, Vol. 30 (2017)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_28_1","DOI":"10.1109\/ICCV.2019.00705"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_29_1","DOI":"10.1109\/CVPR.2016.533"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_30_1","DOI":"10.1007\/978-3-030-58529-7_29"},{"key":"e_1_3_2_1_31_1","volume-title":"Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems","author":"Ren Shaoqing","year":"2015","unstructured":"Shaoqing Ren, Kaiming He, Ross Girshick, and Jian Sun. 2015. Faster r-cnn: Towards real-time object detection with region proposal networks. Advances in neural information processing systems, Vol. 28 (2015)."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_32_1","DOI":"10.1109\/CVPR52688.2022.01079"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_33_1","DOI":"10.1109\/CVPR.2019.00582"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_34_1","DOI":"10.1109\/CVPR.2019.00584"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_35_1","DOI":"10.1007\/978-3-030-01231-1_33"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_36_1","DOI":"10.1109\/ICCV.2019.00972"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_37_1","DOI":"10.1109\/CVPR52688.2022.01078"},{"key":"e_1_3_2_1_38_1","first-page":"6278","article-title":"Robust Pose Estimation in Crowded Scenes with Direct Pose-Level Inference","volume":"34","author":"Wang Dongkai","year":"2021","unstructured":"Dongkai Wang, Shiliang Zhang, and Gang Hua. 2021. Robust Pose Estimation in Crowded Scenes with Direct Pose-Level Inference. Advances in Neural Information Processing Systems, Vol. 34 (2021), 6278--6289.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_1_39_1","volume-title":"Regularizing Vector Embedding in Bottom-Up Human Pose Estimation. In European Conference on Computer Vision. Springer, 107--122","author":"Wang Haixin","year":"2022","unstructured":"Haixin Wang, Lu Zhou, Yingying Chen, Ming Tang, and Jinqiao Wang. 2022b. Regularizing Vector Embedding in Bottom-Up Human Pose Estimation. In European Conference on Computer Vision. Springer, 107--122."},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_40_1","DOI":"10.1007\/978-3-030-58621-8_29"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_41_1","DOI":"10.1109\/CVPR52688.2022.01278"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_42_1","DOI":"10.1109\/CVPR.2016.511"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_43_1","DOI":"10.1007\/978-3-030-01231-1_29"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_44_1","DOI":"10.1609\/aaai.v36i3.20186"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_45_1","DOI":"10.1109\/CVPR52688.2022.01279"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_46_1","DOI":"10.1109\/CVPR52688.2022.01272"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_47_1","DOI":"10.1109\/ICCV48922.2021.01159"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_48_1","DOI":"10.1109\/CVPR.2011.5995741"},{"doi-asserted-by":"crossref","unstructured":"Ailing Zeng Xuan Ju Lei Yang Ruiyuan Gao Xizhou Zhu Bo Dai and Qiang Xu. 2022a. DeciWatch: A Simple Baseline for 10x Efficient 2D and 3D Pose Estimation. (2022).","key":"e_1_3_2_1_49_1","DOI":"10.1007\/978-3-031-20065-6_35"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_50_1","DOI":"10.1007\/978-3-031-20065-6_36"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_51_1","DOI":"10.1109\/CVPR42600.2020.00712"},{"doi-asserted-by":"publisher","key":"e_1_3_2_1_52_1","DOI":"10.1109\/CVPR.2019.00098"},{"key":"e_1_3_2_1_53_1","volume-title":"Objects as points. arXiv preprint arXiv:1904.07850","author":"Zhou Xingyi","year":"2019","unstructured":"Xingyi Zhou, Dequan Wang, and Philipp Kr\u00e4henb\u00fchl. 2019. Objects as points. arXiv preprint arXiv:1904.07850 (2019)."}],"event":{"sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"acronym":"MM '23","name":"MM '23: The 31st ACM International Conference on Multimedia","location":"Ottawa ON Canada"},"container-title":["Proceedings of the 31st ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3581783.3612525","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3581783.3612525","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T23:55:34Z","timestamp":1755820534000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3581783.3612525"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,26]]},"references-count":53,"alternative-id":["10.1145\/3581783.3612525","10.1145\/3581783"],"URL":"https:\/\/doi.org\/10.1145\/3581783.3612525","relation":{},"subject":[],"published":{"date-parts":[[2023,10,26]]},"assertion":[{"value":"2023-10-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}