{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,7,24]],"date-time":"2026-07-24T14:08:18Z","timestamp":1784902098161,"version":"3.55.0"},"publisher-location":"New York, NY, USA","reference-count":57,"publisher":"ACM","license":[{"start":{"date-parts":[[2023,10,26]],"date-time":"2023-10-26T00:00:00Z","timestamp":1698278400000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"National Nature Science Foundation of China","award":["61931008, U21B2024"],"award-info":[{"award-number":["61931008, U21B2024"]}]},{"DOI":"10.13039\/501100012166","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["2020YFB1406604"],"award-info":[{"award-number":["2020YFB1406604"]}],"id":[{"id":"10.13039\/501100012166","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Pioneer, Zhejiang Provincial Natural Science Foundation of China","award":["LDT23F01011F01"],"award-info":[{"award-number":["LDT23F01011F01"]}]},{"DOI":"10.13039\/501100005090","name":"Beijing Nova Program","doi-asserted-by":"publisher","award":["20220484063"],"award-info":[{"award-number":["20220484063"]}],"id":[{"id":"10.13039\/501100005090","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2023,10,26]]},"DOI":"10.1145\/3581783.3612052","type":"proceedings-article","created":{"date-parts":[[2023,10,27]],"date-time":"2023-10-27T07:27:30Z","timestamp":1698391650000},"page":"116-124","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":36,"title":["Parsing is All You Need for Accurate Gait Recognition in the Wild"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0002-9176-7703","authenticated-orcid":false,"given":"Jinkai","family":"Zheng","sequence":"first","affiliation":[{"name":"Hangzhou Dianzi University, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-4931-8821","authenticated-orcid":false,"given":"Xinchen","family":"Liu","sequence":"additional","affiliation":[{"name":"JD Explore Academy, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3730-6401","authenticated-orcid":false,"given":"Shuai","family":"Wang","sequence":"additional","affiliation":[{"name":"Hangzhou Dianzi University &amp; Lishui Institute of Hangzhou Dianzi University, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-1311-4023","authenticated-orcid":false,"given":"Lihao","family":"Wang","sequence":"additional","affiliation":[{"name":"Hangzhou Dianzi University, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1204-0512","authenticated-orcid":false,"given":"Chenggang","family":"Yan","sequence":"additional","affiliation":[{"name":"Hangzhou Dianzi University, Hangzhou, China"}],"role":[{"vocabulary":"crossref","role":"author"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-1633-7575","authenticated-orcid":false,"given":"Wu","family":"Liu","sequence":"additional","affiliation":[{"name":"JD Explore Academy, Beijing, China"}],"role":[{"vocabulary":"crossref","role":"author"}]}],"member":"320","published-online":{"date-parts":[[2023,10,27]]},"reference":[{"key":"e_1_3_2_2_1_1","first-page":"421","article-title":"Performance Evaluation of Model-Based Gait on Multi-View Very Large Population Database With Pose Sequences","volume":"2","author":"An Weizhi","year":"2020","unstructured":"Weizhi An, Shiqi Yu, Yasushi Makihara, Xinhui Wu, Chi Xu, Yang Yu, Rijun Liao, and Yasushi Yagi. 2020. Performance Evaluation of Model-Based Gait on Multi-View Very Large Population Database With Pose Sequences. IEEE TBBIS, Vol. 2, 4 (2020), 421--430.","journal-title":"IEEE TBBIS"},{"key":"e_1_3_2_2_2_1","volume-title":"Nixon","author":"Ariyanto Gunawan","year":"2011","unstructured":"Gunawan Ariyanto and Mark S. Nixon. 2011. Model-based 3D gait biometrics. In IJCB. 1--7."},{"key":"e_1_3_2_2_3_1","doi-asserted-by":"crossref","unstructured":"Hanqing Chao Yiwei He Junping Zhang and Jianfeng Feng. 2019. GaitSet: Regarding Gait as a Set for Cross-View Gait Recognition. In AAAI. 8126--8133.","DOI":"10.1609\/aaai.v33i01.33018126"},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"crossref","unstructured":"Chao Fan Junhao Liang Chuanfu Shen Saihui Hou Yongzhen Huang and Shiqi Yu. 2023. OpenGait: Revisiting Gait Recognition Toward Better Practicality. In CVPR. 9707--9716.","DOI":"10.1109\/CVPR52729.2023.00936"},{"key":"e_1_3_2_2_5_1","doi-asserted-by":"crossref","unstructured":"Chao Fan Yunjie Peng Chunshui Cao Xu Liu Saihui Hou Jiannan Chi Yongzhen Huang Qing Li and Zhiqiang He. 2020. GaitPart: Temporal Part-Based Model for Gait Recognition. In CVPR. 14213--14221.","DOI":"10.1109\/CVPR42600.2020.01423"},{"key":"e_1_3_2_2_6_1","first-page":"805","article-title":"Instance-Level Human Parsing via Part Grouping Network","volume":"11208","author":"Gong Ke","year":"2018","unstructured":"Ke Gong, Xiaodan Liang, Yicheng Li, Yimin Chen, Ming Yang, and Liang Lin. 2018. Instance-Level Human Parsing via Part Grouping Network. In ECCV, Vol. 11208. 805--822.","journal-title":"ECCV"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"crossref","unstructured":"Ke Gong Xiaodan Liang Dongyu Zhang Xiaohui Shen and Liang Lin. 2017. Look into Person: Self-Supervised Structure-Sensitive Learning and a New Benchmark for Human Parsing. In CVPR. 6757--6765.","DOI":"10.1109\/CVPR.2017.715"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2006.38"},{"key":"e_1_3_2_2_9_1","doi-asserted-by":"crossref","unstructured":"Kaiming He Xiangyu Zhang Shaoqing Ren and Jian Sun. 2016. Deep Residual Learning for Image Recognition. In CVPR. 770--778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_2_10_1","first-page":"2281","article-title":"Clothing-invariant gait identification using part-based clothing categorization and adaptive weight control","volume":"43","author":"Altab Hossain Md.","year":"2010","unstructured":"Md. Altab Hossain, Yasushi Makihara, Junqiu Wang, and Yasushi Yagi. 2010. Clothing-invariant gait identification using part-based clothing categorization and adaptive weight control. PR, Vol. 43, 6 (2010), 2281--2291.","journal-title":"PR"},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"crossref","unstructured":"Saihui Hou Chunshui Cao Xu Liu and Yongzhen Huang. 2020. Gait Lateral Network: Learning Discriminative and Compact Representations for Gait Recognition. In ECCV. 382--398.","DOI":"10.1007\/978-3-030-58545-7_22"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"crossref","unstructured":"Xiaohu Huang Duowang Zhu Hao Wang Xinggang Wang Bo Yang Botao He Wenyu Liu and Bin Feng. 2021. Context-Sensitive Temporal Feature Learning for Gait Recognition. In ICCV. 12909--12918.","DOI":"10.1109\/ICCV48922.2021.01267"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIFS.2012.2204253"},{"key":"e_1_3_2_2_14_1","volume-title":"Kingma and Jimmy Ba","author":"Diederik","year":"2015","unstructured":"Diederik P. Kingma and Jimmy Ba. 2015. Adam: A Method for Stochastic Optimization. In ICLR."},{"key":"e_1_3_2_2_15_1","volume-title":"Kipf and Max Welling","author":"Thomas","year":"2017","unstructured":"Thomas N. Kipf and Max Welling. 2017. Semi-Supervised Classification with Graph Convolutional Networks. In ICLR."},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2019.107069"},{"key":"e_1_3_2_2_17_1","unstructured":"Beibei Lin Shunli Zhang and Xin Yu. 2021. Gait Recognition via Effective Global-Local Feature Representation and Local Temporal Aggregation. In ICCV. 14648--14656."},{"key":"e_1_3_2_2_18_1","unstructured":"Kunliang Liu Ouk Choi Jianming Wang and Wonjun Hwang. 2022b. CDGNet: Class Distribution Guided Network for Human Parsing. In CVPR. 4473--4482."},{"key":"e_1_3_2_2_19_1","doi-asserted-by":"crossref","unstructured":"Si Liu Xiaodan Liang Luoqi Liu Ke Lu Liang Lin and Shuicheng Yan. 2014. Fashion Parsing with Video Context. In ACM MM. 467--476.","DOI":"10.1145\/2647868.2654932"},{"key":"e_1_3_2_2_20_1","volume-title":"Recent Advances in Monocular 2D and 3D Human Pose Estimation: A Deep Learning Perspective. Comput. Surveys","author":"Liu Wu","year":"2022","unstructured":"Wu Liu, Qian Bao, Yu Sun, and Tao Mei. 2022a. Recent Advances in Monocular 2D and 3D Human Pose Estimation: A Deep Learning Perspective. Comput. Surveys (2022)."},{"key":"e_1_3_2_2_21_1","doi-asserted-by":"crossref","unstructured":"Xinchen Liu Wu Liu Jinkai Zheng Chenggang Yan and Tao Mei. 2020. Beyond the Parts: Learning Multi-view Cross-part Correlation for Vehicle Re-identification. In ACM MM. 907--915.","DOI":"10.1145\/3394171.3413578"},{"key":"e_1_3_2_2_22_1","volume-title":"Swin Transformer: Hierarchical Vision Transformer using Shifted Windows. In ICCV. 9992--10002.","author":"Liu Ze","year":"2021","unstructured":"Ze Liu, Yutong Lin, Yue Cao, Han Hu, Yixuan Wei, Zheng Zhang, Stephen Lin, and Baining Guo. 2021. Swin Transformer: Hierarchical Vision Transformer using Shifted Windows. In ICCV. 9992--10002."},{"key":"e_1_3_2_2_23_1","doi-asserted-by":"crossref","unstructured":"Xianghui Luo Zhuo Su Jiaming Guo Gengwei Zhang and Xiangjian He. 2018. Trusted Guidance Pyramid Network for Human Parsing. In ACM MM. 654--662.","DOI":"10.1145\/3240508.3240634"},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"crossref","unstructured":"Yasushi Makihara Hidetoshi Mannami and Yasushi Yagi. 2010. Gait Analysis of Gender and Age Using a Large-Scale Multi-view Gait Database. In ACCV. 440--451.","DOI":"10.1007\/978-3-642-19309-5_34"},{"key":"e_1_3_2_2_25_1","volume-title":"Adelson","author":"Niyogi Sourabh A.","year":"1994","unstructured":"Sourabh A. Niyogi and Edward H. Adelson. 1994. Analyzing and recognizing walking figures in XYT. In CVPR. 469--474."},{"key":"e_1_3_2_2_26_1","volume-title":"A stochastic approximation method. The annals of mathematical statistics","author":"Robbins Herbert","year":"1951","unstructured":"Herbert Robbins and Sutton Monro. 1951. A stochastic approximation method. The annals of mathematical statistics (1951), 400--407."},{"key":"e_1_3_2_2_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2005.39"},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1002\/j.1538-7305.1948.tb01338.x"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"crossref","unstructured":"Kohei Shiraga Yasushi Makihara Daigo Muramatsu Tomio Echigo and Yasushi Yagi. 2016. GEINet: View-invariant gait recognition using a convolutional neural network. In ICB. 1--8.","DOI":"10.1109\/ICB.2016.7550060"},{"key":"e_1_3_2_2_30_1","first-page":"4","article-title":"Multi-view large population gait dataset and its performance evaluation for cross-view gait recognition","volume":"10","author":"Takemura Noriko","year":"2018","unstructured":"Noriko Takemura, Yasushi Makihara, Daigo Muramatsu, Tomio Echigo, and Yasushi Yagi. 2018. Multi-view large population gait dataset and its performance evaluation for cross-view gait recognition. IPSJ TCVA, Vol. 10 (2018), 4.","journal-title":"IPSJ TCVA"},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"crossref","unstructured":"Daoliang Tan Kaiqi Huang Shiqi Yu and Tieniu Tan. 2006. Efficient Night Gait Recognition Based on Template Matching. In ICPR. 1000--1003.","DOI":"10.1109\/ICPR.2006.478"},{"key":"e_1_3_2_2_32_1","volume-title":"Stefan H\u00f6 rmann, and Gerhard Rigoll","author":"Teepe Torben","year":"2021","unstructured":"Torben Teepe, Ali Khan, Johannes Gilg, Fabian Herzog, Stefan H\u00f6 rmann, and Gerhard Rigoll. 2021. Gaitgraph: Graph Convolutional Network for Skeleton-Based Gait Recognition. In ICIP. 2314--2318."},{"key":"e_1_3_2_2_33_1","doi-asserted-by":"crossref","unstructured":"Akira Tsuji Yasushi Makihara and Yasushi Yagi. 2010. Silhouette transformation based on walking speed for gait identification. In CVPR. 717--722.","DOI":"10.1109\/CVPR.2010.5540144"},{"key":"e_1_3_2_2_34_1","first-page":"5","article-title":"The OU-ISIR Large Population Gait Database with real-life carried object and its performance evaluation","volume":"10","author":"Zasim Uddin Md.","year":"2018","unstructured":"Md. Zasim Uddin, Trung Ngo Thanh, Yasushi Makihara, Noriko Takemura, Xiang Li, Daigo Muramatsu, and Yasushi Yagi. 2018. The OU-ISIR Large Population Gait Database with real-life carried object and its performance evaluation. IPSJ TCVA, Vol. 10 (2018), 5.","journal-title":"IPSJ TCVA"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"crossref","unstructured":"Raquel Urtasun and Pascal Fua. 2004. 3D Tracking for Gait Characterization and Recognition. In FGR. 17--22.","DOI":"10.1109\/AFGR.2004.1301503"},{"key":"e_1_3_2_2_36_1","volume-title":"Phoha","author":"Wan Changsheng","year":"2019","unstructured":"Changsheng Wan, Li Wang, and Vir V. Phoha. 2019. A Survey on Gait Recognition. ACM CSUR, Vol. 51, 5 (2019), 89:1--89:35."},{"key":"e_1_3_2_2_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.2983686"},{"key":"e_1_3_2_2_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2003.1251144"},{"key":"e_1_3_2_2_39_1","doi-asserted-by":"crossref","unstructured":"Wenguan Wang Hailong Zhu Jifeng Dai Yanwei Pang Jianbing Shen and Ling Shao. 2020. Hierarchical human parsing with typed part-relation reasoning. In CVPR. 8929--8939.","DOI":"10.1109\/CVPR42600.2020.00895"},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2016.2545669"},{"key":"e_1_3_2_2_41_1","first-page":"24","article-title":"The OU-ISIR Gait Database comprising the Large Population Dataset with Age and performance evaluation of age estimation","volume":"9","author":"Xu Chi","year":"2017","unstructured":"Chi Xu, Yasushi Makihara, Gakuto Ogi, Xiang Li, Yasushi Yagi, and Jianfeng Lu. 2017. The OU-ISIR Gait Database comprising the Large Population Dataset with Age and performance evaluation of age estimation. IPSJ TCVA, Vol. 9 (2017), 24.","journal-title":"IPSJ TCVA"},{"key":"e_1_3_2_2_42_1","first-page":"1057","article-title":"Automated person recognition by walking and running via model-based approaches","volume":"37","author":"Yam Chew-Yean","year":"2004","unstructured":"Chew-Yean Yam, Mark S. Nixon, and John N. Carter. 2004. Automated person recognition by walking and running via model-based approaches. PR, Vol. 37, 5 (2004), 1057--1072.","journal-title":"PR"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"crossref","unstructured":"Koichiro Yamauchi Bir Bhanu and Hideo Saito. 2009. Recognition of walking humans in 3D: Initial results. In CVPRW. 45--52.","DOI":"10.1109\/CVPRW.2009.5204296"},{"key":"e_1_3_2_2_44_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2020.2975798"},{"key":"e_1_3_2_2_45_1","first-page":"43","article-title":"Task-Adaptive Attention for Image Captioning","volume":"32","author":"Yan Chenggang","year":"2022","unstructured":"Chenggang Yan, Yiming Hao, Liang Li, Jian Yin, Anan Liu, Zhendong Mao, Zhenyu Chen, and Xingyu Gao. 2022a. Task-Adaptive Attention for Image Captioning. IEEE TCSVT, Vol. 32, 1 (2022), 43--51.","journal-title":"IEEE TCSVT"},{"key":"e_1_3_2_2_46_1","volume-title":"TOMM","volume":"16","author":"Yan Chenggang","year":"2021","unstructured":"Chenggang Yan, Zhisheng Li, Yongbing Zhang, Yutao Liu, Xiangyang Ji, and Yong-Dong Zhang. 2021b. Depth Image Denoising Using Nuclear Norm and Learning Graph Model. TOMM, Vol. 16, 4 (2021), 122:1--122:17."},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1145\/3472810"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"publisher","DOI":"10.1145\/3468872"},{"key":"e_1_3_2_2_49_1","doi-asserted-by":"crossref","unstructured":"Shiqi Yu Daoliang Tan and Tieniu Tan. 2006. A Framework for Evaluating the Effect of View Angle Clothing and Carrying Condition on Gait Recognition. In ICPR. 441--444.","DOI":"10.1109\/ICPR.2006.67"},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"crossref","unstructured":"Shaoxiong Zhang Yunhong Wang and Annan Li. 2021. Cross-View Gait Recognition With Deep Universal Linear Embeddings. In CVPR. 9095--9104.","DOI":"10.1109\/CVPR46437.2021.00898"},{"key":"e_1_3_2_2_51_1","doi-asserted-by":"crossref","unstructured":"Ziyuan Zhang Luan Tran Xi Yin Yousef Atoum Xiaoming Liu Jian Wan and Nanxin Wang. 2019. Gait Recognition via Disentangled Representation Learning. In CVPR. 4710--4719.","DOI":"10.1109\/CVPR.2019.00484"},{"key":"e_1_3_2_2_52_1","doi-asserted-by":"crossref","unstructured":"Guoying Zhao Guoyi Liu Hua Li and Matti Pietik\u00e4inen. 2006. 3D Gait Recognition Using Multiple Cameras. In FGR. 529--534.","DOI":"10.1109\/FGR.2006.2"},{"key":"e_1_3_2_2_53_1","unstructured":"Hengshuang Zhao Jianping Shi Xiaojuan Qi Xiaogang Wang and Jiaya Jia. 2017. Pyramid Scene Parsing Network. In CVPR. 6230--6239."},{"key":"e_1_3_2_2_54_1","doi-asserted-by":"crossref","unstructured":"Jinkai Zheng Xinchen Liu Xiaoyan Gu Yaoqi Sun Chuang Gan Jiyong Zhang Wu Liu and Chenggang Yan. 2022a. Gait Recognition in the Wild with Multi-hop Temporal Switch. In ACM MM. 6136--6145.","DOI":"10.1145\/3503161.3547897"},{"key":"e_1_3_2_2_55_1","doi-asserted-by":"crossref","unstructured":"Jinkai Zheng Xinchen Liu Wu Liu Lingxiao He Chenggang Yan and Tao Mei. 2022b. Gait Recognition in the Wild with Dense 3D Representations and A Benchmark. In CVPR. 20228--20237.","DOI":"10.1109\/CVPR52688.2022.01959"},{"key":"e_1_3_2_2_56_1","doi-asserted-by":"crossref","unstructured":"Qixian Zhou Xiaodan Liang Ke Gong and Liang Lin. 2018. Adaptive Temporal Encoding Network for Video Instance-level Human Parsing. In ACM MM. 1527--1535.","DOI":"10.1145\/3240508.3240660"},{"key":"e_1_3_2_2_57_1","unstructured":"Zheng Zhu Xianda Guo Tian Yang Junjie Huang Jiankang Deng Guan Huang Dalong Du Jiwen Lu and Jie Zhou. 2021. Gait Recognition in the Wild: A Benchmark. In ICCV. 14789--14799."}],"event":{"name":"MM '23: The 31st ACM International Conference on Multimedia","location":"Ottawa ON Canada","acronym":"MM '23","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 31st ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3581783.3612052","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3581783.3612052","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:03:11Z","timestamp":1755820991000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3581783.3612052"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2023,10,26]]},"references-count":57,"alternative-id":["10.1145\/3581783.3612052","10.1145\/3581783"],"URL":"https:\/\/doi.org\/10.1145\/3581783.3612052","relation":{},"subject":[],"published":{"date-parts":[[2023,10,26]]},"assertion":[{"value":"2023-10-27","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}