{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T16:52:03Z","timestamp":1777567923687,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":54,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T00:00:00Z","timestamp":1730073600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,28]]},"DOI":"10.1145\/3664647.3680812","type":"proceedings-article","created":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T06:59:27Z","timestamp":1729925967000},"page":"826-835","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":9,"title":["GLGait: A Global-Local Temporal Receptive Field Network for Gait Recognition in the Wild"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0005-7386-6475","authenticated-orcid":false,"given":"Guozhen","family":"Peng","sequence":"first","affiliation":[{"name":"State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8001-2703","authenticated-orcid":false,"given":"Yunhong","family":"Wang","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-1537-0715","authenticated-orcid":false,"given":"Yuwei","family":"Zhao","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-2772-8336","authenticated-orcid":false,"given":"Shaoxiong","family":"Zhang","sequence":"additional","affiliation":[{"name":"The School of Communication Engineering, Hangzhou Dianzi University, Hangzhou, Zhejiang, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3497-5052","authenticated-orcid":false,"given":"Annan","family":"Li","sequence":"additional","affiliation":[{"name":"State Key Laboratory of Virtual Reality Technology and Systems, Beihang University, Beijing, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2024,10,28]]},"reference":[{"key":"e_1_3_2_1_1_1","doi-asserted-by":"publisher","DOI":"10.1109\/TBIOM.2020.3008862"},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00676"},{"key":"e_1_3_2_1_3_1","volume-title":"Lagrange Motion Analysis and View Embeddings for Improved Gait Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 20249--20258","author":"Chai Tianrui","year":"2022","unstructured":"Tianrui Chai, Annan Li, Shaoxiong Zhang, Zilong Li, and Yunhong Wang. 2022. Lagrange Motion Analysis and View Embeddings for Improved Gait Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 20249--20258."},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v33i01.33018126"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.cviu.2018.01.007"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3262131"},{"key":"e_1_3_2_1_7_1","volume-title":"9th International Conference on Learning Representations.","author":"Dosovitskiy Alexey","year":"2021","unstructured":"Alexey Dosovitskiy, Lucas Beyer, Alexander Kolesnikov, Dirk Weissenborn, Xiaohua Zhai, Thomas Unterthiner, Mostafa Dehghani, Matthias Minderer, Georg Heigold, Sylvain Gelly, Jakob Uszkoreit, and Neil Houlsby. 2021. An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale. In 9th International Conference on Learning Representations."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20065-6_21"},{"key":"e_1_3_2_1_9_1","volume-title":"GaitGCI: Generative Counterfactual Intervention for Gait Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 5578--5588","author":"Dou Huanzhang","year":"2023","unstructured":"Huanzhang Dou, Pengyi Zhang, Wei Su, Yunlong Yu, Yining Lin, and Xi Li. 2023. GaitGCI: Generative Counterfactual Intervention for Gait Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 5578--5588."},{"key":"e_1_3_2_1_10_1","volume-title":"Exploring Deep Models for Practical Gait Recognition. arXiv preprint arXiv:2303.03301","author":"Fan Chao","year":"2023","unstructured":"Chao Fan, Saihui Hou, Yongzhen Huang, and Shiqi Yu. 2023. Exploring Deep Models for Practical Gait Recognition. arXiv preprint arXiv:2303.03301 (2023)."},{"key":"e_1_3_2_1_11_1","volume-title":"OpenGait: Revisiting Gait Recognition Towards Better Practicality. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 9707--9716","author":"Fan Chao","year":"2023","unstructured":"Chao Fan, Junhao Liang, Chuanfu Shen, Saihui Hou, Yongzhen Huang, and Shiqi Yu. 2023. OpenGait: Revisiting Gait Recognition Towards Better Practicality. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 9707--9716."},{"key":"e_1_3_2_1_12_1","volume-title":"Gaitpart: Temporal Part-based Model for Gait Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 14225--14233","author":"Fan Chao","year":"2020","unstructured":"Chao Fan, Yunjie Peng, Chunshui Cao, Xu Liu, Saihui Hou, Jiannan Chi, Yongzhen Huang, Qing Li, and Zhiqiang He. 2020. Gaitpart: Temporal Part-based Model for Gait Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 14225--14233."},{"key":"e_1_3_2_1_13_1","volume-title":"GPGait: Generalized Pose-based Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 19595--19604","author":"Fu Yang","year":"2023","unstructured":"Yang Fu, Shibei Meng, Saihui Hou, Xuecai Hu, and Yongzhen Huang. 2023. GPGait: Generalized Pose-based Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 19595--19604."},{"key":"e_1_3_2_1_14_1","volume-title":"Horizontal Pyramid Matching for Person Re-identification. In AAAI Conference on Artificial Intelligence","volume":"33","author":"Fu Yang","year":"2019","unstructured":"Yang Fu, Yunchao Wei, Yuqian Zhou, Honghui Shi, Gao Huang, Xinchao Wang, Zhiqiang Yao, and Thomas Huang. 2019. Horizontal Pyramid Matching for Person Re-identification. In AAAI Conference on Artificial Intelligence, Vol. 33. 8295--8302."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.3"},{"key":"e_1_3_2_1_16_1","volume-title":"Deep Residual Learning for Image Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 770--778","author":"He Kaiming","year":"2016","unstructured":"Kaiming He, Xiangyu Zhang, Shaoqing Ren, and Jian Sun. 2016. Deep Residual Learning for Image Recognition. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition. 770--778."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00208"},{"key":"e_1_3_2_1_18_1","unstructured":"Alexander Hermans Lucas Beyer and Bastian Leibe. 2017. In Defense of the Triplet Loss for Person Re-Identification. arXiv preprint arXiv:1703.07737 (2017)."},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-58545-7_22"},{"key":"e_1_3_2_1_20_1","volume-title":"Context-sensitive Temporal Feature Learning for Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 12909--12918","author":"Huang Xiaohu","year":"2021","unstructured":"Xiaohu Huang, Duowang Zhu, Hao Wang, Xinggang Wang, Bo Yang, Botao He, Wenyu Liu, and Bin Feng. 2021. Context-sensitive Temporal Feature Learning for Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 12909--12918."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV51070.2023.00371"},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/5.726791"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2023.3312931"},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10489-022-03543-y"},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2022.3154609"},{"key":"e_1_3_2_1_26_1","volume-title":"Proceedings of the Asian Conference on Computer Vision.","author":"Li Xiang","year":"2020","unstructured":"Xiang Li, Yasushi Makihara, Chi Xu, Yasushi Yagi, Shiqi Yu, and Mingwu Ren. 2020. End-to-end model-based gait recognition. In Proceedings of the Asian Conference on Computer Vision."},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2019.107069"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.01438"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.02279"},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00986"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.00320"},{"key":"e_1_3_2_1_32_1","volume-title":"Bag of Tricks and A Strong Baseline for Deep Person Re-identification. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops.","author":"Luo Hao","year":"2019","unstructured":"Hao Luo, Youzhi Gu, Xingyu Liao, Shenqi Lai, and Wei Jiang. 2019. Bag of Tricks and A Strong Baseline for Deep Person Re-identification. In IEEE\/CVF Conference on Computer Vision and Pattern Recognition Workshops."},{"key":"e_1_3_2_1_33_1","volume-title":"10th International Conference on Learning Representations.","author":"Mehta Sachin","year":"2022","unstructured":"Sachin Mehta and Mohammad Rastegari. 2022. MobileViT: Light-weight, General-purpose, and Mobile-friendly Vision Transformer. In 10th International Conference on Learning Representations."},{"key":"e_1_3_2_1_34_1","volume-title":"Advances in Neural Information Processing Systems","volume":"32","author":"Paszke Adam","year":"2019","unstructured":"Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, et al. 2019. Pytorch: An imperative style, high-performance deep learning library. Advances in Neural Information Processing Systems, Vol. 32 (2019)."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP49357.2023.10096917"},{"key":"e_1_3_2_1_36_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2017.590"},{"key":"e_1_3_2_1_37_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2005.39"},{"key":"e_1_3_2_1_38_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00108"},{"key":"e_1_3_2_1_39_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394171.3413802"},{"key":"e_1_3_2_1_40_1","doi-asserted-by":"publisher","DOI":"10.1186\/s41074-018-0039-6"},{"key":"e_1_3_2_1_41_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW56347.2022.00163"},{"key":"e_1_3_2_1_42_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICIP42928.2021.9506717"},{"key":"e_1_3_2_1_43_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV.2015.510"},{"key":"e_1_3_2_1_44_1","volume-title":"Advances in Neural Information Processing Systems","volume":"30","author":"Vaswani Ashish","year":"2017","unstructured":"Ashish Vaswani, Noam Shazeer, Niki Parmar, Jakob Uszkoreit, Llion Jones, Aidan N Gomez, \u0141ukasz Kaiser, and Illia Polosukhin. 2017. Attention is all you need. Advances in Neural Information Processing Systems, Vol. 30 (2017)."},{"key":"e_1_3_2_1_45_1","volume-title":"Hierarchical Spatio-Temporal Representation Learning for Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 19639--19649","author":"Wang Lei","year":"2023","unstructured":"Lei Wang, Bo Liu, Fangfang Liang, and Bincheng Wang. 2023. Hierarchical Spatio-Temporal Representation Learning for Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 19639--19649."},{"key":"e_1_3_2_1_46_1","volume-title":"DyGait: Exploiting Dynamic Representations for High-performance Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 13424--13433","author":"Wang Ming","year":"2023","unstructured":"Ming Wang, Xianda Guo, Beibei Lin, Tian Yang, Zheng Zhu, Lincheng Li, Shunli Zhang, and Xin Yu. 2023. DyGait: Exploiting Dynamic Representations for High-performance Gait Recognition. In IEEE\/CVF International Conference on Computer Vision. 13424--13433."},{"key":"e_1_3_2_1_47_1","volume-title":"GaitParsing: Human Semantic Parsing for Gait Recognition","author":"Wang Zengbin","year":"2023","unstructured":"Zengbin Wang, Saihui Hou, Man Zhang, Xu Liu, Chunshui Cao, and Yongzhen Huang. 2023. GaitParsing: Human Semantic Parsing for Gait Recognition. IEEE Transactions on Multimedia (2023)."},{"key":"e_1_3_2_1_48_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-319-46478-7_31"},{"key":"e_1_3_2_1_49_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2021.3095809"},{"key":"e_1_3_2_1_50_1","doi-asserted-by":"publisher","DOI":"10.1109\/TMM.2022.3171961"},{"key":"e_1_3_2_1_51_1","volume-title":"Clothing and Carrying Condition on Gait Recognition. In International Conference on Pattern Recognition","volume":"4","author":"Yu Shiqi","year":"2006","unstructured":"Shiqi Yu, Daoliang Tan, and Tieniu Tan. 2006. A Framework for Evaluating the Effect of View Angle, Clothing and Carrying Condition on Gait Recognition. In International Conference on Pattern Recognition, Vol. 4. IEEE, 441--444."},{"key":"e_1_3_2_1_52_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01959"},{"key":"e_1_3_2_1_53_1","doi-asserted-by":"publisher","DOI":"10.1145\/3581783.3612052"},{"key":"e_1_3_2_1_54_1","volume-title":"Gait Recognition in the Wild: A Benchmark. In IEEE\/CVF International Conference on Computer Vision. 14789--14799","author":"Zhu Zheng","year":"2021","unstructured":"Zheng Zhu, Xianda Guo, Tian Yang, Junjie Huang, Jiankang Deng, Guan Huang, Dalong Du, Jiwen Lu, and Jie Zhou. 2021. Gait Recognition in the Wild: A Benchmark. In IEEE\/CVF International Conference on Computer Vision. 14789--14799."}],"event":{"name":"MM '24: The 32nd ACM International Conference on Multimedia","location":"Melbourne VIC Australia","acronym":"MM '24","sponsor":["SIGMM ACM Special Interest Group on Multimedia"]},"container-title":["Proceedings of the 32nd ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3680812","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3664647.3680812","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:07Z","timestamp":1750295887000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3680812"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,28]]},"references-count":54,"alternative-id":["10.1145\/3664647.3680812","10.1145\/3664647"],"URL":"https:\/\/doi.org\/10.1145\/3664647.3680812","relation":{},"subject":[],"published":{"date-parts":[[2024,10,28]]},"assertion":[{"value":"2024-10-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}