{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T05:05:22Z","timestamp":1750309522732,"version":"3.41.0"},"publisher-location":"New York, NY, USA","reference-count":31,"publisher":"ACM","license":[{"start":{"date-parts":[[2024,10,28]],"date-time":"2024-10-28T00:00:00Z","timestamp":1730073600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"the Fundamental Research Funds for the Central Universities","award":["2024JBMC003"],"award-info":[{"award-number":["2024JBMC003"]}]},{"name":"Beijing Natural Science Foundation","award":["4242028, L231012"],"award-info":[{"award-number":["4242028, L231012"]}]},{"DOI":"10.13039\/https:\/\/doi.org\/10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62376021, 62006015, 61971446"],"award-info":[{"award-number":["62376021, 62006015, 61971446"]}],"id":[{"id":"10.13039\/https:\/\/doi.org\/10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"Aviation Science Foundation of China","award":["2023Z0710M5001"],"award-info":[{"award-number":["2023Z0710M5001"]}]},{"name":"CEFLA Audio-Video Restoration and Evaluation Key Lab of Ministry of Culture and Tourism"},{"name":"the Open Project of Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, Anhui University","award":["MMC202401"],"award-info":[{"award-number":["MMC202401"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2024,10,28]]},"DOI":"10.1145\/3664647.3680791","type":"proceedings-article","created":{"date-parts":[[2024,10,26]],"date-time":"2024-10-26T06:59:49Z","timestamp":1729925989000},"page":"8865-8873","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Probabilistic Distillation Transformer: Modelling Uncertainties for Visual Abductive Reasoning"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2206-5051","authenticated-orcid":false,"given":"Wanru","family":"Xu","sequence":"first","affiliation":[{"name":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8032-5769","authenticated-orcid":false,"given":"Zhenjiang","family":"Miao","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6054-7970","authenticated-orcid":false,"given":"Yi","family":"Tian","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6255-9422","authenticated-orcid":false,"given":"Yigang","family":"Cen","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-9520-5425","authenticated-orcid":false,"given":"Lili","family":"Wan","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7578-7969","authenticated-orcid":false,"given":"Ma","family":"Xiaole","sequence":"additional","affiliation":[{"name":"School of Computer Science and Technology, Beijing Jiaotong University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2024,10,28]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Proceedings of the acl workshop on intrinsic and extrinsic evaluation measures for machine translation and\/or summarization. 65--72","author":"Banerjee Satanjeev","year":"2005","unstructured":"Satanjeev Banerjee and Alon Lavie. 2005. METEOR: An automatic metric for MT evaluation with improved correlation with human judgments. In Proceedings of the acl workshop on intrinsic and extrinsic evaluation measures for machine translation and\/or summarization. 65--72."},{"key":"e_1_3_2_1_2_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/P19-1285"},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.1109\/TPAMI.2022.3210780"},{"key":"e_1_3_2_1_4_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR46437.2021.00223"},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00532"},{"key":"e_1_3_2_1_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_1_7_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-031-20059-5_32"},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.00593"},{"key":"e_1_3_2_1_9_1","volume-title":"International conference on machine learning. pmlr, 448--456","author":"Ioffe Sergey","year":"2015","unstructured":"Sergey Ioffe and Christian Szegedy. 2015. Batch normalization: Accelerating deep network training by reducing internal covariate shift. In International conference on machine learning. pmlr, 448--456."},{"key":"e_1_3_2_1_10_1","volume-title":"Ddp: Diffusion model for dense visual prediction. arXiv preprint arXiv:2303.17559","author":"Ji Yuanfeng","year":"2023","unstructured":"Yuanfeng Ji, Zhe Chen, Enze Xie, Lanqing Hong, Xihui Liu, Zhaoqiang Liu, Tong Lu, Zhenguo Li, and Ping Luo. 2023. Ddp: Diffusion model for dense visual prediction. arXiv preprint arXiv:2303.17559 (2023)."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2020.acl-main.233"},{"key":"e_1_3_2_1_12_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.02059"},{"key":"e_1_3_2_1_13_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acl-long.254"},{"key":"e_1_3_2_1_14_1","doi-asserted-by":"publisher","DOI":"10.24963\/ijcai.2023\/124"},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52688.2022.01512"},{"key":"e_1_3_2_1_16_1","volume-title":"Rouge: A package for automatic evaluation of summaries. Text Summarization Branches Out","author":"Lin Chin-Yew","year":"2004","unstructured":"Chin-Yew Lin. 2004. Rouge: A package for automatic evaluation of summaries. Text Summarization Branches Out (2004)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"crossref","unstructured":"Qianhui Liu Dong Xing Huajin Tang De Ma and Gang Pan. 2021. Event-based Action Recognition Using Motion Information and Spiking Neural Networks.. In IJCAI. 1743--1749.","DOI":"10.24963\/ijcai.2021\/240"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"crossref","unstructured":"Wen Liu Weixin Luo Zhengxin Li Peilin Zhao Shenghua Gao et al. 2019. Margin Learning Embedded Prediction for Video Anomaly Detection with A Few Anomalies.. In IJCAI. 3023--3030.","DOI":"10.24963\/ijcai.2019\/419"},{"key":"e_1_3_2_1_19_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPRW59228.2023.00536"},{"key":"e_1_3_2_1_20_1","volume-title":"Proceedings of the 40th annual meeting on association for computational linguistics. Association for Computational Linguistics, 311--318","author":"Papineni Kishore","year":"2002","unstructured":"Kishore Papineni, Salim Roukos, Todd Ward, and Wei-Jing Zhu. 2002. BLEU: a method for automatic evaluation of machine translation. In Proceedings of the 40th annual meeting on association for computational linguistics. Association for Computational Linguistics, 311--318."},{"key":"e_1_3_2_1_21_1","volume-title":"PreCNet: Next-frame video prediction based on predictive coding","author":"Straka Zdenek","year":"2023","unstructured":"Zdenek Straka, Tom\u00e1vs Svoboda, and Matej Hoffmann. 2023. PreCNet: Next-frame video prediction based on predictive coding. IEEE Transactions on Neural Networks and Learning Systems (2023)."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2015.7299087"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICCV48922.2021.00677"},{"key":"e_1_3_2_1_24_1","unstructured":"Bofeng Wu Guocheng Niu Jun Yu Xinyan Xiao Jian Zhang and Hua Wu. 2021. Weakly supervised dense video captioning via jointly usage of knowledge distillation and cross-modal matching. In IJCAI."},{"key":"e_1_3_2_1_25_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-3-030-01252-6_29"},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3343031.3351073"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR52729.2023.01032"},{"key":"e_1_3_2_1_28_1","volume-title":"Fine-Grained Regional Prompt Tuning for Visual Abductive Reasoning. arXiv preprint arXiv:2303.10428","author":"Zhang Hao","year":"2023","unstructured":"Hao Zhang and Basura Fernando. 2023. Fine-Grained Regional Prompt Tuning for Visual Abductive Reasoning. arXiv preprint arXiv:2303.10428 (2023)."},{"key":"e_1_3_2_1_29_1","volume-title":"Bertscore: Evaluating text generation with bert. arXiv preprint arXiv:1904.09675","author":"Zhang Tianyi","year":"2019","unstructured":"Tianyi Zhang, Varsha Kishore, Felix Wu, Kilian Q Weinberger, and Yoav Artzi. 2019. Bertscore: Evaluating text generation with bert. arXiv preprint arXiv:1904.09675 (2019)."},{"key":"e_1_3_2_1_30_1","doi-asserted-by":"publisher","DOI":"10.1109\/TIP.2022.3205207"},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1109\/CVPR.2018.00911"}],"event":{"name":"MM '24: The 32nd ACM International Conference on Multimedia","sponsor":["SIGMM ACM Special Interest Group on Multimedia"],"location":"Melbourne VIC Australia","acronym":"MM '24"},"container-title":["Proceedings of the 32nd ACM International Conference on Multimedia"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3680791","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3664647.3680791","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,6,19]],"date-time":"2025-06-19T01:18:07Z","timestamp":1750295887000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3664647.3680791"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2024,10,28]]},"references-count":31,"alternative-id":["10.1145\/3664647.3680791","10.1145\/3664647"],"URL":"https:\/\/doi.org\/10.1145\/3664647.3680791","relation":{},"subject":[],"published":{"date-parts":[[2024,10,28]]},"assertion":[{"value":"2024-10-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}