{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,2,13]],"date-time":"2026-02-13T23:20:41Z","timestamp":1771024841672,"version":"3.50.1"},"publisher-location":"New York, NY, USA","reference-count":52,"publisher":"ACM","license":[{"start":{"date-parts":[[2025,7,20]],"date-time":"2025-07-20T00:00:00Z","timestamp":1752969600000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.acm.org\/publications\/policies\/copyright_policy#Background"}],"funder":[{"name":"Chongqing Natural Science Foundation","award":["CSTB2023NSCQ-LZX0170"],"award-info":[{"award-number":["CSTB2023NSCQ-LZX0170"]}]},{"DOI":"10.13039\/https:\/\/doi.org\/10.13039\/501100001809","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62472174, 62372179, 62402082"],"award-info":[{"award-number":["62472174, 62372179, 62402082"]}],"id":[{"id":"10.13039\/https:\/\/doi.org\/10.13039\/501100001809","id-type":"DOI","asserted-by":"publisher"}]},{"name":"the Open Research Fund of Key Laboratory of Advanced Theory and Application in Statistics and Data Science ?MOE, ECNU"}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,7,20]]},"DOI":"10.1145\/3690624.3709209","type":"proceedings-article","created":{"date-parts":[[2025,4,4]],"date-time":"2025-04-04T18:44:43Z","timestamp":1743792283000},"page":"1703-1714","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":5,"title":["MM-Path: Multi-modal, Multi-granularity Path Representation Learning"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0001-5933-4353","authenticated-orcid":false,"given":"Ronghui","family":"Xu","sequence":"first","affiliation":[{"name":"East China Normal University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-6755-5777","authenticated-orcid":false,"given":"Hanyin","family":"Cheng","sequence":"additional","affiliation":[{"name":"East China Normal University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4516-4637","authenticated-orcid":false,"given":"Chenjuan","family":"Guo","sequence":"additional","affiliation":[{"name":"East China Normal University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-4522-8389","authenticated-orcid":false,"given":"Hongfan","family":"Gao","sequence":"additional","affiliation":[{"name":"East China Normal University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7739-7769","authenticated-orcid":false,"given":"Jilin","family":"Hu","sequence":"additional","affiliation":[{"name":"East China Normal University, Shanghai, China and KLATASDS-MOE, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-7819-2290","authenticated-orcid":false,"given":"Sean Bin","family":"Yang","sequence":"additional","affiliation":[{"name":"Chongqing University of Posts and Telecommunications, Chongqing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1658-1079","authenticated-orcid":false,"given":"Bin","family":"Yang","sequence":"additional","affiliation":[{"name":"East China Normal University, Shanghai, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,7,20]]},"reference":[{"key":"e_1_3_2_2_1_1","unstructured":"Hangbo Bao Li Dong Songhao Piao and FuruWei. 2021. BEiT: BERT pre-training of image Transformers. In ICLR."},{"key":"e_1_3_2_2_2_1","first-page":"32897","article-title":"Vlmo: Unified visionlanguage pre-training with mixture-of-modality-experts","volume":"35","author":"Bao Hangbo","year":"2022","unstructured":"Hangbo Bao, Wenhui Wang, Li Dong, Qiang Liu, Owais Khan Mohammed, Kriti Aggarwal, Subhojit Som, Songhao Piao, and Furu Wei. 2022. Vlmo: Unified visionlanguage pre-training with mixture-of-modality-experts. NeurIPS 35 (2022), 32897--32912.","journal-title":"NeurIPS"},{"key":"e_1_3_2_2_3_1","volume-title":"Jensen","author":"Yang Sean Bin","year":"2022","unstructured":"Sean Bin Yang, Chenjuan Guo, Jilin Hu, Bin Yang, Jian Tang, and Christian S. Jensen. 2022. Weakly-supervised temporal path representation learning with contrastive curriculum learning. In ICDE. 2873--2885."},{"key":"e_1_3_2_2_4_1","doi-asserted-by":"publisher","DOI":"10.1145\/2806416.2806512"},{"key":"e_1_3_2_2_5_1","volume-title":"Contrastive trajectory similarity learning with dual-feature attention","author":"Chang Yanchuan","unstructured":"Yanchuan Chang, Jianzhong Qi, Yuxuan Liang, and Egemen Tanin. 2023. Contrastive trajectory similarity learning with dual-feature attention. In ICDE. IEEE, 2933--2945."},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.14778\/3339490.3339502"},{"key":"e_1_3_2_2_7_1","volume-title":"Price-and-time-aware dynamic ridesharing","author":"Chen Lu","unstructured":"Lu Chen, Qilu Zhong, Xiaokui Xiao, Yunjun Gao, Pengfei Jin, and Christian S Jensen. 2018. Price-and-time-aware dynamic ridesharing. In ICDE. IEEE, 1061-- 1072."},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"crossref","unstructured":"Meng Chen Zechen Li Weiming Huang Yongshun Gong and Yilong Yin. 2024. Profiling urban streets: A semi-supervised prediction model based on street view imagery and spatial topology. In KDD. 319--328.","DOI":"10.1145\/3637528.3671918"},{"key":"e_1_3_2_2_9_1","volume-title":"Pathformer: Multi-scale transformers with adaptive pathways for time series forecasting. In ICLR.","author":"Chen Peng","year":"2024","unstructured":"Peng Chen, Yingying Zhang, Yunyao Cheng, Yang Shu, Yihang Wang, Qingsong Wen, Bin Yang, and Chenjuan Guo. 2024. Pathformer: Multi-scale transformers with adaptive pathways for time series forecasting. In ICLR."},{"key":"e_1_3_2_2_10_1","doi-asserted-by":"publisher","DOI":"10.14778\/3632093.3632105"},{"key":"e_1_3_2_2_11_1","volume-title":"Arun Kumar Chandran, and Richard Ellison","author":"Chen Yile","year":"2021","unstructured":"Yile Chen, Xiucheng Li, Gao Cong, Zhifeng Bao, Cheng Long, Yiding Liu, Arun Kumar Chandran, and Richard Ellison. 2021. Robust road network representation learning: When traffic patterns meet traveling semantics. In CIKM. 211--220."},{"key":"e_1_3_2_2_12_1","volume-title":"Personalized route recommendation using big trajectory data","author":"Dai Jian","unstructured":"Jian Dai, Bin Yang, Chenjuan Guo, and Zhiming Ding. 2015. Personalized route recommendation using big trajectory data. In ICDE. IEEE, 543--554."},{"key":"e_1_3_2_2_13_1","first-page":"787","article-title":"Ul- TraMan: A unified platform for big trajectory data management and analytics","volume":"11","author":"Ding Xin","year":"2018","unstructured":"Xin Ding, Lu Chen, Yunjun Gao, Christian S Jensen, and Hujun Bao. 2018. Ul- TraMan: A unified platform for big trajectory data management and analytics. PVLDB 11, 7 (2018), 787--799.","journal-title":"PVLDB"},{"key":"e_1_3_2_2_14_1","doi-asserted-by":"publisher","DOI":"10.1109\/TVT.2020.3048336"},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"crossref","unstructured":"Noel Gorelick Matt Hancher Mike Dixon Simon Ilyushchenko David Thau and Rebecca Moore. 2017. Google Earth Engine: Planetary-scale geospatial analysis for everyone. Remote Sens. Environ. (2017).","DOI":"10.1016\/j.rse.2017.06.031"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"crossref","unstructured":"Aditya Grover and Jure Leskovec. 2016. Node2vec: Salable feature learning for networks. In KDD. 855--864.","DOI":"10.1145\/2939672.2939754"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/2694428.2694432"},{"key":"e_1_3_2_2_18_1","doi-asserted-by":"publisher","DOI":"10.14778\/3681954.3681971"},{"key":"e_1_3_2_2_19_1","volume-title":"Learning to route with sparse trajectory sets","author":"Guo Chenjuan","unstructured":"Chenjuan Guo, Bin Yang, Jilin Hu, and Christian Jensen. 2018. Learning to route with sparse trajectory sets. In ICDE. IEEE, 1073--1084."},{"key":"e_1_3_2_2_20_1","doi-asserted-by":"crossref","unstructured":"Kaiming He Xiangyu Zhang Shaoqing Ren and Jian Sun. 2016. Deep residual learning for image recognition. In CVPR. 770--778.","DOI":"10.1109\/CVPR.2016.90"},{"key":"e_1_3_2_2_21_1","volume-title":"Self-supervised trajectory representation learning with temporal regularities and travel semantics","author":"Jiang Jiawei","unstructured":"Jiawei Jiang, Dayan Pan, Houxing Ren, Xiaohan Jiang, Chao Li, and Jingyuan Wang. 2023. Self-supervised trajectory representation learning with temporal regularities and travel semantics. In ICDE. IEEE."},{"key":"e_1_3_2_2_22_1","volume-title":"BERT: Pre-training of deep bidirectional transformers for language understanding. In NAACL-HLT. 4171--4186.","author":"Ming-Wei Chang Jacob Devlin","year":"2019","unstructured":"Jacob Devlin Ming-Wei Chang Kenton and Lee Kristina Toutanova. 2019. BERT: Pre-training of deep bidirectional transformers for language understanding. In NAACL-HLT. 4171--4186."},{"key":"e_1_3_2_2_23_1","volume-title":"TEAM: Topological evolution-aware framework for traffic forecasting. PVLDB 18","author":"Kieu Duc","year":"2024","unstructured":"Duc Kieu, Tung Kieu, Peng Han, Bin Yang, Christian S. Jensen, and Bac Le. 2024. TEAM: Topological evolution-aware framework for traffic forecasting. PVLDB 18 (2024)."},{"key":"e_1_3_2_2_24_1","volume-title":"Urbangpt: Spatio-temporal large language models. In KDD. 5351--5362.","author":"Li Zhonghang","year":"2024","unstructured":"Zhonghang Li, Lianghao Xia, Jiabin Tang, Yong Xu, Lei Shi, Long Xia, Dawei Yin, and Chao Huang. 2024. Urbangpt: Spatio-temporal large language models. In KDD. 5351--5362."},{"key":"e_1_3_2_2_25_1","unstructured":"Zhonghang Li Lianghao Xia Yong Xu and Chao Huang. 2024. FlashST: A Simple and Universal Prompt-Tuning Framework for Traffic Prediction. In ICML."},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3656580"},{"key":"e_1_3_2_2_27_1","volume-title":"LightTR: A lightweight framework for federated trajectory recovery. arXiv preprint arXiv:2405.03409","author":"Liu Ziqiao","year":"2024","unstructured":"Ziqiao Liu, Hao Miao, Yan Zhao, Chenxi Liu, Kai Zheng, and Huan Li. 2024. LightTR: A lightweight framework for federated trajectory recovery. arXiv preprint arXiv:2405.03409 (2024)."},{"key":"e_1_3_2_2_28_1","doi-asserted-by":"publisher","DOI":"10.1007\/s10707-023-00507-3"},{"key":"e_1_3_2_2_29_1","doi-asserted-by":"crossref","unstructured":"Zhipeng Ma Zheyan Tu Xinhai Chen Yan Zhang Deguo Xia Guyue Zhou Yilun Chen Yu Zheng and Jiangtao Gong. 2024. More than routing: Joint GPS and route modeling for refine trajectory representation learning. In WWW. 3064--3075.","DOI":"10.1145\/3589334.3645644"},{"key":"e_1_3_2_2_30_1","unstructured":"Sachit Menon and Carl Vondrick. 2022. Visual classification via description from large language models. In ICLR."},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"crossref","unstructured":"Paul Newson and John Krumm. 2009. Hidden markov map matching through noise and sparseness. In SIGSPATIAL. 336--343.","DOI":"10.1145\/1653771.1653818"},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.14778\/3611540.3611566"},{"key":"e_1_3_2_2_33_1","volume-title":"Pytorch: An imperative style, high-performance deep learning library.","author":"Paszke Adam","year":"2019","unstructured":"Adam Paszke, Sam Gross, Francisco Massa, Adam Lerer, James Bradbury, Gregory Chanan, Trevor Killeen, Zeming Lin, Natalia Gimelshein, Luca Antiga, et al. 2019. Pytorch: An imperative style, high-performance deep learning library."},{"key":"e_1_3_2_2_34_1","doi-asserted-by":"publisher","DOI":"10.14778\/3397230.3397248"},{"key":"e_1_3_2_2_35_1","doi-asserted-by":"publisher","DOI":"10.1145\/3617500"},{"key":"e_1_3_2_2_36_1","volume-title":"Hardik Shah, Mike Zheng Shou, Rama Chellappa, and Pengchuan Zhang.","author":"Pramanick Shraman","year":"2023","unstructured":"Shraman Pramanick, Yale Song, Sayan Nag, Kevin Qinghong Lin, Hardik Shah, Mike Zheng Shou, Rama Chellappa, and Pengchuan Zhang. 2023. EgoVLPv2: Egocentric video-language pre-training with fusion in the backbone. In ICCV. 5285--5297."},{"key":"e_1_3_2_2_37_1","volume-title":"Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et al.","author":"Radford Alec","year":"2021","unstructured":"Alec Radford, Jong Wook Kim, Chris Hallacy, Aditya Ramesh, Gabriel Goh, Sandhini Agarwal, Girish Sastry, Amanda Askell, Pamela Mishkin, Jack Clark, et al. 2021. Learning transferable visual models from natural language supervision. In ICML. 8748--8763."},{"key":"e_1_3_2_2_38_1","volume-title":"Dara Bahri","author":"Tay Yi","year":"2022","unstructured":"Yi Tay, Mostafa Dehghani, Vinh Q Tran, Xavier Garcia, Jason Wei, Xuezhi Wang, Hyung Won Chung, Dara Bahri, Tal Schuster, Steven Zheng, et al. 2022. UL2: Unifying language learning paradigms. In ICLR."},{"key":"e_1_3_2_2_39_1","volume-title":"Jamie Hall, Noam Shazeer, Apoorv Kulshreshtha, Heng-Tze Cheng, Alicia Jin, Taylor Bos, Leslie Baker, Yu Du, et al.","author":"Thoppilan Romal","year":"2022","unstructured":"Romal Thoppilan, Daniel De Freitas, Jamie Hall, Noam Shazeer, Apoorv Kulshreshtha, Heng-Tze Cheng, Alicia Jin, Taylor Bos, Leslie Baker, Yu Du, et al. 2022. Lamda: Language models for dialog applications. arXiv preprint arXiv:2201.08239 (2022)."},{"key":"e_1_3_2_2_40_1","volume-title":"Saksham Singhal, Subhojit Som, et al.","author":"Wang Wenhui","year":"2023","unstructured":"Wenhui Wang, Hangbo Bao, Li Dong, Johan Bjorck, Zhiliang Peng, Qiang Liu, Kriti Aggarwal, Owais Khan Mohammed, Saksham Singhal, Subhojit Som, et al. 2023. Image as a foreign language: Beit pretraining for vision and vision-language tasks. In CVPR. 19175--19186."},{"key":"e_1_3_2_2_41_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i01.5450"},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.1145\/3627824"},{"key":"e_1_3_2_2_43_1","doi-asserted-by":"publisher","DOI":"10.1007\/s00778-017-0491-4"},{"key":"e_1_3_2_2_44_1","first-page":"3153","article-title":"Context-aware path ranking in road networks","volume":"34","author":"Yang Sean Bin","year":"2020","unstructured":"Sean Bin Yang, Chenjuan Guo, and Bin Yang. 2020. Context-aware path ranking in road networks. IEEE Trans. Knowl. Data Eng. 34, 7 (2020), 3153--3168.","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"e_1_3_2_2_45_1","volume-title":"Jensen","author":"Yang Sean Bin","year":"2023","unstructured":"Sean Bin Yang, Jilin Hu, Chenjuan Guo, Bin Yang, and Christian S. Jensen. 2023. LightPath: Lightweight and scalable path representation learning. In KDD. ACM, 2999--3010."},{"key":"e_1_3_2_2_46_1","volume-title":"Learning to rank paths in spatial networks","author":"Yang Sean Bin","year":"2006","unstructured":"Sean Bin Yang and Bin Yang. 2020. Learning to rank paths in spatial networks. In ICDE. IEEE, 2006--2009."},{"key":"e_1_3_2_2_47_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v37i9.26290"},{"key":"e_1_3_2_2_48_1","doi-asserted-by":"crossref","unstructured":"Yuan Yuan Jingtao Ding Jie Feng Depeng Jin and Yong Li. 2024. UniST: A prompt-empowered universal model for urban spatio-temporal prediction. In KDD. 4095--4106.","DOI":"10.1145\/3637528.3671662"},{"key":"e_1_3_2_2_49_1","volume-title":"Multi-task adversarial learning for semi-supervised trajectory-user linking","author":"Zhang Sen","unstructured":"Sen Zhang, SenzhangWang, XiangWang, Shigeng Zhang, Hao Miao, and Junxing Zhu. 2022. Multi-task adversarial learning for semi-supervised trajectory-user linking. In ECML PKDD. Springer, 418--434."},{"key":"e_1_3_2_2_50_1","doi-asserted-by":"publisher","DOI":"10.14778\/3636218.3636230"},{"key":"e_1_3_2_2_51_1","first-page":"65168","article-title":"Difftraj: Generating gps trajectory with diffusion probabilistic model","volume":"36","author":"Zhu Yuanshao","year":"2023","unstructured":"Yuanshao Zhu, Yongchao Ye, Shiyao Zhang, Xiangyu Zhao, and James Yu. 2023. Difftraj: Generating gps trajectory with diffusion probabilistic model. NeurIPS 36 (2023), 65168--65188.","journal-title":"NeurIPS"},{"key":"e_1_3_2_2_52_1","volume-title":"Xiangyu Zhao, Qidong Liu, Yongchao Ye, Wei Chen, Zijian Zhang, Xuetao Wei, and Yuxuan Liang.","author":"Zhu Yuanshao","year":"2024","unstructured":"Yuanshao Zhu, James Jianqiao Yu, Xiangyu Zhao, Qidong Liu, Yongchao Ye, Wei Chen, Zijian Zhang, Xuetao Wei, and Yuxuan Liang. 2024. Controltraj: Controllable trajectory generation with topology-constrained diffusion model. In KDD. 4676--4687."}],"event":{"name":"KDD '25: The 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Toronto ON Canada","acronym":"KDD '25","sponsor":["SIGMOD ACM Special Interest Group on Management of Data","SIGKDD ACM Special Interest Group on Knowledge Discovery in Data"]},"container-title":["Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.1"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3690624.3709209","content-type":"unspecified","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3690624.3709209","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,16]],"date-time":"2025-08-16T15:46:07Z","timestamp":1755359167000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3690624.3709209"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,20]]},"references-count":52,"alternative-id":["10.1145\/3690624.3709209","10.1145\/3690624"],"URL":"https:\/\/doi.org\/10.1145\/3690624.3709209","relation":{},"subject":[],"published":{"date-parts":[[2025,7,20]]},"assertion":[{"value":"2025-07-20","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}