{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T12:40:01Z","timestamp":1755866401563,"version":"3.44.0"},"publisher-location":"New York, NY, USA","reference-count":37,"publisher":"ACM","funder":[{"name":"Quan Cheng Laboratory","award":["Grant No. QCLZD202301"],"award-info":[{"award-number":["Grant No. QCLZD202301"]}]},{"name":"Natural Science Foundation of China","award":["Grant No. U21B2026, 62372260"],"award-info":[{"award-number":["Grant No. U21B2026, 62372260"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,7,13]]},"DOI":"10.1145\/3726302.3730311","type":"proceedings-article","created":{"date-parts":[[2025,7,14]],"date-time":"2025-07-14T01:38:52Z","timestamp":1752457132000},"page":"3772-3781","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["U-Sticker: A Large-Scale Multi-Domain User Sticker Dataset for Retrieval and Personalization"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0006-5562-5878","authenticated-orcid":false,"given":"Heng Er Metilda","family":"Chee","sequence":"first","affiliation":[{"name":"DCST, Tsinghua University, Beijing, China and Quan Cheng Laboratory, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8875-1850","authenticated-orcid":false,"given":"Jiayin","family":"Wang","sequence":"additional","affiliation":[{"name":"DCST, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-9393-4854","authenticated-orcid":false,"given":"Zhiqiang","family":"Guo","sequence":"additional","affiliation":[{"name":"DCST, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-5604-7527","authenticated-orcid":false,"given":"Weizhi","family":"Ma","sequence":"additional","affiliation":[{"name":"AIR, Tsinghua University, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-1552-9033","authenticated-orcid":false,"given":"Qinglang","family":"Guo","sequence":"additional","affiliation":[{"name":"CETC Academy of Electronics and Information Technology Group Co.,Ltd; China Academic of Electronics and Information Technology, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0003-3158-1920","authenticated-orcid":false,"given":"Min","family":"Zhang","sequence":"additional","affiliation":[{"name":"DSCT, Tsinghua University, Beijing, China and Quan Cheng Laboratory, Jinan, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,7,13]]},"reference":[{"key":"e_1_3_2_1_1_1","unstructured":"[n.d.]. Power laws Pareto distributions and Zipf's law. ([n.d.])."},{"key":"e_1_3_2_1_2_1","unstructured":"[n.d.]. Telegram Terms of Service. https:\/\/telegram.org\/tos. Accessed: 2025-02-19."},{"key":"e_1_3_2_1_3_1","unstructured":"Falcon AI. 2024. NSFW Image Detection. https:\/\/huggingface.co\/Falconsai\/nsfw_image_detection. https:\/\/huggingface.co\/Falconsai\/nsfw_image_detection Accessed: 2024-02-16."},{"key":"e_1_3_2_1_4_1","volume-title":"Deep Learning Models for Multilingual Hate Speech Detection. arXiv preprint arXiv:2004.06465","author":"Aluru Sai Saket","year":"2020","unstructured":"Sai Saket Aluru, Binny Mathew, Punyajoy Saha, and Animesh Mukherjee. 2020. Deep Learning Models for Multilingual Hate Speech Detection. arXiv preprint arXiv:2004.06465 (2020)."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"publisher","DOI":"10.1145\/2701415"},{"key":"e_1_3_2_1_6_1","volume-title":"Detecting Inappropriate Messages on Sensitive Topics that Could Harm a Company's Reputation. arXiv preprint arXiv:2103.05345","author":"Babakov Nikolay","year":"2021","unstructured":"Nikolay Babakov, Varvara Logacheva, Olga Kozlova, Nikita Semenov, and Alexander Panchenko. 2021. Detecting Inappropriate Messages on Sensitive Topics that Could Harm a Company's Reputation. arXiv preprint arXiv:2103.05345 (2021)."},{"key":"e_1_3_2_1_7_1","volume-title":"Tweeteval: Unified benchmark and comparative evaluation for tweet classification. arXiv preprint arXiv:2010.12421","author":"Barbieri Francesco","year":"2020","unstructured":"Francesco Barbieri, Jose Camacho-Collados, Leonardo Neves, and Luis Espinosa-Anke. 2020. Tweeteval: Unified benchmark and comparative evaluation for tweet classification. arXiv preprint arXiv:2010.12421 (2020)."},{"volume-title":"https:\/\/github.com\/Benau\/tgsconverter Accessed","year":"2025","key":"e_1_3_2_1_8_1","unstructured":"Benau. 2025. TGSConverter. https:\/\/github.com\/Benau\/tgsconverter Accessed: February 15, 2025."},{"key":"e_1_3_2_1_9_1","volume-title":"PerSRV: Personalized Sticker Retrieval with Vision-Language Model. arXiv preprint arXiv:2410.21801","author":"Metilda Chee Heng Er","year":"2024","unstructured":"Heng Er Metilda Chee, Jiayin Wang, Zhiqiang Guo, Weizhi Ma, and Min Zhang. 2024. PerSRV: Personalized Sticker Retrieval with Vision-Language Model. arXiv preprint arXiv:2410.21801 (2024)."},{"key":"e_1_3_2_1_10_1","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3681522"},{"key":"e_1_3_2_1_11_1","unstructured":"Adam Codd. 2024. ViT-Base NSFW Detector. https:\/\/huggingface.co\/AdamCodd\/vit-base-nsfw-detector. https:\/\/huggingface.co\/AdamCodd\/vit-base-nsfwdetector Accessed: 2024-02-16."},{"key":"e_1_3_2_1_12_1","volume-title":"Unsupervised cross-lingual representation learning at scale. arXiv preprint arXiv:1911.02116","author":"Conneau A","year":"2019","unstructured":"A Conneau. 2019. Unsupervised cross-lingual representation learning at scale. arXiv preprint arXiv:1911.02116 (2019)."},{"key":"e_1_3_2_1_13_1","volume-title":"Racial bias in hate speech and abusive language detection datasets. arXiv preprint arXiv:1905.12516","author":"Davidson Thomas","year":"2019","unstructured":"Thomas Davidson, Debasmita Bhattacharya, and Ingmar Weber. 2019. Racial bias in hate speech and abusive language detection datasets. arXiv preprint arXiv:1905.12516 (2019)."},{"key":"e_1_3_2_1_14_1","volume-title":"COLD: A benchmark for Chinese offensive language detection. arXiv preprint arXiv:2201.06025","author":"Deng Jiawen","year":"2022","unstructured":"Jiawen Deng, Jingyan Zhou, Hao Sun, Chujie Zheng, Fei Mi, Helen Meng, and Minlie Huang. 2022. COLD: A benchmark for Chinese offensive language detection. arXiv preprint arXiv:2201.06025 (2022)."},{"key":"e_1_3_2_1_15_1","volume-title":"Accessed","author":"Exo Lonami","year":"2025","unstructured":"Lonami Exo. 2025. Telethon Documentation. https:\/\/tl.telethon.dev\/. Accessed: February 15, 2025."},{"key":"e_1_3_2_1_16_1","volume-title":"Towards expressive communication with internet memes: A new multimodal conversation dataset and benchmark. arXiv preprint arXiv:2109.01839","author":"Fei Zhengcong","year":"2021","unstructured":"Zhengcong Fei, Zekang Li, Jinchao Zhang, Yang Feng, and Jie Zhou. 2021. Towards expressive communication with internet memes: A new multimodal conversation dataset and benchmark. arXiv preprint arXiv:2109.01839 (2021)."},{"key":"e_1_3_2_1_17_1","doi-asserted-by":"publisher","DOI":"10.1145\/3366423.3380191"},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1145\/3429980"},{"key":"e_1_3_2_1_19_1","volume-title":"Proceedings of the 29th International Conference on Computational Linguistics. 6795-6804","author":"Ge Feng","year":"2022","unstructured":"Feng Ge, Weizhao Li, Haopeng Ren, and Yi Cai. 2022. Towards exploiting sticker for multimodal sentiment analysis in social media: A new dataset and baseline. In Proceedings of the 29th International Conference on Computational Linguistics. 6795-6804."},{"key":"e_1_3_2_1_20_1","doi-asserted-by":"publisher","unstructured":"Giacomo Arienti. 2024. nsfw-classifier (Revision 4c8d67f). https:\/\/doi.org\/10.57967\/hf\/2906","DOI":"10.57967\/hf\/2906"},{"key":"e_1_3_2_1_21_1","unstructured":"Jarano Haal. 2024. ViT-Base Violence Detection. https:\/\/huggingface.co\/ jaranohaal\/vit-base-violence-detection. https:\/\/huggingface.co\/jaranohaal\/vitbase-violence-detection Accessed: 2024-02-16."},{"key":"e_1_3_2_1_22_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v34i08.7019"},{"key":"e_1_3_2_1_23_1","doi-asserted-by":"publisher","DOI":"10.1145\/3545862.3545889"},{"key":"e_1_3_2_1_24_1","unstructured":"Bin Liang Bingbing Wang Zhixin Bai Qiwei Lang Mingwei Sun Kaiheng Hou Lanjun Zhou Ruifeng Xu and Kam-Fai Wong. 2024. Reply with Sticker: New Dataset and Model for Sticker Retrieval. arXiv:2403.05427 [cs.MM] https:\/\/arxiv.org\/abs\/2403.05427"},{"key":"e_1_3_2_1_25_1","unstructured":"Haotian Liu Chunyuan Li QingyangWu and Yong Jae Lee. 2023. Visual Instruction Tuning. In NeurIPS."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3503161.3548407"},{"key":"e_1_3_2_1_27_1","doi-asserted-by":"publisher","DOI":"10.1145\/3589334.3645633"},{"key":"e_1_3_2_1_28_1","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3680978"},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1145\/363347.363387"},{"key":"e_1_3_2_1_30_1","volume-title":"Towards Real-World Stickers Use: A New Dataset for Multi-Tag Sticker Recognition. arXiv preprint arXiv:2403.05428","author":"Wang Bingbing","year":"2024","unstructured":"Bingbing Wang, Bin Liang, Chun-Mei Feng, Wangmeng Zuo, Zhixin Bai, Shijue Huang, Kam-Fai Wong, Xi Zeng, and Ruifeng Xu. 2024. Towards Real-World Stickers Use: A New Dataset for Multi-Tag Sticker Recognition. arXiv preprint arXiv:2403.05428 (2024)."},{"key":"e_1_3_2_1_31_1","doi-asserted-by":"publisher","DOI":"10.1038\/sdata.2016.18"},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1145\/3664647.3680987"},{"key":"e_1_3_2_1_33_1","volume-title":"Personalized Image Generation with Large Multimodal Models. arXiv preprint arXiv:2410.14170","author":"Xu Yiyan","year":"2024","unstructured":"Yiyan Xu, Wenjie Wang, Yang Zhang, Tang Biao, Peng Yan, Fuli Feng, and Xiangnan He. 2024. Personalized Image Generation with Large Multimodal Models. arXiv preprint arXiv:2410.14170 (2024)."},{"key":"e_1_3_2_1_34_1","volume-title":"StickerConv: Generating Multimodal Empathetic Responses from Scratch. arXiv preprint arXiv:2402.01679","author":"Zhang Yiqun","year":"2024","unstructured":"Yiqun Zhang, Fanheng Kong, Peidong Wang, Shuang Sun, Lingshuai Wang, Shi Feng, Daling Wang, Yifei Zhang, and Kaisong Song. 2024. StickerConv: Generating Multimodal Empathetic Responses from Scratch. arXiv preprint arXiv:2402.01679 (2024)."},{"key":"e_1_3_2_1_35_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.findings-acl.241"},{"key":"e_1_3_2_1_36_1","volume-title":"Sticker820k: Empowering interactive retrieval with stickers. arXiv preprint arXiv:2306.06870","author":"Zhao Sijie","year":"2023","unstructured":"Sijie Zhao, Yixiao Ge, Zhongang Qi, Lin Song, Xiaohan Ding, Zehua Xie, and Ying Shan. 2023. Sticker820k: Empowering interactive retrieval with stickers. arXiv preprint arXiv:2306.06870 (2023)."},{"volume-title":"Human behavior and the principle of least effort: An introduction to human ecology","author":"Zipf George Kingsley","key":"e_1_3_2_1_37_1","unstructured":"George Kingsley Zipf. 1949. Human behavior and the principle of least effort: An introduction to human ecology. Addison-Wesley Press."}],"event":{"name":"SIGIR '25: The 48th International ACM SIGIR Conference on Research and Development in Information Retrieval","sponsor":["SIGIR ACM Special Interest Group on Information Retrieval"],"location":"Padua Italy","acronym":"SIGIR '25"},"container-title":["Proceedings of the 48th International ACM SIGIR Conference on Research and Development in Information Retrieval"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3726302.3730311","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T12:11:27Z","timestamp":1755864687000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3726302.3730311"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,7,13]]},"references-count":37,"alternative-id":["10.1145\/3726302.3730311","10.1145\/3726302"],"URL":"https:\/\/doi.org\/10.1145\/3726302.3730311","relation":{},"subject":[],"published":{"date-parts":[[2025,7,13]]},"assertion":[{"value":"2025-07-13","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}