{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T00:47:03Z","timestamp":1765500423331,"version":"3.48.0"},"publisher-location":"New York, NY, USA","reference-count":34,"publisher":"ACM","content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,11,10]]},"DOI":"10.1145\/3746252.3760855","type":"proceedings-article","created":{"date-parts":[[2025,11,10]],"date-time":"2025-11-10T18:37:32Z","timestamp":1762799852000},"page":"4981-4985","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["Exploring Reasoning-Infused Text Embedding with Large Language Models for Zero-Shot Dense Retrieval"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0004-2015-4848","authenticated-orcid":false,"given":"Yuxiang","family":"Liu","sequence":"first","affiliation":[{"name":"University of Illinois at Urbana-Champaign, Urbana, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-7451-6153","authenticated-orcid":false,"given":"Tian","family":"Wang","sequence":"additional","affiliation":[{"name":"Amazon, Palo Alto, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0009-0872-3557","authenticated-orcid":false,"given":"Gourab","family":"Kundu","sequence":"additional","affiliation":[{"name":"Amazon, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-2194-9510","authenticated-orcid":false,"given":"Tianyu","family":"Cao","sequence":"additional","affiliation":[{"name":"Amazon, Palo Alto, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-7874-9404","authenticated-orcid":false,"given":"Guang","family":"Cheng","sequence":"additional","affiliation":[{"name":"Amazon, Los Angeles, USA"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-1525-8579","authenticated-orcid":false,"given":"Zhen","family":"Ge","sequence":"additional","affiliation":[{"name":"Amazon, New York, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-8216-2756","authenticated-orcid":false,"given":"Jianshu","family":"Chen","sequence":"additional","affiliation":[{"name":"Amazon, Palo Alto, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-6600-9804","authenticated-orcid":false,"given":"Qingjun","family":"Cui","sequence":"additional","affiliation":[{"name":"Amazon, Palo Alto, USA"}]},{"ORCID":"https:\/\/orcid.org\/0000-0001-6711-1117","authenticated-orcid":false,"given":"Trishul","family":"Chilimbi","sequence":"additional","affiliation":[{"name":"Amazon, Palo Alto, USA"}]}],"member":"320","published-online":{"date-parts":[[2025,11,10]]},"reference":[{"key":"e_1_3_2_1_1_1","volume-title":"Diogo Almeida, Janko Altenschmidt, Sam Altman, Shyamal Anadkat, et al.","author":"Achiam Josh","year":"2023","unstructured":"Josh Achiam, Steven Adler, Sandhini Agarwal, Lama Ahmad, Ilge Akkaya, Florencia Leoni Aleman, Diogo Almeida, Janko Altenschmidt, Sam Altman, Shyamal Anadkat, et al. 2023. Gpt-4 technical report. arXiv preprint arXiv:2303.08774 (2023)."},{"key":"e_1_3_2_1_2_1","volume-title":"Llm2vec: Large language models are secretly powerful text encoders. arXiv preprint arXiv:2404.05961","author":"BehnamGhader Parishad","year":"2024","unstructured":"Parishad BehnamGhader, Vaibhav Adlakha, Marius Mosbach, Dzmitry Bahdanau, Nicolas Chapados, and Siva Reddy. 2024. Llm2vec: Large language models are secretly powerful text encoders. arXiv preprint arXiv:2404.05961 (2024)."},{"key":"e_1_3_2_1_3_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19--1423"},{"key":"e_1_3_2_1_4_1","volume-title":"Recommendation systems: Principles, methods and evaluation. Egyptian informatics journal 16, 3","author":"Isinkaye Folasade Olubusola","year":"2015","unstructured":"Folasade Olubusola Isinkaye, YetundeOFolajimi, and BolandeAdefowoke Ojokoh. 2015. Recommendation systems: Principles, methods and evaluation. Egyptian informatics journal 16, 3 (2015), 261--273."},{"key":"e_1_3_2_1_5_1","doi-asserted-by":"crossref","unstructured":"Cheng Ji and Huaiying Luo. 2025. Leveraging Large Language Model for Intelligent Log Processing and Autonomous Debugging in Cloud AI Platforms. In 2025 8th International Conference on Advanced Electronic Materials Computers and Software Engineering (AEMCSE). IEEE 348--351.","DOI":"10.1109\/AEMCSE65292.2025.11042521"},{"key":"e_1_3_2_1_6_1","volume-title":"Diego de las Casas, Florian Bressand, Gianna Lengyel, Guillaume Lample, Lucile Saulnier, et al.","author":"Jiang Albert Q","year":"2023","unstructured":"Albert Q Jiang, Alexandre Sablayrolles, Arthur Mensch, Chris Bamford, Devendra Singh Chaplot, Diego de las Casas, Florian Bressand, Gianna Lengyel, Guillaume Lample, Lucile Saulnier, et al. 2023. Mistral 7B. arXiv preprint arXiv:2310.06825 (2023)."},{"key":"e_1_3_2_1_7_1","volume-title":"Scaling sentence embeddings with large language models. arXiv preprint arXiv:2307.16645","author":"Jiang Ting","year":"2023","unstructured":"Ting Jiang, Shaohan Huang, Zhongzhi Luan, Deqing Wang, and Fuzhen Zhuang. 2023. Scaling sentence embeddings with large language models. arXiv preprint arXiv:2307.16645 (2023)."},{"key":"e_1_3_2_1_8_1","doi-asserted-by":"publisher","unstructured":"Yihong Jin Ze Yang and Xinhe Xu. 2025. Scam Detection for Ethereum Smart Contracts: Leveraging Graph Representation Learning for Secure Blockchain. In 2025 4th International Symposium on Computer Applications and Information Technology (ISCAIT). 1730--1734. https:\/\/doi.org\/10.1109\/ISCAIT64916.2025.11010625","DOI":"10.1109\/ISCAIT64916.2025.11010625"},{"key":"e_1_3_2_1_9_1","volume-title":"Information retrieval on the web. ACM computing surveys (CSUR) 32, 2","author":"Kobayashi Mei","year":"2000","unstructured":"Mei Kobayashi and Koichi Takeda. 2000. Information retrieval on the web. ACM computing surveys (CSUR) 32, 2 (2000), 144--173."},{"key":"e_1_3_2_1_10_1","volume-title":"Gecko: Versatile text embeddings distilled from large language models. arXiv preprint arXiv:2403.20327","author":"Lee Jinhyuk","year":"2024","unstructured":"Jinhyuk Lee, Zhuyun Dai, Xiaoqi Ren, Blair Chen, Daniel Cer, Jeremy R Cole, Kai Hui, Michael Boratko, Rajvi Kapadia, Wen Ding, et al. 2024. Gecko: Versatile text embeddings distilled from large language models. arXiv preprint arXiv:2403.20327 (2024)."},{"key":"e_1_3_2_1_11_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2025.acl-long.1250"},{"key":"e_1_3_2_1_12_1","volume-title":"Ask To The Point: Open-Domain Entity-Centric Question Generation. In Findings of the Association for Computational Linguistics: EMNLP 2023","author":"Liu Yuxiang","year":"2023","unstructured":"Yuxiang Liu, Jie Huang, and Kevin Chen-Chuan Chang. 2023. Ask To The Point: Open-Domain Entity-Centric Question Generation. In Findings of the Association for Computational Linguistics: EMNLP 2023, Singapore, December 6--10, 2023. Association for Computational Linguistics, 2703--2716. https:\/\/doi.org\/10. 18653\/v1\/2023.findings-emnlp.178"},{"key":"e_1_3_2_1_13_1","volume-title":"Cross-Cloud Data Privacy Protection: Optimizing Collaborative Mechanisms of AI Systems by Integrating Federated Learning and LLMs. arXiv preprint arXiv:2505.13292","author":"Luo Huaiying","year":"2025","unstructured":"Huaiying Luo and Cheng Ji. 2025. Cross-Cloud Data Privacy Protection: Optimizing Collaborative Mechanisms of AI Systems by Integrating Federated Learning and LLMs. arXiv preprint arXiv:2505.13292 (2025)."},{"key":"e_1_3_2_1_14_1","volume-title":"Federated Learning-Based Data Collaboration Method for Enhancing Edge Cloud AI System Security Using Large Language Models. arXiv preprint arXiv:2506.18087","author":"Luo Huaiying","year":"2025","unstructured":"Huaiying Luo and Cheng Ji. 2025. Federated Learning-Based Data Collaboration Method for Enhancing Edge Cloud AI System Security Using Large Language Models. arXiv preprint arXiv:2506.18087 (2025)."},{"key":"e_1_3_2_1_15_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.emnlp-main.322"},{"key":"e_1_3_2_1_16_1","volume-title":"Finetuning llama for multi-stage text retrieval. arXiv preprint arXiv:2310.08319","author":"Ma Xueguang","year":"2023","unstructured":"Xueguang Ma, Liang Wang, Nan Yang, Furu Wei, and Jimmy Lin. 2023. Finetuning llama for multi-stage text retrieval. arXiv preprint arXiv:2310.08319 (2023)."},{"key":"e_1_3_2_1_17_1","volume-title":"Generative representational instruction tuning. arXiv preprint arXiv:2402.09906","author":"Muennighoff Niklas","year":"2024","unstructured":"Niklas Muennighoff, Hongjin Su, LiangWang, Nan Yang, FuruWei, Tao Yu, Amanpreet Singh, and Douwe Kiela. 2024. Generative representational instruction tuning. arXiv preprint arXiv:2402.09906 (2024)."},{"key":"e_1_3_2_1_18_1","doi-asserted-by":"publisher","DOI":"10.1109\/ACCESS.2023.3266377"},{"key":"e_1_3_2_1_19_1","volume-title":"Repetition improves language model embeddings. arXiv preprint arXiv:2402.15449","author":"Springer Jacob Mitchell","year":"2024","unstructured":"Jacob Mitchell Springer, Suhas Kotha, Daniel Fried, Graham Neubig, and Aditi Raghunathan. 2024. Repetition improves language model embeddings. arXiv preprint arXiv:2402.15449 (2024)."},{"key":"e_1_3_2_1_20_1","volume-title":"BRIGHT: A Realistic and Challenging Benchmark for Reasoning-Intensive Retrieval. arXiv preprint arXiv:2407.12883","author":"Su Hongjin","year":"2024","unstructured":"Hongjin Su, Howard Yen, Mengzhou Xia,Weijia Shi, Niklas Muennighoff, Han-yu Wang, Haisu Liu, Quan Shi, Zachary S Siegel, Michael Tang, et al. 2024. BRIGHT: A Realistic and Challenging Benchmark for Reasoning-Intensive Retrieval. arXiv preprint arXiv:2407.12883 (2024)."},{"key":"e_1_3_2_1_21_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.acllong"},{"key":"e_1_3_2_1_22_1","volume-title":"BlendFilter: Advancing Retrieval- Augmented Large Language Models via Query Generation Blending and Knowledge Filtering. arXiv preprint arXiv:2402.11129","author":"Wang Haoyu","year":"2024","unstructured":"Haoyu Wang, Tuo Zhao, and Jing Gao. 2024. BlendFilter: Advancing Retrieval- Augmented Large Language Models via Query Generation Blending and Knowledge Filtering. arXiv preprint arXiv:2402.11129 (2024)."},{"key":"e_1_3_2_1_23_1","volume-title":"Text embeddings by weakly-supervised contrastive pre-training. arXiv preprint arXiv:2212.03533","author":"Wang Liang","year":"2022","unstructured":"Liang Wang, Nan Yang, Xiaolong Huang, Binxing Jiao, Linjun Yang, Daxin Jiang, Rangan Majumder, and Furu Wei. 2022. Text embeddings by weakly-supervised contrastive pre-training. arXiv preprint arXiv:2212.03533 (2022)."},{"key":"e_1_3_2_1_24_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.acl-long.642"},{"key":"e_1_3_2_1_25_1","volume-title":"RAR-b: Reasoning as Retrieval Benchmark. arXiv preprint arXiv:2404.06347","author":"Xiao Chenghao","year":"2024","unstructured":"Chenghao Xiao, G Thomas Hudson, and Noura Al Moubayed. 2024. RAR-b: Reasoning as Retrieval Benchmark. arXiv preprint arXiv:2404.06347 (2024)."},{"key":"e_1_3_2_1_26_1","doi-asserted-by":"publisher","DOI":"10.1145\/3627673.3679071"},{"key":"e_1_3_2_1_27_1","volume-title":"The Second Tiny Papers Track at ICLR","author":"Xu Han","year":"2024","unstructured":"Han Xu, Jingyang Ye, Yutong Li, and Haipeng Chen. 2024. Can Speculative Sampling Accelerate ReAct Without Compromising Reasoning Quality?. In The Second Tiny Papers Track at ICLR 2024. https:\/\/openreview.net\/forum?id=42b9hJrIpX"},{"key":"e_1_3_2_1_28_1","volume-title":"Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing: Industry Track. 1433--1443","author":"Xu Han","year":"2024","unstructured":"Han Xu, Ruining Zhao, Jindong Wang, and Haipeng Chen. 2024. RESTful-Llama: Connecting User Queries to RESTful APIs. In Proceedings of the 2024 Conference on Empirical Methods in Natural Language Processing: Industry Track. 1433--1443."},{"key":"e_1_3_2_1_29_1","doi-asserted-by":"publisher","DOI":"10.1109\/CISCE65916.2025.11065413"},{"key":"e_1_3_2_1_30_1","volume-title":"Hades: Hardware accelerated decoding for efficient speculation in large language models. arXiv preprint arXiv:2412.19925","author":"Yang Ze","year":"2024","unstructured":"Ze Yang, Yihong Jin, and Xinhe Xu. 2024. Hades: Hardware accelerated decoding for efficient speculation in large language models. arXiv preprint arXiv:2412.19925 (2024)."},{"key":"e_1_3_2_1_31_1","volume-title":"Chain-of-note: Enhancing robustness in retrieval-augmented language models. arXiv preprint arXiv:2311.09210","author":"Yu Wenhao","year":"2023","unstructured":"Wenhao Yu, Hongming Zhang, Xiaoman Pan, Kaixin Ma, Hongwei Wang, and Dong Yu. 2023. Chain-of-note: Enhancing robustness in retrieval-augmented language models. arXiv preprint arXiv:2311.09210 (2023)."},{"key":"e_1_3_2_1_32_1","doi-asserted-by":"publisher","DOI":"10.1007\/978-981-97-5669-8_5"},{"key":"e_1_3_2_1_33_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.naacl-long.96"},{"key":"e_1_3_2_1_34_1","volume-title":"PromptReps: Prompting Large Language Models to Generate Dense and Sparse Representations for Zero-Shot Document Retrieval. arXiv preprint arXiv:2404.18424","author":"Zhuang Shengyao","year":"2024","unstructured":"Shengyao Zhuang, Xueguang Ma, Bevan Koopman, Jimmy Lin, and Guido Zuccon. 2024. PromptReps: Prompting Large Language Models to Generate Dense and Sparse Representations for Zero-Shot Document Retrieval. arXiv preprint arXiv:2404.18424 (2024)."}],"event":{"name":"CIKM '25: The 34th ACM International Conference on Information and Knowledge Management","sponsor":["SIGIR ACM Special Interest Group on Information Retrieval","SIGWEB ACM Special Interest Group on Hypertext, Hypermedia, and Web"],"location":"Seoul Republic of Korea","acronym":"CIKM '25"},"container-title":["Proceedings of the 34th ACM International Conference on Information and Knowledge Management"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3746252.3760855","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,12,12]],"date-time":"2025-12-12T00:44:00Z","timestamp":1765500240000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3746252.3760855"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,11,10]]},"references-count":34,"alternative-id":["10.1145\/3746252.3760855","10.1145\/3746252"],"URL":"https:\/\/doi.org\/10.1145\/3746252.3760855","relation":{},"subject":[],"published":{"date-parts":[[2025,11,10]]},"assertion":[{"value":"2025-11-10","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}