{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,5,4]],"date-time":"2026-05-04T05:49:40Z","timestamp":1777873780476,"version":"3.51.4"},"publisher-location":"New York, NY, USA","reference-count":46,"publisher":"ACM","funder":[{"DOI":"10.13039\/501100006374","name":"National Natural Science Foundation of China","doi-asserted-by":"publisher","award":["62302059,62172053"],"award-info":[{"award-number":["62302059,62172053"]}],"id":[{"id":"10.13039\/501100006374","id-type":"DOI","asserted-by":"publisher"}]},{"DOI":"10.13039\/501100006374","name":"National Key Research and Development Program of China","doi-asserted-by":"publisher","award":["Grant 2022YFC3303301, Grant 2023YFC3305401, Grant 2023YFC3305402"],"award-info":[{"award-number":["Grant 2022YFC3303301, Grant 2023YFC3305401, Grant 2023YFC3305402"]}],"id":[{"id":"10.13039\/501100006374","id-type":"DOI","asserted-by":"publisher"}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,8,3]]},"DOI":"10.1145\/3711896.3737219","type":"proceedings-article","created":{"date-parts":[[2025,8,3]],"date-time":"2025-08-03T21:04:26Z","timestamp":1754255066000},"page":"5117-5128","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":4,"title":["FinBERT2: A Specialized Bidirectional Encoder for Bridging the Gap in Finance-Specific Deployment of Large Language Models"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0009-0007-1326-4282","authenticated-orcid":false,"given":"Xuan","family":"Xu","sequence":"first","affiliation":[{"name":"Beijing University of Posts and Telecommunications, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-0034-7191","authenticated-orcid":false,"given":"Fufang","family":"Wen","sequence":"additional","affiliation":[{"name":"Beijing Value Simplex Technology Co. Ltd., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-3024-0983","authenticated-orcid":false,"given":"Beilin","family":"Chu","sequence":"additional","affiliation":[{"name":"Beijing University of Posts and Telecommunications, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0000-3898-4306","authenticated-orcid":false,"given":"Zhibing","family":"Fu","sequence":"additional","affiliation":[{"name":"Beijing Value Simplex Technology Co. Ltd., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-6651-2866","authenticated-orcid":false,"given":"Qinhong","family":"Lin","sequence":"additional","affiliation":[{"name":"Beijing University of Posts and Telecommunications, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-8058-0649","authenticated-orcid":false,"given":"Jiaqi","family":"Liu","sequence":"additional","affiliation":[{"name":"Beijing Value Simplex Technology Co. Ltd., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0007-9719-1147","authenticated-orcid":false,"given":"Binjie","family":"Fei","sequence":"additional","affiliation":[{"name":"Beijing Value Simplex Technology Co. Ltd., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-5528-7606","authenticated-orcid":false,"given":"Yu","family":"Li","sequence":"additional","affiliation":[{"name":"Beijing Value Simplex Technology Co. Ltd., Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0009-0004-0727-2436","authenticated-orcid":false,"given":"Linna","family":"Zhou","sequence":"additional","affiliation":[{"name":"Beijing University of Posts and Telecommunications, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]},{"ORCID":"https:\/\/orcid.org\/0000-0002-8027-9560","authenticated-orcid":false,"given":"Zhongliang","family":"Yang","sequence":"additional","affiliation":[{"name":"Beijing University of Posts and Telecommunications, Beijing, China"}],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"320","published-online":{"date-parts":[[2025,8,3]]},"reference":[{"key":"e_1_3_2_2_1_1","unstructured":"Dimo Angelov. 2020. Top2vec: Distributed representations of topics. arXiv preprint arXiv:2008.09470(2020)."},{"key":"e_1_3_2_2_2_1","unstructured":"Dogu Araci. 2019. FinBERT: Financial Sentiment Analysis with Pre-Trained Language Models. https:\/\/arxiv.org\/abs\/1908.10063"},{"key":"e_1_3_2_2_3_1","volume-title":"Hasan Cavusoglu, and Muhammad Abdul-Mageed.","author":"Bhatia Gagan","year":"2024","unstructured":"Gagan Bhatia, El Moatez Billah Nagoudi, Hasan Cavusoglu, and Muhammad Abdul-Mageed. 2024. FinTral: A Family of GPT-4 Level Multimodal Financial Large Language Models. https:\/\/arxiv.org\/abs\/2402.10986"},{"key":"e_1_3_2_2_4_1","unstructured":"Rishi Bommasani Drew A Hudson Ehsan Adeli Russ Altman Simran Arora Sydney von Arx Michael S Bernstein Jeannette Bohg Antoine Bosselut Emma Brunskill et al. 2021. On the opportunities and risks of foundation models. arXiv preprint arXiv:2108.07258(2021)."},{"key":"e_1_3_2_2_5_1","unstructured":"Wei-Cheng Chang Felix X Yu Yin-Wen Chang Yiming Yang and Sanjiv Kumar. 2020. Pre-training tasks for embedding-based large-scale retrieval. arXiv preprint arXiv:2002.03932(2020)."},{"key":"e_1_3_2_2_6_1","doi-asserted-by":"publisher","DOI":"10.1109\/TASLP.2021.3124365"},{"key":"e_1_3_2_2_7_1","doi-asserted-by":"publisher","unstructured":"Desola. 2019. FinBERT: Pre-Trained Model on SEC Filings for Financial Natural Language Tasks. doi:10.13140\/RG.2.2.19153.89442","DOI":"10.13140\/RG.2.2.19153.89442"},{"key":"e_1_3_2_2_8_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/N19-1423"},{"key":"e_1_3_2_2_9_1","unstructured":"Maarten Grootendorst. 2022. BERTopic: Neural topic modeling with a class-based TF-IDF procedure. arXiv:2203.05794 [cs.CL] https:\/\/arxiv.org\/abs\/2203.05794"},{"key":"e_1_3_2_2_10_1","unstructured":"Panpan Hou Mengchao Zhang Zhibing Fu and Yu Li. 2020. FinBERT. https:\/\/github.com\/valuesimplex\/FinBERT."},{"key":"e_1_3_2_2_11_1","doi-asserted-by":"publisher","DOI":"10.1609\/aaai.v38i20.30214"},{"key":"e_1_3_2_2_12_1","doi-asserted-by":"publisher","DOI":"10.1111\/1911-3846.12832"},{"key":"e_1_3_2_2_13_1","doi-asserted-by":"publisher","DOI":"10.1145\/3394486.3403305"},{"key":"e_1_3_2_2_14_1","unstructured":"IDEA-CCNL. 2021. Fengshenbang-LM. https:\/\/github.com\/IDEA-CCNL\/Fengshenbang-LM."},{"key":"e_1_3_2_2_15_1","doi-asserted-by":"publisher","DOI":"10.1145\/3677052.3698618"},{"key":"e_1_3_2_2_16_1","doi-asserted-by":"crossref","unstructured":"Vladimir Karpukhin Barlas O\u011fuz Sewon Min Patrick Lewis Ledell Wu Sergey Edunov Danqi Chen and Wen-tau Yih. 2020. Dense passage retrieval for open-domain question answering. arXiv preprint arXiv:2004.04906(2020).","DOI":"10.18653\/v1\/2020.emnlp-main.550"},{"key":"e_1_3_2_2_17_1","doi-asserted-by":"publisher","DOI":"10.1016\/j.inffus.2023.101861"},{"key":"e_1_3_2_2_18_1","unstructured":"Thanos Konstantinidis Giorgos Iacovides Mingxue Xu Tony G. Constantinides and Danilo Mandic. 2024. FinLlama: Financial Sentiment Classification for Algorithmic Trading Applications. https:\/\/arxiv.org\/abs\/2403.12285"},{"key":"e_1_3_2_2_19_1","unstructured":"G Lample. 2019. Cross-lingual language model pretraining. arXiv preprint arXiv:1901.07291(2019)."},{"key":"e_1_3_2_2_20_1","unstructured":"Kenton Lee Ming-Wei Chang and Kristina Toutanova. 2019. Latent retrieval for weakly supervised open domain question answering. arXiv preprint arXiv:1906.00300(2019)."},{"key":"e_1_3_2_2_21_1","first-page":"9459","article-title":"Retrieval-augmented generation for knowledge-intensive nlp tasks","volume":"33","author":"Lewis Patrick","year":"2020","unstructured":"Patrick Lewis, Ethan Perez, Aleksandra Piktus, Fabio Petroni, Vladimir Karpukhin, Naman Goyal, Heinrich K\u00fcttler, Mike Lewis, Wen-tau Yih, Tim Rockt\u00e4schel, et al., 2020. Retrieval-augmented generation for knowledge-intensive nlp tasks. Advances in Neural Information Processing Systems, Vol. 33 (2020), 9459-9474.","journal-title":"Advances in Neural Information Processing Systems"},{"key":"e_1_3_2_2_22_1","unstructured":"Yinhan Liu Myle Ott Naman Goyal Jingfei Du Mandar Joshi Danqi Chen Omer Levy M. Lewis Luke Zettlemoyer and Veselin Stoyanov. 2019. RoBERTa: A Robustly Optimized BERT Pretraining Approach. ArXiv(2019)."},{"key":"e_1_3_2_2_23_1","unstructured":"Ilya Loshchilov Barlas O\u011fuz Sewon Min Patrick Lewis Ledell Wu Sergey Edunov Danqi Chen and Wen-tau Yih. 2017. Fixing weight decay regularization in adam. arXiv preprint arXiv:1711.05101(2017)."},{"key":"e_1_3_2_2_24_1","doi-asserted-by":"publisher","DOI":"10.1145\/3626772.3657792"},{"key":"e_1_3_2_2_25_1","doi-asserted-by":"publisher","DOI":"10.1017\/S0022109022001181"},{"key":"e_1_3_2_2_26_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2023.eacl-main.148"},{"key":"e_1_3_2_2_27_1","unstructured":"Pandu Nayak. 2019. Understanding searches better than ever before. https:\/\/blog.google\/products\/search\/search-language-understanding-bert\/ Accessed: 2025-01-05."},{"key":"e_1_3_2_2_28_1","volume-title":"Jerry Tworek, Qiming Yuan, Nikolas Tezak, Jong Wook Kim, Chris Hallacy, et al.","author":"Neelakantan Arvind","year":"2022","unstructured":"Arvind Neelakantan, Tao Xu, Raul Puri, Alec Radford, Jesse Michael Han, Jerry Tworek, Qiming Yuan, Nikolas Tezak, Jong Wook Kim, Chris Hallacy, et al., 2022. Text and code embeddings by contrastive pre-training. arXiv preprint arXiv:2201.10005(2022)."},{"key":"e_1_3_2_2_29_1","unstructured":"Inc. NetEase Youdao. 2023. BCEmbedding: Bilingual and Crosslingual Embedding for RAG. https:\/\/github.com\/netease-youdao\/BCEmbedding."},{"key":"e_1_3_2_2_30_1","unstructured":"Aaron van den Oord Yazhe Li and Oriol Vinyals. 2018. Representation learning with contrastive predictive coding. arXiv preprint arXiv:1807.03748(2018)."},{"key":"e_1_3_2_2_31_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2024.findings-acl.967"},{"key":"e_1_3_2_2_32_1","doi-asserted-by":"publisher","DOI":"10.1109\/ICASSP.2012.6289079"},{"key":"e_1_3_2_2_33_1","volume-title":"One Embedder","author":"Su Hongjin","unstructured":"Hongjin Su, Weijia Shi, Jungo Kasai, Yizhong Wang, Yushi Hu, Mari Ostendorf, Wen-tau Yih, Noah A. Smith, Luke Zettlemoyer, and Tao Yu. 2022. One Embedder, Any Task: Instruction-Finetuned Text Embeddings. https:\/\/arxiv.org\/abs\/2212.09741"},{"key":"e_1_3_2_2_34_1","unstructured":"Yixuan Tang and Yi Yang. 2025. Do We Need Domain-Specific Embedding Models? An Empirical Investigation. arXiv:2409.18511 [cs.CL] https:\/\/arxiv.org\/abs\/2409.18511"},{"key":"e_1_3_2_2_35_1","volume-title":"Beir: A heterogenous benchmark for zero-shot evaluation of information retrieval models. arXiv preprint arXiv:2104.08663(2021).","author":"Thakur Nandan","year":"2021","unstructured":"Nandan Thakur, Nils Reimers, Andreas R\u00fcckl\u00e9, Abhishek Srivastava, and Iryna Gurevych. 2021. Beir: A heterogenous benchmark for zero-shot evaluation of information retrieval models. arXiv preprint arXiv:2104.08663(2021)."},{"key":"e_1_3_2_2_36_1","unstructured":"Liang Wang Nan Yang Xiaolong Huang Binxing Jiao Linjun Yang Daxin Jiang Rangan Majumder and Furu Wei. 2022b. Text Embeddings by Weakly-Supervised Contrastive Pre-Training. https:\/\/arxiv.org\/abs\/2212.03533"},{"key":"e_1_3_2_2_37_1","unstructured":"Neng Wang Hongyang Yang and Christina Dan Wang. 2023b. FinGPT: Instruction Tuning Benchmark for Open-Source Large Language Models in Financial Datasets. https:\/\/arxiv.org\/abs\/2310.04793"},{"key":"e_1_3_2_2_38_1","volume-title":"International Conference on Machine Learning. PMLR, 22964-22984","author":"Wang Thomas","year":"2022","unstructured":"Thomas Wang, Adam Roberts, Daniel Hesslow, Teven Le Scao, Hyung Won Chung, Iz Beltagy, Julien Launay, and Colin Raffel. 2022a. What language model architecture and pretraining objective works best for zero-shot generalization?. In International Conference on Machine Learning. PMLR, 22964-22984."},{"key":"e_1_3_2_2_39_1","unstructured":"Yuxin Wang Qingxuan Sun and Sicheng He. 2023a. M3E: Moka Massive Mixed Embedding Model . Moka Massive Mixed Embedding."},{"key":"e_1_3_2_2_40_1","doi-asserted-by":"crossref","unstructured":"Benjamin Warner Antoine Chaffin Benjamin Clavi\u00e9 Orion Weller Oskar Hallstr\u00f6m Said Taghadouini Alexis Gallagher Raja Biswas Faisal Ladhak Tom Aarsen et al. 2024. Smarter better faster longer: A modern bidirectional encoder for fast memory efficient and long context finetuning and inference. arXiv preprint arXiv:2412.13663(2024).","DOI":"10.18653\/v1\/2025.acl-long.127"},{"key":"e_1_3_2_2_41_1","unstructured":"Shijie Wu Ozan Irsoy Steven Lu Vadim Dabravolski Mark Dredze Sebastian Gehrmann Prabhanjan Kambadur David Rosenberg and Gideon Mann. 2023. BloombergGPT: A Large Language Model for Finance. https:\/\/arxiv.org\/abs\/2303.17564"},{"key":"e_1_3_2_2_42_1","doi-asserted-by":"publisher","DOI":"10.18653\/v1\/2022.emnlp-main.35"},{"key":"e_1_3_2_2_43_1","unstructured":"Shitao Xiao Zheng Liu Peitian Zhang and Niklas Muennighof. 2023. C-Pack: Packaged Resources To Advance General Chinese Embedding. https:\/\/arxiv.org\/abs\/2309.07597"},{"key":"e_1_3_2_2_44_1","volume-title":"International Conference on Machine Learning. PMLR, 26176-26192","author":"Zhang Biao","year":"2022","unstructured":"Biao Zhang, Behrooz Ghorbani, Ankur Bapna, Yong Cheng, Xavier Garcia, Jonathan Shen, and Orhan Firat. 2022. Examining scaling and transfer of language model architectures for machine translation. In International Conference on Machine Learning. PMLR, 26176-26192."},{"key":"e_1_3_2_2_45_1","doi-asserted-by":"publisher","DOI":"10.1145\/3583780.3615285"},{"key":"e_1_3_2_2_46_1","volume-title":"Mengzi: Towards Lightweight yet Ingenious Pre-Trained Models for Chinese. https:\/\/arxiv.org\/abs\/2110.06696","author":"Zhang Zhuosheng","year":"2021","unstructured":"Zhuosheng Zhang, Hanqing Zhang, Keming Chen, Yuhang Guo, Jingyun Hua, Yulong Wang, and Ming Zhou. 2021. Mengzi: Towards Lightweight yet Ingenious Pre-Trained Models for Chinese. https:\/\/arxiv.org\/abs\/2110.06696"}],"event":{"name":"KDD '25: The 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining","location":"Toronto ON Canada","acronym":"KDD '25","sponsor":["SIGKDD ACM Special Interest Group on Knowledge Discovery in Data","SIGMOD ACM Special Interest Group on Management of Data"]},"container-title":["Proceedings of the 31st ACM SIGKDD Conference on Knowledge Discovery and Data Mining V.2"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3711896.3737219","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,4,30]],"date-time":"2026-04-30T18:20:39Z","timestamp":1777573239000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3711896.3737219"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,3]]},"references-count":46,"alternative-id":["10.1145\/3711896.3737219","10.1145\/3711896"],"URL":"https:\/\/doi.org\/10.1145\/3711896.3737219","relation":{},"subject":[],"published":{"date-parts":[[2025,8,3]]},"assertion":[{"value":"2025-08-03","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}