{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2026,1,29]],"date-time":"2026-01-29T19:23:23Z","timestamp":1769714603253,"version":"3.49.0"},"publisher-location":"New York, NY, USA","reference-count":11,"publisher":"ACM","funder":[{"name":"Research Program of Shandong University of Political Science and Law","award":["2023Z07B"],"award-info":[{"award-number":["2023Z07B"]}]},{"name":"Research Program of Shandong University of Political Science and Law","award":["2024KZ13Z"],"award-info":[{"award-number":["2024KZ13Z"]}]}],"content-domain":{"domain":["dl.acm.org"],"crossmark-restriction":true},"short-container-title":[],"published-print":{"date-parts":[[2025,10,29]]},"DOI":"10.1145\/3778265.3778274","type":"proceedings-article","created":{"date-parts":[[2026,1,29]],"date-time":"2026-01-29T07:25:21Z","timestamp":1769671521000},"page":"63-68","update-policy":"https:\/\/doi.org\/10.1145\/crossmark-policy","source":"Crossref","is-referenced-by-count":0,"title":["A fast and parallel framework for massive sensitive data detection based on big data technologies and large language models (LLMs)"],"prefix":"10.1145","author":[{"ORCID":"https:\/\/orcid.org\/0000-0003-2165-7119","authenticated-orcid":false,"given":"Xingsen","family":"Zhang","sequence":"first","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0001-8848-2766","authenticated-orcid":false,"given":"Guanyu","family":"Su","sequence":"additional","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-8674-7037","authenticated-orcid":false,"given":"Daopeng","family":"Zhu","sequence":"additional","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0002-9825-166X","authenticated-orcid":false,"given":"Jiaxi","family":"Huang","sequence":"additional","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-4548-0642","authenticated-orcid":false,"given":"Yanrui","family":"Yang","sequence":"additional","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0003-3115-4483","authenticated-orcid":false,"given":"Guohui","family":"Li","sequence":"additional","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0008-0607-172X","authenticated-orcid":false,"given":"Shengan","family":"Che","sequence":"additional","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]},{"ORCID":"https:\/\/orcid.org\/0009-0005-1724-9800","authenticated-orcid":false,"given":"Bolu","family":"Zhang","sequence":"additional","affiliation":[{"name":"School of Cyber Science and Technology, Shandong University of Political Science and Law, Shandong, China"}]}],"member":"320","published-online":{"date-parts":[[2026,1,28]]},"reference":[{"key":"e_1_3_3_1_2_2","doi-asserted-by":"publisher","DOI":"10.1109\/INCoS.2016.95"},{"key":"e_1_3_3_1_3_2","doi-asserted-by":"publisher","unstructured":"Tom\u00a0B. Brown Benjamin Mann Nick Ryder et\u00a0al. 2020. Language models are few-shot learners. arxiv:https:\/\/arXiv.org\/abs\/2005.14165\u00a0[cs.CL] 10.48550\/arXiv.2005.14165","DOI":"10.48550\/arXiv.2005.14165"},{"key":"e_1_3_3_1_4_2","doi-asserted-by":"publisher","unstructured":"Haisu Chen Jiachun Liao and Sicheng Yao. 2024. Identification and statistical analysis methods of personal information disclosure in open government data. Journal of Shandong University (Natural Science) 59 3 (2024) 95\u2013106. 10.6040\/j.issn.1671-9352.7.2023.2681","DOI":"10.6040\/j.issn.1671-9352.7.2023.2681"},{"key":"e_1_3_3_1_5_2","doi-asserted-by":"publisher","unstructured":"Haisu Chen Jiachun Liao and Sicheng Yao. 2024. Identification and statistical analysis methods of personal information disclosure in open government data. Journal of Shandong University (Natural Science) 59 3 (2024) 95\u2013106. 10.6040\/j.issn.1671-9352.7.2023.2681","DOI":"10.6040\/j.issn.1671-9352.7.2023.2681"},{"key":"e_1_3_3_1_6_2","doi-asserted-by":"publisher","unstructured":"Ye Hua and Li Wang. 2020. Research and practice of data asset management in tobacco enterprises. Acta Tabacaria Sinica 26 5 (2020) 114\u2013122. 10.16472\/j.chinatobacco.2019.236","DOI":"10.16472\/j.chinatobacco.2019.236"},{"key":"e_1_3_3_1_7_2","doi-asserted-by":"publisher","DOI":"10.1145\/3677052.3698696"},{"key":"e_1_3_3_1_8_2","doi-asserted-by":"publisher","unstructured":"Peng Su and Karthik Vijay-Shanker. 2022. Investigation of improving the pre-training and fine-tuning of BERT model for biomedical relation extraction. BMC Bioinformatics 23 1 (2022) 120. 10.1186\/s12859-022-04642-w","DOI":"10.1186\/s12859-022-04642-w"},{"key":"e_1_3_3_1_9_2","doi-asserted-by":"publisher","unstructured":"Chongteng Tian Jing Liu Xiaoyan Wang and Ming Li. 2025. Review of the application of large language models GPT in medical text. Journal of Frontiers of Computer Science and Technology (2025). 10.3778\/j.issn.1673-9418.2409076","DOI":"10.3778\/j.issn.1673-9418.2409076"},{"key":"e_1_3_3_1_10_2","doi-asserted-by":"publisher","unstructured":"Ji Tu Wendong Xiao Wenji Tu and Lijian Li. 2025. Application of large language models in medical education: Current situation challenges and future. Computer Science 52 6A (2025) 240400121\u20136. 10.11896\/jsjkx.240400121","DOI":"10.11896\/jsjkx.240400121"},{"key":"e_1_3_3_1_11_2","doi-asserted-by":"publisher","unstructured":"Hanzhou Xiao and Yingchun Liu. 2025. Study on large database retrieval based on improved B+ tree index. Journal of Guilin University of Aerospace Technology 29 3 (2025) 446\u2013451. 10.3969\/j.issn.1009-1033.2024.03.023","DOI":"10.3969\/j.issn.1009-1033.2024.03.023"},{"key":"e_1_3_3_1_12_2","doi-asserted-by":"publisher","unstructured":"Sonja Zillner and Sabrina Neurerer. 2015. Technology roadmap development for big data healthcare applications. Kunstliche Intelligenz 29 2 (2015) 131\u2013141. 10.1007\/s13218-014-0335-y","DOI":"10.1007\/s13218-014-0335-y"}],"event":{"name":"BDSIC 2025: 2025 7th International Conference on Big-data Service and Intelligent Computation","location":"Bangkok Thailand","acronym":"BDSIC 2025"},"container-title":["Proceedings of the 2025 7th International Conference on Big-data Service and Intelligent Computation"],"original-title":[],"link":[{"URL":"https:\/\/dl.acm.org\/doi\/pdf\/10.1145\/3778265.3778274","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2026,1,29]],"date-time":"2026-01-29T07:25:39Z","timestamp":1769671539000},"score":1,"resource":{"primary":{"URL":"https:\/\/dl.acm.org\/doi\/10.1145\/3778265.3778274"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,29]]},"references-count":11,"alternative-id":["10.1145\/3778265.3778274","10.1145\/3778265"],"URL":"https:\/\/doi.org\/10.1145\/3778265.3778274","relation":{},"subject":[],"published":{"date-parts":[[2025,10,29]]},"assertion":[{"value":"2026-01-28","order":3,"name":"published","label":"Published","group":{"name":"publication_history","label":"Publication History"}}]}}