{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,9,25]],"date-time":"2025-09-25T11:21:46Z","timestamp":1758799306461,"version":"3.44.0"},"reference-count":35,"publisher":"Springer Science and Business Media LLC","issue":"5","license":[{"start":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T00:00:00Z","timestamp":1744156800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T00:00:00Z","timestamp":1744156800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":["Int J Data Sci Anal"],"published-print":{"date-parts":[[2025,10]]},"DOI":"10.1007\/s41060-025-00752-9","type":"journal-article","created":{"date-parts":[[2025,4,9]],"date-time":"2025-04-09T06:51:22Z","timestamp":1744181482000},"page":"4799-4821","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Enhancing clinical information processing with ICRE: an intelligent chain-refinement extraction framework for precision data mining"],"prefix":"10.1007","volume":"20","author":[{"given":"Zheng","family":"Xiao","sequence":"first","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Xiangqian","family":"Dong","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]},{"given":"Juhong","family":"Zou","sequence":"additional","affiliation":[],"role":[{"role":"author","vocabulary":"crossref"}]}],"member":"297","published-online":{"date-parts":[[2025,4,9]]},"reference":[{"issue":"6","key":"752_CR1","doi-asserted-by":"publisher","first-page":"1","DOI":"10.1145\/3127881","volume":"50","author":"P Yadav","year":"2018","unstructured":"Yadav, P., Steinbach, M., Kumar, V., Simon, G.: Mining electronic health records (ehrs) a survey. ACM Comput. Surv. (CSUR) 50(6), 1\u201340 (2018)","journal-title":"ACM Comput. Surv. (CSUR)"},{"key":"752_CR2","doi-asserted-by":"publisher","first-page":"136","DOI":"10.1016\/j.amjcard.2023.06.104","volume":"203","author":"LS Dhingra","year":"2023","unstructured":"Dhingra, L.S., Shen, M., Mangla, A., Khera, R.: Cardiovascular care innovation through data-driven discoveries in the electronic health record. Am. J. Cardiol. 203, 136\u2013148 (2023)","journal-title":"Am. J. Cardiol."},{"issue":"10","key":"752_CR3","doi-asserted-by":"publisher","first-page":"1261","DOI":"10.2217\/fon-2015-0043","volume":"12","author":"ML Berger","year":"2016","unstructured":"Berger, M.L., Curtis, M.D., Smith, G., Harnett, J., Abernethy, A.P.: Opportunities and challenges in leveraging electronic health record data in oncology. Future Oncol. 12(10), 1261\u20131274 (2016)","journal-title":"Future Oncol."},{"issue":"Suppl 4","key":"752_CR4","doi-asserted-by":"publisher","first-page":"999","DOI":"10.1007\/s11606-023-08318-w","volume":"38","author":"B Molloy-Paolillo","year":"2023","unstructured":"Molloy-Paolillo, B., Mohr, D., Levy, D.R., Cutrona, S.L., Anderson, E., Rucci, J., Helfrich, C., Sayre, G., Rinne, S.T.: Assessing electronic health record (ehr) use during a major ehr transition: An innovative mixed methods approach. J. Gen. Intern. Med. 38(Suppl 4), 999\u20131006 (2023)","journal-title":"J. Gen. Intern. Med."},{"key":"752_CR5","doi-asserted-by":"publisher","first-page":"765","DOI":"10.1016\/j.molmed.2023.06.006","volume":"29","author":"P Singhal","year":"2023","unstructured":"Singhal, P., Tan, A., Drivas, T., Johnson, K., Ritchie, M., Beaulieu-Jones, B.: Opportunities and challenges for biomarker discovery using electronic health record data. Trends Mol. Med. 29, 765\u2013776 (2023)","journal-title":"Trends Mol. Med."},{"issue":"1","key":"752_CR6","first-page":"17","volume":"43","author":"VK Chaudhri","year":"2022","unstructured":"Chaudhri, V.K., Baru, C., Chittar, N., Dong, X.L., Genesereth, M., Hendler, J., Kalyanpur, A., Lenat, D.B., Sequeda, J., Vrande\u010di\u0107, D., Wang, K.: Knowledge graphs: Introduction, history, and perspectives. AI Mag. 43(1), 17\u201329 (2022)","journal-title":"AI Mag."},{"issue":"2","key":"752_CR7","doi-asserted-by":"publisher","first-page":"494","DOI":"10.1109\/TNNLS.2021.3070843","volume":"33","author":"S Ji","year":"2021","unstructured":"Ji, S., Pan, S., Cambria, E., Marttinen, P., Philip, S.Y.: A survey on knowledge graphs: Representation, acquisition, and applications. IEEE Trans. Neural Netw. Learn. Syst. 33(2), 494\u2013514 (2021)","journal-title":"IEEE Trans. Neural Netw. Learn. Syst."},{"issue":"1","key":"752_CR8","doi-asserted-by":"publisher","first-page":"2017","DOI":"10.1038\/s41467-021-22328-4","volume":"12","author":"JA Fries","year":"2021","unstructured":"Fries, J.A., Steinberg, E., Khattar, S., Fleming, S.L., Posada, J., Callahan, A., Shah, N.H.: Ontology-driven weak supervision for clinical entity classification in electronic health records. Nat. Commun. 12(1), 2017 (2021)","journal-title":"Nat. Commun."},{"key":"752_CR9","doi-asserted-by":"publisher","DOI":"10.1016\/j.ijmedinf.2022.104864","volume":"167","author":"SY Wang","year":"2022","unstructured":"Wang, S.Y., Huang, J., Hwang, H., Hu, W., Tao, S., Hernandez-Boussard, T.: Leveraging weak supervision to perform named entity recognition in electronic health records progress notes to identify the ophthalmology exam. Int. J. Med. Inf. 167, 104864 (2022)","journal-title":"Int. J. Med. Inf."},{"key":"752_CR10","doi-asserted-by":"publisher","first-page":"132","DOI":"10.1016\/j.neunet.2019.08.032","volume":"121","author":"L Gligic","year":"2020","unstructured":"Gligic, L., Kormilitzin, A., Goldberg, P., Nevado-Holgado, A.: Named entity recognition in electronic health records using transfer learning bootstrapped neural networks. Neural Netw. 121, 132\u2013139 (2020)","journal-title":"Neural Netw."},{"key":"752_CR11","doi-asserted-by":"crossref","unstructured":"Lu, Y., Liu, Q., Dai, D., Xiao, X., Lin, H., Han, X., Sun, L., Wu, H.: Unified structure generation for universal information extraction. In: Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), pp. 5755\u20135772. Association for Computational Linguistics, Dublin, Ireland (2022)","DOI":"10.18653\/v1\/2022.acl-long.395"},{"key":"752_CR12","unstructured":"Wang, X., Zhou, W., Zu, C., Xia, H., Chen, T., Zhang, Y., Zheng, R., Ye, J., Zhang, Q., Gui, T., Kang, J., Yang, J., Li, S., Du, C.: InstructUIE: Multi-task instruction tuning for unified information extraction. ArXiv abs\/2304.08085 (2023)"},{"key":"752_CR13","unstructured":"Gui, H., Zhang, J., Ye, H., Zhang, N.: InstructIE: A bilingual instruction-based information extraction dataset. ArXiv abs\/2305.11527 (2023)"},{"key":"752_CR14","doi-asserted-by":"publisher","first-page":"3580","DOI":"10.1109\/TKDE.2024.3352100","volume":"36","author":"S Pan","year":"2024","unstructured":"Pan, S., Luo, L., Wang, Y., Chen, C., Wang, J., Wu, X.: Unifying large language models and knowledge graphs: A roadmap. IEEE Trans. Knowl. Data Eng. 36, 3580\u20133599 (2024)","journal-title":"IEEE Trans. Knowl. Data Eng."},{"key":"752_CR15","unstructured":"Zhang, S., Dong, L., Li, X., Zhang, S., Sun, X., Wang, S., Li, J., Hu, R., Zhang, T., Wu, F., et al.: Instruction tuning for large language models: A survey. arXiv preprint arXiv:2308.10792 (2023)"},{"key":"752_CR16","unstructured":"Jang, J., Kim, S., Ye, S., Kim, D., Logeswaran, L., Lee, M., Lee, K., Seo, M.: Exploring the benefits of training expert language models over instruction tuning. In: International Conference on Machine Learning, 14702\u201314729 (2023). PMLR"},{"key":"752_CR17","doi-asserted-by":"crossref","unstructured":"Amal, S., Kuflik, T., Minkov, E.: Harvesting entity-relation social networks from the web: Potential and challenges. In: Proceedings of the 25th Conference on User Modeling, Adaptation and Personalization. UMAP \u201917, pp. 351\u2013352. Association for Computing Machinery, New York, NY, USA (2017)","DOI":"10.1145\/3079628.3079656"},{"key":"752_CR18","doi-asserted-by":"crossref","unstructured":"Gui, H., Yuan, L., Ye, H., Zhang, N., Sun, M., Liang, L., Chen, H.: IEPile: Unearthing large-scale schema-based information extraction corpus. ArXiv abs\/2402.14710 (2024)","DOI":"10.18653\/v1\/2024.acl-short.13"},{"key":"752_CR19","doi-asserted-by":"crossref","unstructured":"Ou, Y., Zhang, N., Gui, H., Xu, Z., Qiao, S., Bi, Z., Chen, H.: EasyInstruct: An easy-to-use instruction processing framework for large language models. arXiv preprint arXiv:2402.03049 (2024)","DOI":"10.18653\/v1\/2024.acl-demos.10"},{"key":"752_CR20","unstructured":"Kejriwal, M., Knoblock, C.A., Szekely, P.: Knowledge Graphs: Fundamentals, Techniques, and Applications. MIT Press, (2021)"},{"key":"752_CR21","doi-asserted-by":"publisher","DOI":"10.1145\/3560815","author":"P Liu","year":"2023","unstructured":"Liu, P., Yuan, W., Fu, J., Jiang, Z., Hayashi, H., Neubig, G.: Pre-train, prompt, and predict: A systematic survey of prompting methods in natural language processing. ACM Comput. Surv. (2023). https:\/\/doi.org\/10.1145\/3560815","journal-title":"ACM Comput. Surv."},{"key":"752_CR22","doi-asserted-by":"crossref","unstructured":"Bach, S.H., Sanh, V., Yong, Z.-X., Webson, A., Raffel, C., Nayak, N.V., Sharma, A., Kim, T., Bari, M.S., F\u00e9vry, T., Alyafeai, Z., Dey, M., Santilli, A., Sun, Z., Ben-David, S., Xu, C., Chhablani, G., Wang, H., Fries, J.A., Al-Shaibani, M.S., Sharma, S., Thakker, U., Almubarak, K., Tang, X., Jiang, M.T.-J., Rush, A.M.: PromptSource: An integrated development environment and repository for natural language prompts. ArXiv abs\/2202.01279 (2022)","DOI":"10.18653\/v1\/2022.acl-demo.9"},{"issue":"4","key":"752_CR23","doi-asserted-by":"publisher","first-page":"5235","DOI":"10.1007\/s10586-023-04221-5","volume":"27","author":"B Abdollahzadeh","year":"2024","unstructured":"Abdollahzadeh, B., Khodadadi, N., Barshandeh, S., Trojovsk\u00fd, P., Gharehchopogh, F.S., El-kenawy, E.-S.M., Abualigah, L., Mirjalili, S.: Puma optimizer (PO): a novel metaheuristic optimization algorithm and its application in machine learning. Clust. Comput. 27(4), 5235\u20135283 (2024)","journal-title":"Clust. Comput."},{"key":"752_CR24","unstructured":"Agarwal, E., Dani, V., Ganu, T., Nambi, A.: PromptWizard: Task-aware agent-driven prompt optimization framework. arXiv preprint arXiv:2405.18369 (2024)"},{"key":"752_CR25","doi-asserted-by":"crossref","unstructured":"Li, Y., Li, Z., Zhang, K., Dan, R., Jiang, S., Zhang, Y.: ChatDoctor: A medical chat model fine-tuned on a large language model meta-ai (llama) using medical domain knowledge. Cureus 15 (2023)","DOI":"10.7759\/cureus.40895"},{"issue":"5","key":"752_CR26","doi-asserted-by":"publisher","first-page":"885","DOI":"10.1016\/j.jbi.2012.04.008","volume":"45","author":"H Gurulingappa","year":"2012","unstructured":"Gurulingappa, H., Rajput, A.M., Roberts, A., Fluck, J., Hofmann-Apitius, M., Toldo, L.: Development of a benchmark corpus to support the automatic extraction of drug-related adverse effects from medical case reports. J. Biomed. Inf. 45(5), 885\u2013892 (2012). https:\/\/doi.org\/10.1016\/j.jbi.2012.04.008","journal-title":"J. Biomed. Inf."},{"key":"752_CR27","doi-asserted-by":"crossref","unstructured":"Wen, C., Chen, T., Jia, X., Zhu, J.: Medical Named Entity Recognition from Un-labelled Medical Records based on Pre-trained Language Models and Domain Dictionary. Data Intell. 3(3), 402\u2013417 (2021)","DOI":"10.1162\/dint_a_00105"},{"key":"752_CR28","unstructured":"Chen, M., Bi, Z., Liang, X., Li, L., Shang, X., Yin, K., Tan, C., Xu, J., Huang, F., Si, L., Ni, Y., Sui, Z., Chang, B., Zong, H., Yuan, Z., Li, L., Yan, J., Zan, H., Zhang, K., Tang, B., Chen, Q.: Cblue: a chinese biomedical language understanding evaluation benchmark. Proceedings of the 60th Annual Meeting of the Association for Computational Linguistics (Volume 1: Long Papers), 7888\u20137915 (2022)"},{"key":"752_CR29","unstructured":"Do, V.-T., Hoang, V.-K., Nguyen, D.-H., Sabahi, S., Yang, J., Hotta, H., Nguyen, M.-T., Le, H.: Automatic prompt selection for large language models. ArXiv abs\/2404.02717 (2024)"},{"key":"752_CR30","doi-asserted-by":"crossref","unstructured":"Bosselut, A., Rashkin, H., Sap, M., Malaviya, C., Celikyilmaz, A., Choi, Y.: COMET: Commonsense transformers for automatic knowledge graph construction. In: Korhonen, A., Traum, D., M\u00e0rquez, L. (eds.) Proceedings of the 57th Annual Meeting of the Association for Computational Linguistics, pp. 4762\u20134779. Association for Computational Linguistics, Florence, Italy (2019)","DOI":"10.18653\/v1\/P19-1470"},{"key":"752_CR31","unstructured":"Yang, C., Wang, X., Lu, Y., Liu, H., Le, Q.V., Zhou, D., Chen, X.: Large language models as optimizers. In: The Twelfth International Conference on Learning Representations (2024)"},{"key":"752_CR32","doi-asserted-by":"publisher","DOI":"10.1016\/j.patcog.2023.109542","volume":"140","author":"P Cao","year":"2023","unstructured":"Cao, P., Wu, J.: Graphrevisedie: Multimodal information extraction with graph-revised network. Pattern Recognit. 140, 109542 (2023)","journal-title":"Pattern Recognit."},{"key":"752_CR33","doi-asserted-by":"crossref","unstructured":"Sun, L., Zhang, K., Li, Q., Lou, R.: Umie: Unified multimodal information extraction with instruction tuning. In: Proceedings of the AAAI Conference on Artificial Intelligence, 38, 19062\u201319070 (2024)","DOI":"10.1609\/aaai.v38i17.29873"},{"key":"752_CR34","doi-asserted-by":"crossref","unstructured":"Islakoglu, D.S., Chekol, M.W., Velegrakis, Y.: Leveraging pre-trained language models for time interval prediction in text-enhanced temporal knowledge graphs. In: European Semantic Web Conference, pp. 59\u201378 (2024). Springer","DOI":"10.1007\/978-3-031-60626-7_4"},{"key":"752_CR35","doi-asserted-by":"crossref","unstructured":"Liao, R., Jia, X., Ma, Y., Tresp, V.: Gentkg: Generative forecasting on temporal knowledge graph. arXiv preprint arXiv:2310.07793 (2023)","DOI":"10.18653\/v1\/2024.findings-naacl.268"}],"container-title":["International Journal of Data Science and Analytics"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-025-00752-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/article\/10.1007\/s41060-025-00752-9\/fulltext.html","content-type":"text\/html","content-version":"vor","intended-application":"text-mining"},{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/s41060-025-00752-9.pdf","content-type":"application\/pdf","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,9,25]],"date-time":"2025-09-25T10:48:30Z","timestamp":1758797310000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/s41060-025-00752-9"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,4,9]]},"references-count":35,"journal-issue":{"issue":"5","published-print":{"date-parts":[[2025,10]]}},"alternative-id":["752"],"URL":"https:\/\/doi.org\/10.1007\/s41060-025-00752-9","relation":{},"ISSN":["2364-415X","2364-4168"],"issn-type":[{"type":"print","value":"2364-415X"},{"type":"electronic","value":"2364-4168"}],"subject":[],"published":{"date-parts":[[2025,4,9]]},"assertion":[{"value":"13 December 2024","order":1,"name":"received","label":"Received","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"1 March 2025","order":2,"name":"accepted","label":"Accepted","group":{"name":"ArticleHistory","label":"Article History"}},{"value":"9 April 2025","order":3,"name":"first_online","label":"First Online","group":{"name":"ArticleHistory","label":"Article History"}},{"order":1,"name":"Ethics","group":{"name":"EthicsHeading","label":"Declarations"}},{"value":"The authors declare no conflict of interest.","order":2,"name":"Ethics","group":{"name":"EthicsHeading","label":"Conflict of interest"}}]}}