{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T01:40:02Z","timestamp":1755826802390,"version":"3.44.0"},"publisher-location":"Cham","reference-count":32,"publisher":"Springer Nature Switzerland","isbn-type":[{"type":"print","value":"9783032025500"},{"type":"electronic","value":"9783032025517"}],"license":[{"start":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:00:00Z","timestamp":1755820800000},"content-version":"tdm","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"},{"start":{"date-parts":[[2025,8,22]],"date-time":"2025-08-22T00:00:00Z","timestamp":1755820800000},"content-version":"vor","delay-in-days":0,"URL":"https:\/\/www.springernature.com\/gp\/researchers\/text-and-data-mining"}],"content-domain":{"domain":["link.springer.com"],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2026]]},"DOI":"10.1007\/978-3-032-02551-7_8","type":"book-chapter","created":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T05:27:44Z","timestamp":1755754064000},"page":"77-89","update-policy":"https:\/\/doi.org\/10.1007\/springer_crossmark_policy","source":"Crossref","is-referenced-by-count":0,"title":["Efficient Domain-Adaptive Continual Pretraining for\u00a0the\u00a0Process Industry in\u00a0the\u00a0German Language"],"prefix":"10.1007","author":[{"given":"Anastasia","family":"Zhukova","sequence":"first","affiliation":[]},{"given":"Christian E.","family":"Matt","sequence":"additional","affiliation":[]},{"given":"Bela","family":"Gipp","sequence":"additional","affiliation":[]}],"member":"297","published-online":{"date-parts":[[2025,8,22]]},"reference":[{"key":"8_CR1","doi-asserted-by":"publisher","unstructured":"Bai, F., Ritter, A., Xu, W.: Pre-train or annotate? domain adaptation with a constrained budget. In: Proceedings of the 2021 Conference on Empirical Methods in Natural Language Processing, pp. 5002\u20135015. Association for Computational Linguistics, Online and Punta Cana, Dominican Republic (2021). https:\/\/doi.org\/10.18653\/v1\/2021.emnlp-main.409","DOI":"10.18653\/v1\/2021.emnlp-main.409"},{"key":"8_CR2","doi-asserted-by":"publisher","unstructured":"Beltagy, I., Lo, K., Cohan, A.: SciBERT: a pretrained language model for scientific text. In: Proceedings of the 2019 Conference on Empirical Methods in Natural Language Processing and the 9th International Joint Conference on Natural Language Processing (EMNLP-IJCNLP), pp. 3613\u20133618. Association for Computational Linguistics, Hong Kong, China (2019). https:\/\/doi.org\/10.18653\/v1\/D19-1371","DOI":"10.18653\/v1\/D19-1371"},{"key":"8_CR3","unstructured":"Brown, T., et al.: Language models are few-shot learners. In: Larochelle, H., Ranzato, M., Hadsell, R., Balcan, M., Lin, H. (eds.) Advances in Neural Information Processing Systems, vol.\u00a033, pp. 1877\u20131901. Curran Associates, Inc. (2020). https:\/\/proceedings.neurips.cc\/paper_files\/paper\/2020\/file\/1457c0d6bfcb4967418bfb8ac142f64a-Paper.pdf"},{"key":"8_CR4","doi-asserted-by":"publisher","unstructured":"Caciularu, A., Cohan, A., Beltagy, I., Peters, M., Cattan, A., Dagan, I.: CDLM: cross-document language modeling. In: Findings of the Association for Computational Linguistics: EMNLP 2021, pp. 2648\u20132662. Association for Computational Linguistics, Punta Cana, Dominican Republic (2021). https:\/\/doi.org\/10.18653\/v1\/2021.findings-emnlp.225","DOI":"10.18653\/v1\/2021.findings-emnlp.225"},{"key":"8_CR5","doi-asserted-by":"publisher","unstructured":"Chan, B., Schweter, S., M\u00f6ller, T.: German\u2019s next language model. In: Proceedings of the 28th International Conference on Computational Linguistics. pp. 6788\u20136796. International Committee on Computational Linguistics, Barcelona, Spain (Online) (2020). https:\/\/doi.org\/10.18653\/v1\/2020.coling-main.598","DOI":"10.18653\/v1\/2020.coling-main.598"},{"key":"8_CR6","doi-asserted-by":"publisher","DOI":"10.1016\/j.compbiomed.2023.106581","volume":"154","author":"M Chizhikova","year":"2023","unstructured":"Chizhikova, M., et al.: CARES: a corpus for classification of Spanish radiological reports. Comput. Biol. Med. 154, 106581 (2023). https:\/\/doi.org\/10.1016\/j.compbiomed.2023.106581","journal-title":"Comput. Biol. Med."},{"key":"8_CR7","unstructured":"Chu, C., Wang, R.: A survey of domain adaptation for neural machine translation. In: Bender, E.M., Derczynski, L., Isabelle, P. (eds.) Proceedings of the 27th International Conference on Computational Linguistics, pp. 1304\u20131319. Association for Computational Linguistics, Santa Fe, New Mexico, USA (2018). https:\/\/aclanthology.org\/C18-1111"},{"key":"8_CR8","unstructured":"DNB: Free online university publications. https:\/\/data.dnb.de\/FreieOnlineHochschulschriften\/ (2024). Accessed 06 May 2024"},{"key":"8_CR9","unstructured":"DPMAregister: DPMAregister - Amtliche Publikations- und Registerdatenbank (2024). https:\/\/register.dpma.de\/DPMAregister\/pat\/basis. Accessed 10 Jan 2024"},{"key":"8_CR10","unstructured":"ECHA: Rechtsvorschriften (2024). https:\/\/echa.europa.eu\/de\/regulations\/reach\/legislation. Accessed 23 July 2023"},{"key":"8_CR11","unstructured":"EUR-Lex: Directive 2006\/42\/EC of the European Parliament and of the Council of 17 May 2006 on machinery, and amending Directive 95\/16\/EC (2019). https:\/\/eur-lex.europa.eu\/legal-content\/EN\/ALL\/?uri=celex%3A32006L0042. Accessed 26 July 2023"},{"key":"8_CR12","unstructured":"European Comission: Legal framework governing medicinal products for human use in the EU (2024). https:\/\/health.ec.europa.eu\/medicinal-products\/legal-framework-governing-medicinal-products-human-use-eu_en?etrans=de&prefLang=de. Accessed 24 July 2023"},{"key":"8_CR13","unstructured":"GESIS: Patentdaten der Deutschen Demokratischen Republik (DDR) (1949-1990). https:\/\/doi.org\/10.7802\/2423 (2022). Accessed 12 Aug 2023"},{"key":"8_CR14","unstructured":"Garg, S., Moghaddam, R.Z., Sundaresan, N.: RAPGen: an approach for fixing code inefficiencies in zero-shot (2024). https:\/\/arxiv.org\/abs\/2306.17077"},{"key":"8_CR15","unstructured":"Gunasekar, S., et al.: Textbooks are all you need (2023)"},{"key":"8_CR16","doi-asserted-by":"publisher","unstructured":"Gururangan, S., et al.: Don\u2019t stop pretraining: adapt language models to domains and tasks. In: Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 8342\u20138360. Association for Computational Linguistics, Online (2020). https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.740","DOI":"10.18653\/v1\/2020.acl-main.740"},{"key":"8_CR17","doi-asserted-by":"publisher","unstructured":"Hedderich, M.A., Lange, L., Adel, H., Str\u00f6tgen, J., Klakow, D.: A survey on recent approaches for natural language processing in low-resource scenarios. In: Toutanova, K., Rumshisky, A., Zettlemoyer, L., Hakkani-Tur, D., Beltagy, I., Bethard, S., Cotterell, R., Chakraborty, T., Zhou, Y. (eds.) Proceedings of the 2021 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, pp. 2545\u20132568. Association for Computational Linguistics, Online (Jun 2021). https:\/\/doi.org\/10.18653\/v1\/2021.naacl-main.201, https:\/\/aclanthology.org\/2021.naacl-main.201","DOI":"10.18653\/v1\/2021.naacl-main.201"},{"key":"8_CR18","doi-asserted-by":"publisher","unstructured":"Jiang, G., et al.: Towards anytime fine-tuning: continually pre-trained language models with hypernetwork prompts. In: Findings of the Association for Computational Linguistics: EMNLP 2023, pp. 12081\u201312095. Association for Computational Linguistics, Singapore (2023). https:\/\/doi.org\/10.18653\/v1\/2023.findings-emnlp.808","DOI":"10.18653\/v1\/2023.findings-emnlp.808"},{"key":"8_CR19","doi-asserted-by":"publisher","unstructured":"Joshi, P., Santy, S., Budhiraja, A., Bali, K., Choudhury, M.: The state and fate of linguistic diversity and inclusion in the NLP world. In: Jurafsky, D., Chai, J., Schluter, N., Tetreault, J. (eds.) Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics, pp. 6282\u20136293. Association for Computational Linguistics, Online (2020). https:\/\/doi.org\/10.18653\/v1\/2020.acl-main.560, https:\/\/aclanthology.org\/2020.acl-main.560\/","DOI":"10.18653\/v1\/2020.acl-main.560"},{"key":"8_CR20","unstructured":"Ke, Z., Shao, Y., Lin, H., Konishi, T., Kim, G., Liu, B.: Continual pre-training of language models. In: The Eleventh International Conference on Learning Representations, ICLR 2023, Kigali, Rwanda, May 1-5, 2023. OpenReview.net (2023). https:\/\/openreview.net\/forum?id=m_GDIItaI3o"},{"key":"8_CR21","doi-asserted-by":"publisher","unstructured":"Long, Q., Wang, W., Pan, S.: Adapt in contexts: retrieval-augmented domain adaptation via in-context learning. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing, pp. 6525\u20136542. Association for Computational Linguistics, Singapore (2023). https:\/\/doi.org\/10.18653\/v1\/2023.emnlp-main.402","DOI":"10.18653\/v1\/2023.emnlp-main.402"},{"key":"8_CR22","unstructured":"Monajatipoor, M., et al.: LLMS in biomedicine: a study on clinical named entity recognition (2024)"},{"key":"8_CR23","doi-asserted-by":"publisher","unstructured":"Mosbach, M., Pimentel, T., Ravfogel, S., Klakow, D., Elazar, Y.: Few-shot fine-tuning vs. in-context learning: a fair comparison and evaluation. In: Rogers, A., Boyd-Graber, J., Okazaki, N. (eds.) Findings of the Association for Computational Linguistics: ACL 2023, pp. 12284\u201312314. Association for Computational Linguistics, Toronto, Canada (2023). https:\/\/doi.org\/10.18653\/v1\/2023.findings-acl.779, https:\/\/aclanthology.org\/2023.findings-acl.779\/","DOI":"10.18653\/v1\/2023.findings-acl.779"},{"key":"8_CR24","unstructured":"Nguyen, T., et al.: MS MARCO: a human generated machine reading comprehension dataset. In: Besold, T.R., Bordes, A., d\u2019Avila Garcez, A.S., Wayne, G. (eds.) Proceedings of the Workshop on Cognitive Computation: Integrating neural and symbolic approaches 2016 co-located with the 30th Annual Conference on Neural Information Processing Systems (NIPS 2016), Barcelona, Spain, December 9, 2016. CEUR Workshop Proceedings, vol.\u00a01773. CEUR-WS.org (2016). https:\/\/ceur-ws.org\/Vol-1773\/CoCoNIPS_2016_paper9.pdf"},{"key":"8_CR25","doi-asserted-by":"publisher","unstructured":"Reimers, N., Gurevych, I.: Making monolingual sentence embeddings multilingual using knowledge distillation. In: Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP), pp. 4512\u20134525. Association for Computational Linguistics, Online (2020). https:\/\/doi.org\/10.18653\/v1\/2020.emnlp-main.365","DOI":"10.18653\/v1\/2020.emnlp-main.365"},{"key":"8_CR26","doi-asserted-by":"publisher","unstructured":"Rojas, M., Dunstan, J., Villena, F.: Clinical Flair: a pre-trained language model for Spanish clinical natural language processing. In: Proceedings of the 4th Clinical Natural Language Processing Workshop, pp. 87\u201392. Association for Computational Linguistics, Seattle, WA (2022). https:\/\/doi.org\/10.18653\/v1\/2022.clinicalnlp-1.9","DOI":"10.18653\/v1\/2022.clinicalnlp-1.9"},{"key":"8_CR27","doi-asserted-by":"publisher","unstructured":"Tai, W., Kung, H.T., Dong, X., Comiter, M., Kuo, C.F.: exBERT: extending pre-trained models with domain-specific vocabulary under constrained training resources. In: Findings of the Association for Computational Linguistics: EMNLP 2020, pp. 1433\u20131439. Association for Computational Linguistics, Online (2020). https:\/\/doi.org\/10.18653\/v1\/2020.findings-emnlp.129","DOI":"10.18653\/v1\/2020.findings-emnlp.129"},{"key":"8_CR28","unstructured":"Thakur, N., Reimers, N., R\u00fcckl\u00e9, A., Srivastava, A., Gurevych, I.: Beir: a heterogeneous benchmark for zero-shot evaluation of information retrieval models. In: Vanschoren, J., Yeung, S. (eds.) Proceedings of the Neural Information Processing Systems Track on Datasets and Benchmarks. vol.\u00a01 (2021). https:\/\/datasets-benchmarks-proceedings.neurips.cc\/paper_files\/paper\/2021\/file\/65b9eea6e1cc6bb9f0cd2a47751a186f-Paper-round2.pdf"},{"key":"8_CR29","unstructured":"Xie, S.M., Santurkar, S., Ma, T., Liang, P.: Data selection for language models via importance resampling. In: Proceedings of the 37th International Conference on Neural Information Processing Systems. NIPS 2023, Curran Associates Inc., Red Hook, NY, USA (2023)"},{"key":"8_CR30","doi-asserted-by":"publisher","unstructured":"Yang, J., Hu, X., Huang, W., Yuan, H., Shen, Y., Xiao, G.: Advancing domain adaptation of BERT by learning domain term semantics. In: Knowledge Science, Engineering and Management: 16th International Conference, KSEM 2023, Guangzhou, China, August 16\u201318, 2023, Proceedings, Part IV, p. 12\u201324. Springer, Heidelberg (2023). https:\/\/doi.org\/10.1007\/978-3-031-40292-0_2","DOI":"10.1007\/978-3-031-40292-0_2"},{"key":"8_CR31","unstructured":"Zhukova, A., Matt, C.E., Gipp, B.: Automated collection of evaluation dataset for semantic search in low-resource domain language. In: Hettiarachchi, H., Ranasinghe, T., Rayson, P., Mitkov, R., Gaber, M., Premasiri, D., Tan, F.A., Uyangodage, L. (eds.) Proceedings of the First Workshop on Language Models for Low-Resource Languages, pp. 112\u2013122. Association for Computational Linguistics, Abu Dhabi, United Arab Emirates (2025). https:\/\/aclanthology.org\/2025.loreslm-1.8\/"},{"key":"8_CR32","doi-asserted-by":"publisher","first-page":"7859","DOI":"10.1007\/s10115-024-02212-5","volume":"66","author":"A Zhukova","year":"2024","unstructured":"Zhukova, A., von Sperl, L., Matt, C.E., Gipp, B.: Generative user-experience research for developing domain-specific natural language processing applications. Knowl. Inf. Syst. 66, 7859\u20137889 (2024). https:\/\/doi.org\/10.1007\/s10115-024-02212-5","journal-title":"Knowl. Inf. Syst."}],"container-title":["Lecture Notes in Computer Science","Text, Speech, and Dialogue"],"original-title":[],"language":"en","link":[{"URL":"https:\/\/link.springer.com\/content\/pdf\/10.1007\/978-3-032-02551-7_8","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,8,21]],"date-time":"2025-08-21T05:27:51Z","timestamp":1755754071000},"score":1,"resource":{"primary":{"URL":"https:\/\/link.springer.com\/10.1007\/978-3-032-02551-7_8"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,8,22]]},"ISBN":["9783032025500","9783032025517"],"references-count":32,"URL":"https:\/\/doi.org\/10.1007\/978-3-032-02551-7_8","relation":{},"ISSN":["0302-9743","1611-3349"],"issn-type":[{"type":"print","value":"0302-9743"},{"type":"electronic","value":"1611-3349"}],"subject":[],"published":{"date-parts":[[2025,8,22]]},"assertion":[{"value":"22 August 2025","order":1,"name":"first_online","label":"First Online","group":{"name":"ChapterHistory","label":"Chapter History"}},{"value":"TSD","order":1,"name":"conference_acronym","label":"Conference Acronym","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"International Conference on Text, Speech, and Dialogue","order":2,"name":"conference_name","label":"Conference Name","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Erlangen","order":3,"name":"conference_city","label":"Conference City","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"Germany","order":4,"name":"conference_country","label":"Conference Country","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"2025","order":5,"name":"conference_year","label":"Conference Year","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"25 August 2025","order":7,"name":"conference_start_date","label":"Conference Start Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28 August 2025","order":8,"name":"conference_end_date","label":"Conference End Date","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"28","order":9,"name":"conference_number","label":"Conference Number","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"tsd2025","order":10,"name":"conference_id","label":"Conference ID","group":{"name":"ConferenceInfo","label":"Conference Information"}},{"value":"https:\/\/www.kiv.zcu.cz\/tsd2025\/index.php","order":11,"name":"conference_url","label":"Conference URL","group":{"name":"ConferenceInfo","label":"Conference Information"}}]}}