{"status":"ok","message-type":"work","message-version":"1.0.0","message":{"indexed":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T23:37:53Z","timestamp":1761176273752,"version":"build-2065373602"},"reference-count":0,"publisher":"IOS Press","isbn-type":[{"value":"9781643686318","type":"electronic"}],"license":[{"start":{"date-parts":[[2025,10,21]],"date-time":"2025-10-21T00:00:00Z","timestamp":1761004800000},"content-version":"unspecified","delay-in-days":0,"URL":"https:\/\/creativecommons.org\/licenses\/by-nc\/4.0\/"}],"content-domain":{"domain":[],"crossmark-restriction":false},"short-container-title":[],"published-print":{"date-parts":[[2025,10,21]]},"abstract":"<jats:p>We present two multilingual LLMs, Teuken 7B-base and Teuken 7B-instruct, designed to embrace Europe\u2019s linguistic diversity by supporting all 24 official languages of the European Union. Trained on a dataset comprising around 60% non-English data and utilizing a custom multilingual tokenizer, our models address the limitations of existing Large Language Models (LLMs) that predominantly focus on English or a few high-resource languages. We detail the models\u2019 development principles, i.e., data composition, tokenizer optimization, and training methodologies. The models demonstrate strong performance across multilingual benchmarks, as evidenced by their performance on European versions of ARC, HellaSwag, and TruthfulQA.<\/jats:p>","DOI":"10.3233\/faia251328","type":"book-chapter","created":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T09:58:25Z","timestamp":1761127105000},"source":"Crossref","is-referenced-by-count":0,"title":["Teuken-7B-Base &amp; Teuken-7B-Instruct: Towards European LLMs"],"prefix":"10.3233","author":[{"given":"Mehdi","family":"Ali","sequence":"first","affiliation":[{"name":"Fraunhofer IAIS"},{"name":"Lamarr Institute"}]},{"given":"Michael","family":"Fromm","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"},{"name":"Lamarr Institute"}]},{"given":"Klaudia","family":"Thellmann","sequence":"additional","affiliation":[{"name":"TU Dresden"},{"name":"ScaDS.AI Dresden\/Leipzig"}]},{"given":"Jan","family":"Ebert","sequence":"additional","affiliation":[{"name":"FZ J\u00fclich"}]},{"given":"Alexander Arno","family":"Weber","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"},{"name":"Lamarr Institute"}]},{"given":"Richard","family":"Rutmann","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"},{"name":"Lamarr Institute"}]},{"given":"Charvi","family":"Jain","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"},{"name":"Lamarr Institute"}]},{"given":"Max","family":"L\u00fcbbering","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"},{"name":"Lamarr Institute"}]},{"given":"Daniel","family":"Steinigen","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Johannes","family":"Leveling","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Katrin","family":"Klug","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Jasper Schulze","family":"Buschhoff","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Lena","family":"Jurkschat","sequence":"additional","affiliation":[{"name":"TU Dresden"}]},{"given":"Hammam","family":"Abdelwahab","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Benny J\u00f6rg","family":"Stein","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Karl-Heinz","family":"Sylla","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Pavel","family":"Denisov","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Nicolo\u2019","family":"Brandizzi","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Qasid","family":"Saleem","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Anirban","family":"Bhowmick","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Lennard","family":"Helmer","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Chelsea","family":"John","sequence":"additional","affiliation":[{"name":"FZ J\u00fclich"}]},{"given":"Pedro","family":"Ortiz Suarez","sequence":"additional","affiliation":[{"name":"DFKI"}]},{"given":"Malte","family":"Ostendorff","sequence":"additional","affiliation":[{"name":"DFKI"}]},{"given":"Alex","family":"Jude","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Lalith","family":"Manjunath","sequence":"additional","affiliation":[{"name":"TU Dresden"}]},{"given":"Samuel","family":"Weinbach","sequence":"additional","affiliation":[{"name":"Aleph Alpha"}]},{"given":"Carolin","family":"Penke","sequence":"additional","affiliation":[{"name":"FZ J\u00fclich"}]},{"given":"Oleg","family":"Filatov","sequence":"additional","affiliation":[{"name":"FZ J\u00fclich"}]},{"given":"Fabio","family":"Barth","sequence":"additional","affiliation":[{"name":"DFKI"}]},{"given":"Paramita","family":"Mirza","sequence":"additional","affiliation":[{"name":"Fraunhofer IIS"}]},{"given":"Lucas","family":"Weber","sequence":"additional","affiliation":[{"name":"Fraunhofer IIS"}]},{"given":"Ines","family":"Wendler","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Rafet","family":"Sifa","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Fabian","family":"K\u00fcch","sequence":"additional","affiliation":[{"name":"Fraunhofer IIS"}]},{"given":"Andreas","family":"Herten","sequence":"additional","affiliation":[{"name":"FZ J\u00fclich"}]},{"given":"Ren\u00e9","family":"J\u00e4kel","sequence":"additional","affiliation":[{"name":"TU Dresden"}]},{"given":"Georg","family":"Rehm","sequence":"additional","affiliation":[{"name":"DFKI"}]},{"given":"Stefan","family":"Kesselheim","sequence":"additional","affiliation":[{"name":"FZ J\u00fclich"}]},{"given":"Joachim","family":"K\u00f6hler","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]},{"given":"Nicolas","family":"Flores-Herr","sequence":"additional","affiliation":[{"name":"Fraunhofer IAIS"}]}],"member":"7437","container-title":["Frontiers in Artificial Intelligence and Applications","ECAI 2025"],"original-title":[],"link":[{"URL":"https:\/\/ebooks.iospress.nl\/pdf\/doi\/10.3233\/FAIA251328","content-type":"unspecified","content-version":"vor","intended-application":"similarity-checking"}],"deposited":{"date-parts":[[2025,10,22]],"date-time":"2025-10-22T09:58:26Z","timestamp":1761127106000},"score":1,"resource":{"primary":{"URL":"https:\/\/ebooks.iospress.nl\/doi\/10.3233\/FAIA251328"}},"subtitle":[],"short-title":[],"issued":{"date-parts":[[2025,10,21]]},"ISBN":["9781643686318"],"references-count":0,"URL":"https:\/\/doi.org\/10.3233\/faia251328","relation":{},"ISSN":["0922-6389","1879-8314"],"issn-type":[{"value":"0922-6389","type":"print"},{"value":"1879-8314","type":"electronic"}],"subject":[],"published":{"date-parts":[[2025,10,21]]}}}