% Conference paper announcing the GeMTeX project, published in the MIE 2023
% proceedings (series: Studies in Health Technology and Informatics).
% Braced words in title/booktitle are case-protected against style recasing.
% The publisher copyright statement lives in `copyright` (ignored by standard
% styles) so that it is not printed as part of every citation via `note`.
@inproceedings{786e93661da24dd3a0fa80d10fb46721,
  author    = {Meineke, Frank and Modersohn, Luise and Loeffler, Markus and Boeker, Martin},
  title     = {Announcement of the {German} Medical Text Corpus Project ({GeMTeX})},
  booktitle = {Caring is Sharing - Exploiting the Value in Data for Health and Innovation - Proceedings of {MIE} 2023},
  editor    = {Hagglund, Maria and Blusi, Madeleine and Bonacina, Stefano and Nilsson, Lina and Madsen, Inge Cort and Pelayo, Sylvia and Moen, Anne and Benis, Arriel and Lindskold, Lars and Gallos, Parisis},
  series    = {Studies in Health Technology and Informatics},
  publisher = {IOS Press BV},
  year      = {2023},
  month     = may,
  day       = {18},
  pages     = {835--836},
  doi       = {10.3233/SHTI230283},
  language  = {English},
  keywords  = {German Medical Informatics Initiative, Natural Language Processing, Text Corpus},
  abstract  = {The largest publicly funded project to generate a German-language medical text corpus will start in mid-2023. GeMTeX comprises clinical texts from information systems of six university hospitals, which will be made accessible for NLP by annotation of entities and relations, which will be enhanced with additional meta-information. A strong governance provides a stable legal framework for the use of the corpus. State-of-the art NLP methods are used to build, pre-annotate and annotate the corpus and train language models. A community will be built around GeMTeX to ensure its sustainable maintenance, use, and dissemination.},
  copyright = {{\textcopyright} 2023 European Federation for Medical Informatics (EFMI) and IOS Press.},
  note      = {33rd Medical Informatics Europe Conference: Caring is Sharing - Exploiting the Value in Data for Health and Innovation, MIE2023; Conference date: 22-05-2023 Through 25-05-2023},
}