<?xml version="1.0" encoding="iso-8859-1" standalone="no"?>
<!DOCTYPE GmsArticle SYSTEM "http://www.egms.de/dtd/2.0.34/GmsArticle.dtd">
<GmsArticle xmlns:xlink="http://www.w3.org/1999/xlink">
  <MetaData>
    <Identifier>25gmds062</Identifier>
    <IdentifierDoi>10.3205/25gmds062</IdentifierDoi>
    <IdentifierUrn>urn:nbn:de:0183-25gmds0625</IdentifierUrn>
    <ArticleType>Meeting Abstract</ArticleType>
    <TitleGroup>
      <Title language="en">Using LLMs for the Annotation of German Clinical Forms with SNOMED CT and the MII Core Data Set</Title>
    </TitleGroup>
    <CreatorList>
      <Creator>
        <PersonNames>
          <Lastname>Riedel</Lastname>
          <LastnameHeading>Riedel</LastnameHeading>
          <Firstname>Andrea</Firstname>
          <Initials>A</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Erlangen University Hospital, Medical Center for Information and Communication Technology, Erlangen, Germany</Affiliation>
          <Affiliation>Friedrich-Alexander-Universit&#228;t Erlangen-N&#252;rnberg, Medical Informatics, Erlangen, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Kosminski</Lastname>
          <LastnameHeading>Kosminski</LastnameHeading>
          <Firstname>Michelle</Firstname>
          <Initials>M</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Friedrich-Alexander-Universit&#228;t Erlangen-N&#252;rnberg, Machine Learning and Data Analytics Lab, Erlangen, Germany</Affiliation>
          <Affiliation>Erlangen University Hospital, Medical Center for Information and Communication Technology, Erlangen, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Borst</Lastname>
          <LastnameHeading>Borst</LastnameHeading>
          <Firstname>Sandra</Firstname>
          <Initials>S</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Erlangen University Hospital, Medical Center for Information and Communication Technology, Erlangen, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Salin</Lastname>
          <LastnameHeading>Salin</LastnameHeading>
          <Firstname>Emmanuelle</Firstname>
          <Initials>E</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Friedrich-Alexander-Universit&#228;t Erlangen-N&#252;rnberg, Machine Learning and Data Analytics Lab, Erlangen, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Bohr</Lastname>
          <LastnameHeading>Bohr</LastnameHeading>
          <Firstname>Arijana</Firstname>
          <Initials>A</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Friedrich-Alexander-Universit&#228;t Erlangen-N&#252;rnberg, Machine Learning and Data Analytics Lab, Erlangen, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Eskofier</Lastname>
          <LastnameHeading>Eskofier</LastnameHeading>
          <Firstname>Bjoern</Firstname>
          <Initials>B</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Friedrich-Alexander-Universit&#228;t Erlangen-N&#252;rnberg, Machine Learning and Data Analytics Lab, Erlangen, Germany</Affiliation>
          <Affiliation>Translational Digital Health Group, Institute of AI for Health, Helmholtz Zentrum M&#252;nchen - German Research Center for Environmental Health, Neuherberg, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Ganslandt</Lastname>
          <LastnameHeading>Ganslandt</LastnameHeading>
          <Firstname>Thomas</Firstname>
          <Initials>T</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Friedrich-Alexander-Universit&#228;t Erlangen-N&#252;rnberg, Medical Informatics, Erlangen, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Deppenwiese</Lastname>
          <LastnameHeading>Deppenwiese</LastnameHeading>
          <Firstname>Noemi</Firstname>
          <Initials>N</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Erlangen University Hospital, Medical Center for Information and Communication Technology, Erlangen, Germany</Affiliation>
          <Affiliation>Friedrich-Alexander-Universit&#228;t Erlangen-N&#252;rnberg, Medical Informatics, Erlangen, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
    </CreatorList>
    <PublisherList>
      <Publisher>
        <Corporation>
          <Corporatename>German Medical Science GMS Publishing House</Corporatename>
        </Corporation>
        <Address>D&#252;sseldorf</Address>
      </Publisher>
    </PublisherList>
    <SubjectGroup>
      <SubjectheadingDDB>610</SubjectheadingDDB>
      <Keyword language="en">clinical coding</Keyword>
      <Keyword language="en">health information interoperability</Keyword>
      <Keyword language="en">large language models</Keyword>
      <Keyword language="en">systematized nomenclature of medicine</Keyword>
      <Keyword language="en">terminology as topic</Keyword>
    </SubjectGroup>
    <DatePublishedList>
      <DatePublished>20251103</DatePublished>
    </DatePublishedList>
    <Language>engl</Language>
    <License license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
      <AltText language="en">This is an Open Access article distributed under the terms of the Creative Commons Attribution 4.0 License.</AltText>
      <AltText language="de">Dieser Artikel ist ein Open-Access-Artikel und steht unter den Lizenzbedingungen der Creative Commons Attribution 4.0 License (Namensnennung).</AltText>
    </License>
    <SourceGroup>
      <Meeting>
        <MeetingId>M0631</MeetingId>
        <MeetingSequence>062</MeetingSequence>
        <MeetingCorporation>Deutsche Gesellschaft f&#252;r Medizinische Informatik, Biometrie und Epidemiologie</MeetingCorporation>
        <MeetingName>70. Jahrestagung der Deutschen Gesellschaft f&#252;r Medizinische Informatik, Biometrie und Epidemiologie e. V. (GMDS)</MeetingName>
        <MeetingTitle></MeetingTitle>
        <MeetingSession>V: Large language models &#38; medical texts 2</MeetingSession>
        <MeetingCity>Jena</MeetingCity>
        <MeetingDate>
          <DateFrom>20250907</DateFrom>
          <DateTo>20250911</DateTo>
        </MeetingDate>
      </Meeting>
    </SourceGroup>
    <ArticleNo>Abstr. 317</ArticleNo>
  </MetaData>
  <OrigData>
    <TextBlock name="Text" linked="yes">
      <MainHeadline>Text</MainHeadline><Pgraph><Mark1>Introduction:</Mark1> The <Mark2>Medical Informatics Initiative (MII) </Mark2>aims to standardise routine care data for research based on the <Mark2>core data set (CDS)</Mark2> <TextLink reference="1"></TextLink>. To improve semantic interoperability, the <Mark2>CDS</Mark2> utilises the world&#8217;s leading health terminology <Mark2>SNOMED CT</Mark2> <Mark2>(SCT)</Mark2> <TextLink reference="2"></TextLink>.</Pgraph><Pgraph>Medical forms are an inherent means of routinely capturing patient data through structured hospital documentation. Our project aims to enhance the reusability of clinical documentation forms through their semantic annotation, addressing a common issue of inconsistent standards across departments.</Pgraph><Pgraph>Currently, the field of German natural language processing in medicine is limited by the scarcity of publicly accessible, domain-specific Large Language Models (LLMs) and German-language ground truth (GT) corpora with semantic annotations <TextLink reference="3"></TextLink>, <TextLink reference="4"></TextLink>, <TextLink reference="5"></TextLink>.</Pgraph><Pgraph><Mark1>Methods:</Mark1> We aim to accelerate the annotation process of German medical forms with the help of LLMs and by prioritising <Mark2>SCT</Mark2> concepts appearing within the <Mark2>CDS</Mark2> to support automated <Mark2>SCT</Mark2> coding. As the <Mark2>German National Edition</Mark2> is currently limited to specific use cases, we focused on annotations with the <Mark2>SCT International Edition</Mark2> (Version: 01-04-2025). We chose tumour board forms from the <Mark2>University Hospital Erlangen (UKER) </Mark2>as our use case, since the documentation of tumour board meetings is mandatory for hospitals certified by the <Mark2>German Cancer Society</Mark2>. Due to privacy concerns, we compared two locally-hosted LLMs, <Mark2>unsloth&#47;Meta-Llama-3.1-8B-Instruct </Mark2>and<Mark2> mistralai&#47;Mistral-7B-Instruct-v0.3</Mark2>.</Pgraph><Pgraph>The form items were first preprocessed using <Mark2>unsloth&#47;Mistral-Small-3.1-24B-Instruct-2503-unsloth-bnb-4bit</Mark2>. Next, we employed <Mark2>Retrieval Augmented Generation</Mark2> techniques. A list of possible <Mark2>SCT </Mark2>codes was extracted from the <Mark2>CDS</Mark2> (version 2025) using three different embedding methods (<Mark2>sentencetransformers&#47;all-mpnet-base-v2</Mark2>, <Mark2>xlreator&#47;biosyn-biobert-snomed</Mark2>, and <Mark2>abhinand&#47;MedEmbed-base-v0.1</Mark2>). Finally, the two decoder models were tested for code suggestion using the <Mark2>SNOWSTORM</Mark2> server API, and final selection of the k (k&#61; 1, 3, 5) most relevant codes. The proposed automated approach was evaluated by comparing the suggested codes with a manually annotated GT of 15 <Mark2>UKER</Mark2> tumour board forms by two local medical <Mark2>SCT</Mark2> experts.</Pgraph><Pgraph><Mark1>Results:</Mark1> Our GT annotations showed that 48&#37; of the tumour board forms could be represented by pre-coordinated <Mark2>SCT</Mark2> concepts (Inter-Annotator-Agreement <Mark2>Cohen&#39;s Kappa</Mark2> (&#954; &#61; 0.75 micro, 0.75 macro)). Around 4.8&#37; of the chosen <Mark2>SCT</Mark2> concepts are part of the current <Mark2>CDS</Mark2>. The best results were shown for <Mark2>unsloth&#47;Meta-Llama-3.1-8BInstruct</Mark2> with a <Mark2>xlreator&#47;biosyn-biobert-snomed</Mark2> embedding, which correctly detected 46.2&#37; of GT codes for one selected <Mark2>SCT</Mark2> code, and up to 57.8&#37; for five selected <Mark2>SCT</Mark2> codes.</Pgraph><Pgraph><Mark1>Discussion:</Mark1> Our proposed pipeline is one of the first contributions to automated pre-annotation suggestions for <Mark2>SCT</Mark2> annotations of German medical forms, as manual annotation still outperforms automated approaches. The LLM-based annotation process was complicated by the German-English translation between the German form content and the English-language international terminology <Mark2>SCT</Mark2>. Additional primary factors for missing mappings were non-mappable local peculiarities, non-relevant supporting protocol instructions (e.g., proper names) or outdated <Mark2>SCT</Mark2> concepts within the <Mark2>CDS</Mark2>.</Pgraph><Pgraph><Mark1>Conclusion:</Mark1> Our pipeline will support the standardisation processes of German medical forms across different clinical <Mark2>MII</Mark2> sites. An analysis of linguistic, technical, and semantic aspects (e.g., prioritisation of specific semantic tags in <Mark2>SCT</Mark2> selection) provided insights for future research. Further investigations regarding automated post-coordinations are necessary to further limit manual efforts.</Pgraph><Pgraph>The authors declare that they have no competing interests.</Pgraph><Pgraph>The authors declare that an ethics committee vote is not required.</Pgraph></TextBlock>
    <References linked="yes">
      <Reference refNo="1">
        <RefAuthor>Semler SC</RefAuthor>
        <RefAuthor>Wissing F</RefAuthor>
        <RefAuthor>Heyder R</RefAuthor>
        <RefTitle>German medical informatics initiative</RefTitle>
        <RefYear>2018</RefYear>
        <RefJournal>Methods of information in medicine</RefJournal>
        <RefPage>e50-6</RefPage>
        <RefTotal>Semler SC, Wissing F, Heyder R. German medical informatics initiative. Methods of information in medicine. 2018 May;57(S 01):e50-6.</RefTotal>
      </Reference>
      <Reference refNo="2">
        <RefAuthor>Ingenerf J</RefAuthor>
        <RefAuthor>Drenkhahn C</RefAuthor>
        <RefTitle></RefTitle>
        <RefYear>2024</RefYear>
        <RefBookTitle>Referenzterminologie SNOMED CT: Interlingua zur Gew&#228;hrleistung semantischer Interoperabilit&#228;t in der Medizin</RefBookTitle>
        <RefPage></RefPage>
        <RefTotal>Ingenerf J, Drenkhahn C. Referenzterminologie SNOMED CT: Interlingua zur Gew&#228;hrleistung semantischer Interoperabilit&#228;t in der Medizin. Springer-Verlag; 2024 Jan 18.</RefTotal>
      </Reference>
      <Reference refNo="3">
        <RefAuthor>Hahn U</RefAuthor>
        <RefTitle>Clinical Document Corpora -- Real Ones, Translated and Synthetic Substitutes, and Assorted Domain Proxies: A Survey of Diversity in Corpus Design, with Focus on German Text Data &#91;Preprint&#93;</RefTitle>
        <RefYear>2024</RefYear>
        <RefJournal>arXiv</RefJournal>
        <RefPage></RefPage>
        <RefTotal>Hahn U. Clinical Document Corpora -- Real Ones, Translated and Synthetic Substitutes, and Assorted Domain Proxies: A Survey of Diversity in Corpus Design, with Focus on German Text Data &#91;Preprint&#93;. arXiv. 2024. DOI: 
10.48550&#47;arXiv.2412.00230</RefTotal>
        <RefLink>https:&#47;&#47;doi.org&#47;10.48550&#47;arXiv.2412.00230</RefLink>
      </Reference>
      <Reference refNo="4">
        <RefAuthor>Borchert F</RefAuthor>
        <RefAuthor>Lohr C</RefAuthor>
        <RefAuthor>Modersohn L</RefAuthor>
        <RefAuthor>Witt J</RefAuthor>
        <RefAuthor>Langer T</RefAuthor>
        <RefAuthor>Follmann M</RefAuthor>
        <RefAuthor>Gietzelt M</RefAuthor>
        <RefAuthor>Arnrich B</RefAuthor>
        <RefAuthor>Hahn U</RefAuthor>
        <RefAuthor>Schapranow MP</RefAuthor>
        <RefTitle>GGPONC 2.0 - the German clinical guideline corpus for oncology: Curation workflow, annotation policy, baseline NER taggers</RefTitle>
        <RefYear></RefYear>
        <RefBookTitle>Proceedings of the Thirteenth Language Resources and Evaluation Conference; 2022 Jun</RefBookTitle>
        <RefPage>p. 3650-3660.</RefPage>
        <RefTotal>Borchert F, Lohr C, Modersohn L, Witt J, Langer T, Follmann M, Gietzelt M, Arnrich B, Hahn U, Schapranow MP. GGPONC 2.0 - the German clinical guideline corpus for oncology: Curation workflow, annotation policy, baseline NER taggers. In: Proceedings of the Thirteenth Language Resources and Evaluation Conference; 2022 Jun. p. 3650-3660.</RefTotal>
      </Reference>
      <Reference refNo="5">
        <RefAuthor>Carlini N</RefAuthor>
        <RefAuthor>Tramer F</RefAuthor>
        <RefAuthor>Wallace E</RefAuthor>
        <RefAuthor>Jagielski M</RefAuthor>
        <RefAuthor>Herbert-Voss A</RefAuthor>
        <RefAuthor>Lee K</RefAuthor>
        <RefAuthor>Roberts A</RefAuthor>
        <RefAuthor>Brown T</RefAuthor>
        <RefAuthor>Song D</RefAuthor>
        <RefAuthor>Erlingsson U</RefAuthor>
        <RefAuthor>Oprea A</RefAuthor>
        <RefTitle>Extracting training data from large language models</RefTitle>
        <RefYear></RefYear>
        <RefBookTitle>30th USENIX security symposium (USENIX Security 21) 2021</RefBookTitle>
        <RefPage>2633-2650</RefPage>
        <RefTotal>Carlini N, Tramer F, Wallace E, Jagielski M, Herbert-Voss A, Lee K, Roberts A, Brown T, Song D, Erlingsson U, Oprea A. Extracting training data from large language models. In: 30th USENIX security symposium (USENIX Security 21) 2021. p. 2633-2650.</RefTotal>
      </Reference>
    </References>
    <Media>
      <Tables>
        <NoOfTables>0</NoOfTables>
      </Tables>
      <Figures>
        <NoOfPictures>0</NoOfPictures>
      </Figures>
      <InlineFigures>
        <NoOfPictures>0</NoOfPictures>
      </InlineFigures>
      <Attachments>
        <NoOfAttachments>0</NoOfAttachments>
      </Attachments>
    </Media>
  </OrigData>
</GmsArticle>