<?xml version="1.0" encoding="iso-8859-1" standalone="no"?>
<!DOCTYPE GmsArticle SYSTEM "http://www.egms.de/dtd/2.0.34/GmsArticle.dtd">
<GmsArticle xmlns:xlink="http://www.w3.org/1999/xlink">
  <MetaData>
    <Identifier>25gmds179</Identifier>
    <IdentifierDoi>10.3205/25gmds179</IdentifierDoi>
    <IdentifierUrn>urn:nbn:de:0183-25gmds1797</IdentifierUrn>
    <ArticleType>Meeting Abstract</ArticleType>
    <TitleGroup>
      <Title language="en">Accessible pipeline for intelligent search on in-house clinical guidelines</Title>
    </TitleGroup>
    <CreatorList>
      <Creator>
        <PersonNames>
          <Lastname>Spiegel</Lastname>
          <LastnameHeading>Spiegel</LastnameHeading>
          <Firstname>S&#246;ren</Firstname>
          <Initials>S</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Institute for Applied Medical Informatics (IAM), Center for Experimental Medicine, University Hospital Hamburg-Eppendorf (UKE), Hamburg, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Bellmann</Lastname>
          <LastnameHeading>Bellmann</LastnameHeading>
          <Firstname>Louis</Firstname>
          <Initials>L</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Institute for Applied Medical Informatics (IAM), Center for Experimental Medicine, University Hospital Hamburg-Eppendorf (UKE), Hamburg, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Solomonova</Lastname>
          <LastnameHeading>Solomonova</LastnameHeading>
          <Firstname>Aliona</Firstname>
          <Initials>A</Initials>
        </PersonNames>
        <Address>
          <Affiliation>UKE Hamburg-Eppendorf, Hamburg, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Breitfeld</Lastname>
          <LastnameHeading>Breitfeld</LastnameHeading>
          <Firstname>Philipp</Firstname>
          <Initials>P</Initials>
        </PersonNames>
        <Address>
          <Affiliation>UKE Hamburg-Eppendorf, Hamburg, Germany</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
    </CreatorList>
    <PublisherList>
      <Publisher>
        <Corporation>
          <Corporatename>German Medical Science GMS Publishing House</Corporatename>
        </Corporation>
        <Address>D&#252;sseldorf</Address>
      </Publisher>
    </PublisherList>
    <SubjectGroup>
      <SubjectheadingDDB>610</SubjectheadingDDB>
      <Keyword language="en">large language model (LLM)</Keyword>
      <Keyword language="en">retrieval-augmented generation (RAG)</Keyword>
    </SubjectGroup>
    <DatePublishedList>
      <DatePublished>20251103</DatePublished>
    </DatePublishedList>
    <Language>engl</Language>
    <License license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
      <AltText language="en">This is an Open Access article distributed under the terms of the Creative Commons Attribution 4.0 License.</AltText>
      <AltText language="de">Dieser Artikel ist ein Open-Access-Artikel und steht unter den Lizenzbedingungen der Creative Commons Attribution 4.0 License (Namensnennung).</AltText>
    </License>
    <SourceGroup>
      <Meeting>
        <MeetingId>M0631</MeetingId>
        <MeetingSequence>179</MeetingSequence>
        <MeetingCorporation>Deutsche Gesellschaft f&#252;r Medizinische Informatik, Biometrie und Epidemiologie</MeetingCorporation>
        <MeetingName>70. Jahrestagung der Deutschen Gesellschaft f&#252;r Medizinische Informatik, Biometrie und Epidemiologie e. V. (GMDS)</MeetingName>
        <MeetingTitle></MeetingTitle>
        <MeetingSession>PS 11: Wissens- und Prozessmanagement</MeetingSession>
        <MeetingCity>Jena</MeetingCity>
        <MeetingDate>
          <DateFrom>20250907</DateFrom>
          <DateTo>20250911</DateTo>
        </MeetingDate>
      </Meeting>
    </SourceGroup>
    <ArticleNo>Abstr. 214</ArticleNo>
  </MetaData>
  <OrigData>
    <TextBlock name="Text" linked="yes">
      <MainHeadline>Text</MainHeadline><Pgraph><Mark1>Introduction:</Mark1> Premedication in anesthesia requires clinicians to follow an evolving set of clinical guidelines. These documents are often lengthy and stored across multiple documents, making quick access to relevant information during clinical workflows challenging. Existing retrieval-augmented generation (RAG) systems using large language models provide a promising foundation for intelligent document querying <TextLink reference="1"></TextLink>. However, standard methods for splitting documents into search units may not be well-suited for the structure and complexity of clinical guidelines. While small chunks can improve retrieval precision, they often lack the broader context required for coherent and reliable answers <TextLink reference="2"></TextLink>. To address these limitations, we introduce NicerSlicer <TextLink reference="3"></TextLink> to slice large documents into semantically coherent sections. We also present MedQueryGuide <TextLink reference="4"></TextLink>, an interactive frontend for intelligent clinical guideline search. </Pgraph><Pgraph><Mark1>Methods:</Mark1> NicerSlicer generates section splits, which users can refine by discarding, joining, splitting or adjusting sections. The sections can be downloaded and integrated into RAG pipelines. MedQueryGuide is an interactive frontend for RAG-based question answering, featuring: </Pgraph><Pgraph><OrderedList><ListItem level="1" levelPosition="1" numString="1.">a vector store with metadata filtering for targeted search across multiple documents,</ListItem><ListItem level="1" levelPosition="2" numString="2.">a recursive retriever returning small content units along with their broader context sections to support more informative answers,</ListItem><ListItem level="1" levelPosition="3" numString="3.">a user feedback function (&#8220;helpful&#8221; vs. &#8220;not helpful&#8221;) to iteratively improve search quality and content relevance. </ListItem></OrderedList></Pgraph><Pgraph>We quantitatively evaluated the RAG pipeline using 100 automatically generated question answer pairs derived from four clinical guidelines (127 pages). Of these, 70 questions required information from a single section (single-hop), while 30 involved reasoning across two distinct sections (multi-hop). Retrieval is evaluated by using  the hit rate and mean reciprocal rank (MRR), while the answer quality was evaluated against reference answers using BERTScore <TextLink reference="5"></TextLink>. Additionally, one anesthetist assessed 10 real-world questions in MedQueryGuide using its feedback system to explore whether autogenerated evaluation aligns with real-world scenarios. </Pgraph><Pgraph><Mark1>Results:</Mark1> For single-hop questions we achieved a hit rate of 0.87 and a MRR of 0.82. BERTScore of 0.79 indicates high degree of semantic similarity with reference answers. Our approach achieved a hit rate of 0.92 for at least one of the documents for multi-hop questions, however, when considering both reference documents the hit rate dropped to 0.54. Moreover, the BERTScore decreased to 0.75. This decline is reflected in the real-world evaluation: all five simple queries led to helpful documents and answers, while the five more complex or vague queries produced less relevant retrievals and unhelpful answers. Of 20 documents retrieved for five complex queries, only 10 were rated as helpful by the physician. </Pgraph><Pgraph><Mark1>Discussion:</Mark1> A key challenge lies in working with PDFs, common extraction methods often fall short and even state of the art visual language models can introduce subtle errors. The real-world evaluation, though limited in size, reflected the performance gap between simple and complex queries. As a next step, we plan to fine-tune retrieval using synthetic data to improve performance on complex queries.</Pgraph><Pgraph><Mark1>Conclusion:</Mark1> Our results demonstrate the importance of context-aware retrieval and flexible document segmentation when building intelligent search systems for clinical guidelines. Tools like NicerSlicer and MedQueryGuide show that tailored solutions can meaningfully support clinical workflows.</Pgraph><Pgraph>The authors declare that they have no competing interests.</Pgraph><Pgraph>The authors declare that an ethics committee vote is not required.</Pgraph></TextBlock>
    <References linked="yes">
      <Reference refNo="1">
        <RefAuthor>Ng KKY</RefAuthor>
        <RefAuthor>Matsuba I</RefAuthor>
        <RefAuthor>Zhang PC</RefAuthor>
        <RefTitle>RAG in Health Care: A Novel Framework for Improving Communication and Decision-Making by Addressing LLM Limitations</RefTitle>
        <RefYear>2025</RefYear>
        <RefJournal>NEJM AI</RefJournal>
        <RefPage>AIra2400380</RefPage>
        <RefTotal>Ng KKY, Matsuba I, Zhang PC. RAG in Health Care: A Novel Framework for Improving Communication and Decision-Making by Addressing LLM Limitations. NEJM AI. 2025 Jan;2(1):AIra2400380.</RefTotal>
      </Reference>
      <Reference refNo="2">
        <RefAuthor>Bhat SR</RefAuthor>
        <RefAuthor>Rudat M</RefAuthor>
        <RefAuthor>Spiekermann J</RefAuthor>
        <RefAuthor>Flores-Herr N</RefAuthor>
        <RefTitle>Rethinking Chunk Size For Long-Document Retrieval: A Multi-Dataset Analysis &#91;Preprint&#93;</RefTitle>
        <RefYear>2025</RefYear>
        <RefJournal>arXiv</RefJournal>
        <RefPage></RefPage>
        <RefTotal>Bhat SR, Rudat M, Spiekermann J, Flores-Herr N. Rethinking Chunk Size For Long-Document Retrieval: A Multi-Dataset Analysis &#91;Preprint&#93;. arXiv. 2025. DOI: 10.48550&#47;arXiv.2505.21700</RefTotal>
        <RefLink>http:&#47;&#47;dx.doi.org&#47;10.48550&#47;arXiv.2505.21700</RefLink>
      </Reference>
      <Reference refNo="3">
        <RefAuthor>Anonym</RefAuthor>
        <RefTitle></RefTitle>
        <RefYear></RefYear>
        <RefBookTitle>UKEIAM&#47;NicerSlicer: Repository to create nicely sliced PDFs for your RAG</RefBookTitle>
        <RefPage></RefPage>
        <RefTotal>UKEIAM&#47;NicerSlicer: Repository to create nicely sliced PDFs for your RAG. GitHub; &#91;cited 2025 Jun 20&#93;. Available from: https:&#47;&#47;github.com&#47;UKEIAM&#47;NicerSlicer&#47;tree&#47;main</RefTotal>
        <RefLink>https:&#47;&#47;github.com&#47;UKEIAM&#47;NicerSlicer&#47;tree&#47;main</RefLink>
      </Reference>
      <Reference refNo="4">
        <RefAuthor>Anonym</RefAuthor>
        <RefTitle></RefTitle>
        <RefYear></RefYear>
        <RefBookTitle>IAMspiegel&#47;MedQueryGuide: RAG application for medical guidelines</RefBookTitle>
        <RefPage></RefPage>
        <RefTotal>IAMspiegel&#47;MedQueryGuide: RAG application for medical guidelines. GitHub; &#91;cited 2025 Jun 20&#93;. Available from: https:&#47;&#47;github.com&#47;IAMspiegel&#47;MedQueryGuide</RefTotal>
        <RefLink>https:&#47;&#47;github.com&#47;IAMspiegel&#47;MedQueryGuide</RefLink>
      </Reference>
      <Reference refNo="5">
        <RefAuthor>Zhang T</RefAuthor>
        <RefAuthor>Kishore V</RefAuthor>
        <RefAuthor>Wu F</RefAuthor>
        <RefAuthor>Weinberger KQ</RefAuthor>
        <RefAuthor>Artzi Y</RefAuthor>
        <RefTitle>BERTScore: Evaluating Text Generation with BERT</RefTitle>
        <RefYear></RefYear>
        <RefBookTitle>International Conference on Learning Representations (ICLR) 2020</RefBookTitle>
        <RefPage></RefPage>
        <RefTotal>Zhang T, Kishore V, Wu F, Weinberger KQ, Artzi Y. BERTScore: Evaluating Text Generation with BERT. In: International Conference on Learning Representations (ICLR) 2020. Available from: https:&#47;&#47;openreview.net&#47;forum&#63;id&#61;SkeHuCVFDr</RefTotal>
        <RefLink>https:&#47;&#47;openreview.net&#47;forum&#63;id&#61;SkeHuCVFDr</RefLink>
      </Reference>
    </References>
    <Media>
      <Tables>
        <NoOfTables>0</NoOfTables>
      </Tables>
      <Figures>
        <NoOfPictures>0</NoOfPictures>
      </Figures>
      <InlineFigures>
        <NoOfPictures>0</NoOfPictures>
      </InlineFigures>
      <Attachments>
        <NoOfAttachments>0</NoOfAttachments>
      </Attachments>
    </Media>
  </OrigData>
</GmsArticle>