<?xml version="1.0" encoding="iso-8859-1" standalone="no"?>
<!DOCTYPE GmsArticle SYSTEM "http://www.egms.de/dtd/2.0.34/GmsArticle.dtd">
<GmsArticle xmlns:xlink="http://www.w3.org/1999/xlink">
  <MetaData>
    <Identifier>25dkou245</Identifier>
    <IdentifierDoi>10.3205/25dkou245</IdentifierDoi>
    <IdentifierUrn>urn:nbn:de:0183-25dkou2451</IdentifierUrn>
    <ArticleType>Meeting Abstract</ArticleType>
    <TitleGroup>
      <Title language="en">Deep learning bone tumor entity classification model collapses under real-world distribution shifts</Title>
    </TitleGroup>
    <CreatorList>
      <Creator>
        <PersonNames>
          <Lastname>Curto Vilalta</Lastname>
          <LastnameHeading>Curto Vilalta</LastnameHeading>
          <Firstname>Anna</Firstname>
          <Initials>A</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Technical University of Munich, Munich, Deutschland</Affiliation>
          <Affiliation>Klinikum rechts der Isar, Munich, Deutschland</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="yes">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>del Val Guardiola</Lastname>
          <LastnameHeading>del Val Guardiola</LastnameHeading>
          <Firstname>Ines</Firstname>
          <Initials>I</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Technical University of Munich, Munich, Deutschland</Affiliation>
          <Affiliation>Klinikum rechts der Isar, Munich, Deutschland</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>von Eisenhart-Rothe</Lastname>
          <LastnameHeading>von Eisenhart-Rothe</LastnameHeading>
          <Firstname>R&#252;diger</Firstname>
          <Initials>R</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Klinikum rechts der Isar, Munich, Deutschland</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Consalvo</Lastname>
          <LastnameHeading>Consalvo</LastnameHeading>
          <Firstname>Sarah</Firstname>
          <Initials>S</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Klinikum rechts der Isar, Munich, Deutschland</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Rueckert</Lastname>
          <LastnameHeading>Rueckert</LastnameHeading>
          <Firstname>Daniel</Firstname>
          <Initials>D</Initials>
        </PersonNames>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Hardes</Lastname>
          <LastnameHeading>Hardes</LastnameHeading>
          <Firstname>Jendrik</Firstname>
          <Initials>J</Initials>
        </PersonNames>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
      <Creator>
        <PersonNames>
          <Lastname>Hinterwimmer</Lastname>
          <LastnameHeading>Hinterwimmer</LastnameHeading>
          <Firstname>Florian</Firstname>
          <Initials>F</Initials>
        </PersonNames>
        <Address>
          <Affiliation>Technical University of Munich, Munich, Deutschland</Affiliation>
          <Affiliation>Klinikum rechts der Isar, Munich, Deutschland</Affiliation>
        </Address>
        <Creatorrole corresponding="no" presenting="no">author</Creatorrole>
      </Creator>
    </CreatorList>
    <PublisherList>
      <Publisher>
        <Corporation>
          <Corporatename>German Medical Science GMS Publishing House</Corporatename>
        </Corporation>
        <Address>D&#252;sseldorf</Address>
      </Publisher>
    </PublisherList>
    <SubjectGroup>
      <SubjectheadingDDB>610</SubjectheadingDDB>
    </SubjectGroup>
    <DatePublishedList>
      <DatePublished>20251031</DatePublished>
    </DatePublishedList>
    <Language>engl</Language>
    <License license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
      <AltText language="en">This is an Open Access article distributed under the terms of the Creative Commons Attribution 4.0 License.</AltText>
      <AltText language="de">Dieser Artikel ist ein Open-Access-Artikel und steht unter den Lizenzbedingungen der Creative Commons Attribution 4.0 License (Namensnennung).</AltText>
    </License>
    <SourceGroup>
      <Meeting>
        <MeetingId>M0634</MeetingId>
        <MeetingSequence>245</MeetingSequence>
        <MeetingCorporation>Deutsche Gesellschaft f&#252;r Orthop&#228;die und Unfallchirurgie</MeetingCorporation>
        <MeetingCorporation>Deutsche Gesellschaft f&#252;r Orthop&#228;die und Orthop&#228;dische Chirurgie</MeetingCorporation>
        <MeetingCorporation>Deutsche Gesellschaft f&#252;r Unfallchirurgie</MeetingCorporation>
        <MeetingCorporation>Berufsverband f&#252;r Orthop&#228;die und Unfallchirurgie</MeetingCorporation>
        <MeetingName></MeetingName>
        <MeetingTitle>Deutscher Kongress f&#252;r Orthop&#228;die und Unfallchirurgie (DKOU 2025)</MeetingTitle>
        <MeetingSession>Grundlagenforschung &#124; Osteoarthrose 2</MeetingSession>
        <MeetingCity>Berlin</MeetingCity>
        <MeetingDate>
          <DateFrom>20251028</DateFrom>
          <DateTo>20251031</DateTo>
        </MeetingDate>
      </Meeting>
    </SourceGroup>
    <ArticleNo>AB35-4055</ArticleNo>
  </MetaData>
  <OrigData>
    <TextBlock name="Text" linked="yes">
      <MainHeadline>Text</MainHeadline><Pgraph><Mark1>Objectives and questions: </Mark1>Artificial intelligence (AI) models have demonstrated significant potential in classifying bone tumors. However, their clinical adoption remains limited due to poor generalizability across different healthcare centers. This study aims to assess the impact of training AI models on single-center data and evaluate their performance on datasets with distribution shifts caused by variations in imaging centers, scanners, and acquisition conditions.</Pgraph><Pgraph><Mark1>Material and methods: </Mark1>This retrospective study included x-rays from 635 patients diagnosed with Enchondroma or Atypical Cartilaginous Tumor (ACT). We used a pre-trained Vision Transformer to fine-tune it to classify bone tumor entities. A weighted cross-entropy loss function was applied to avoid a bias towards the majority class (enchondroma).</Pgraph><Pgraph>To assess model robustness, we simulated real-world distribution shifts. We introduced three perturbation scenarios to the test set: (1) sensor noise, modeled by adding Gaussian noise; (2) reduced image quality, simulated via image blurring; and (3) variations in acquisition settings, mimicked by modifying brightness and contrast. Model performance was evaluated on test dataset using classification metrics, including accuracy, sensitivity, and specificity. For sensitivity and specificity calculations, we considered Enchondroma as the negative class and ACT as the positive class.</Pgraph><Pgraph><Mark1>Results: </Mark1>As shown in Table 1 <ImgLink imgNo="1" imgType="table" />, the model achieved an overall accuracy of 77&#37;, with a sensitivity of 45.5&#37; and a specificity of 89.3&#37; on the test set. These results highlight the model&#8217;s difficulty in improving sensitivity for the minority class (ACT) due to the class imbalance.</Pgraph><Pgraph>When evaluating model robustness on the modified test set, simulating real-world distribution shifts, the model&#8217;s ability to balance sensitivity across classes collapsed. Under these conditions, sensitivity for ACT dropped to 0&#37;, while Enchondroma classification reached 100&#37;, indicating that the model classified all cases as Enchondroma.</Pgraph><Pgraph><Mark1>Discussion and conclusions: </Mark1>Our results highlight the challenges of AI bias in bone tumor classification, with models trained on single-center data failing even under very small distribution shifts (Figure 1 <ImgLink imgNo="1" imgType="figure" />). The strong reliance on dataset-specific features raises concerns about their reliability in broader clinical settings. To improve robustness and generalizability, multi-center data sharing is essential for developing accurate AI-based diagnostic tools.</Pgraph></TextBlock>
    <Media>
      <Tables>
        <Table format="png">
          <MediaNo>1</MediaNo>
          <MediaID>1</MediaID>
          <Caption><Pgraph><Mark1>Table 1: Model performance on the original and modified test datasets.</Mark1></Pgraph></Caption>
        </Table>
        <NoOfTables>1</NoOfTables>
      </Tables>
      <Figures>
        <Figure width="715" height="246" format="png">
          <MediaNo>1</MediaNo>
          <MediaID>1</MediaID>
          <Caption><Pgraph><Mark1>Figure 1</Mark1></Pgraph></Caption>
        </Figure>
        <NoOfPictures>1</NoOfPictures>
      </Figures>
      <InlineFigures>
        <NoOfPictures>0</NoOfPictures>
      </InlineFigures>
      <Attachments>
        <NoOfAttachments>0</NoOfAttachments>
      </Attachments>
    </Media>
  </OrigData>
</GmsArticle>