
<!--
  OpenAIRE metadata record (schema hint: repo-lit 4.0 openaire.xsd) for the
  journal article identified by https://phaidra.vetmeduni.ac.at/o:5089.
  Unprefixed elements belong to the default (oaire) namespace declared on
  the root; unprefixed attributes are in no namespace.
-->
<resource
    xmlns:rdf="http://www.w3.org/1999/02/22-rdf-syntax-ns#"
    xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
    xmlns:dc="http://purl.org/dc/elements/1.1/"
    xmlns:dcterms="http://purl.org/dc/terms/"
    xmlns:datacite="http://datacite.org/schema/kernel-4"
    xmlns="http://namespace.openaire.eu/schema/oaire/"
    xsi:schemaLocation="http://namespace.openaire.eu/schema/oaire/ https://www.openaire.eu/schema/repo-lit/4.0/openaire.xsd">

  <!-- Primary identifier and title -->
  <datacite:identifier identifierType="URL">https://phaidra.vetmeduni.ac.at/o:5089</datacite:identifier>
  <datacite:titles>
    <datacite:title xml:lang="en">Beyond accuracy: Quantifying the reliability of multiple instance learning for whole slide image classification</datacite:title>
  </datacite:titles>

  <!-- Creators, in the order given by the record; ORCID and affiliation appear only where the record supplies them -->
  <datacite:creators>
    <datacite:creator>
      <datacite:creatorName nameType="Personal">Keshvarikhojasteh, Hassan</datacite:creatorName>
      <datacite:givenName>Hassan</datacite:givenName>
      <datacite:familyName>Keshvarikhojasteh</datacite:familyName>
      <datacite:nameIdentifier nameIdentifierScheme="ORCID" schemeURI="https://orcid.org/">0000-0002-5025-0468</datacite:nameIdentifier>
    </datacite:creator>
    <datacite:creator>
      <datacite:creatorName nameType="Personal">Aubreville, Marc</datacite:creatorName>
      <datacite:givenName>Marc</datacite:givenName>
      <datacite:familyName>Aubreville</datacite:familyName>
    </datacite:creator>
    <datacite:creator>
      <datacite:creatorName nameType="Personal">Bertram, Christof A.</datacite:creatorName>
      <datacite:givenName>Christof A.</datacite:givenName>
      <datacite:familyName>Bertram</datacite:familyName>
      <datacite:nameIdentifier nameIdentifierScheme="ORCID" schemeURI="https://orcid.org/">0000-0002-2402-9997</datacite:nameIdentifier>
      <datacite:affiliation>University of Veterinary Medicine Vienna</datacite:affiliation>
    </datacite:creator>
    <datacite:creator>
      <datacite:creatorName nameType="Personal">Pluim, Josien P. W.</datacite:creatorName>
      <datacite:givenName>Josien P. W.</datacite:givenName>
      <datacite:familyName>Pluim</datacite:familyName>
    </datacite:creator>
    <datacite:creator>
      <datacite:creatorName nameType="Personal">Veta, Mitko</datacite:creatorName>
      <datacite:givenName>Mitko</datacite:givenName>
      <datacite:familyName>Veta</datacite:familyName>
    </datacite:creator>
  </datacite:creators>

  <!-- Publisher, resource type, access rights and language -->
  <dc:publisher>Public Library of Science</dc:publisher>
  <resourceType resourceTypeGeneral="literature" uri="http://purl.org/coar/resource_type/c_6501">journal article</resourceType>
  <datacite:rights rightsURI="http://purl.org/coar/access_right/c_abf2">open access</datacite:rights>
  <dc:language>eng</dc:language>

  <!-- Abstract: kept on a single line so that no indentation whitespace leaks into the text value -->
  <dc:description xml:lang="en">Machine learning models have become integral to many fields, but their reliability, defined as producing dependable, trustworthy, and domain-consistent predictions, remains a critical concern. Multiple Instance Learning (MIL) models designed for Whole Slide Image (WSI) classification in computational pathology are rarely evaluated in terms of reliability, leaving a key gap in understanding their suitability for high-stakes applications like clinical decision-making. In this paper, we address this gap by introducing three quantitative metrics for reliability assessment and applying them to several widely used MIL architectures across three region-wise annotated pathology datasets. Our findings indicate that the mean pooling instance (MEAN-POOL-INS) model demonstrates superior reliability compared to other networks, despite its simple architectural design and computational efficiency. These findings underscore the need of reliability evaluation alongside predictive performance in MIL models and establish MEAN-POOL-INS as a strong, trustworthy baseline for future research.</dc:description>

  <!-- Subject keywords -->
  <datacite:subjects>
    <datacite:subject xml:lang="en">Machine Learning</datacite:subject>
    <datacite:subject xml:lang="en">Cancers And Neoplasms</datacite:subject>
    <datacite:subject xml:lang="en">Sequence Alignment</datacite:subject>
    <datacite:subject xml:lang="en">Breast Cancer</datacite:subject>
    <datacite:subject xml:lang="en">Tissue Distribution</datacite:subject>
    <datacite:subject xml:lang="en">Genome Annotation</datacite:subject>
    <datacite:subject xml:lang="en">Reliability</datacite:subject>
    <datacite:subject xml:lang="en">Learning Curves</datacite:subject>
  </datacite:subjects>

  <!-- Licence and full-text file location -->
  <licenseCondition uri="http://creativecommons.org/licenses/by/4.0/">http://creativecommons.org/licenses/by/4.0/</licenseCondition>
  <file accessRightsURI="http://purl.org/coar/access_right/c_abf2" mimeType="application/pdf" objectType="fulltext">https://phaidra.vetmeduni.ac.at/api/object/o:5089/download</file>

  <!-- Alternate (DOI) and related identifiers -->
  <datacite:alternateIdentifiers>
    <datacite:alternateIdentifier alternateIdentifierType="DOI">10.1371/journal.pone.0337261</datacite:alternateIdentifier>
  </datacite:alternateIdentifiers>
  <datacite:relatedIdentifiers>
    <datacite:relatedIdentifier relatedIdentifierType="URL" relationType="IsPartOf">https://phaidra.vetmeduni.ac.at/o:605</datacite:relatedIdentifier>
  </datacite:relatedIdentifiers>

  <!-- Format, source journal, version and citation details -->
  <dc:format>application/pdf</dc:format>
  <dc:source xml:lang="en">PLOS One</dc:source>
  <dc:source>issn:1932-6203</dc:source>
  <version uri="http://purl.org/coar/version/c_970fb48d4fbd8a85">VoR</version>
  <citationTitle>PLOS One</citationTitle>
  <citationVolume>20</citationVolume>
  <citationIssue>12</citationIssue>

  <!-- File size and dates -->
  <datacite:sizes>
    <datacite:size>13.16 MB</datacite:size>
  </datacite:sizes>
  <datacite:dates>
    <datacite:date dateType="Issued">2025</datacite:date>
  </datacite:dates>

</resource>


