<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.3" xml:lang="en">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">diagnostics</journal-id>
      <journal-title-group>
        <journal-title>Diagnostics</journal-title>
        <abbrev-journal-title abbrev-type="publisher">Diagnostics</abbrev-journal-title>
        <abbrev-journal-title abbrev-type="pubmed">Diagnostics</abbrev-journal-title>
      </journal-title-group>
      <issn pub-type="epub">2075-4418</issn>
      <publisher>
        <publisher-name>MDPI</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.3390/diagnostics14100997</article-id>
      <article-id pub-id-type="publisher-id">diagnostics-14-00997</article-id>
      <article-version vocab="JAV" vocab-identifier="https://www.mdpi.com/2075-4418/14/10/997/pdf" vocab-term="Version of Record" article-version-type="VoR">v2</article-version>
      <article-categories>
        <subj-group>
          <subject>Article</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>IMPA-Net: Interpretable Multi-Part Attention Network for Trustworthy Brain Tumor Classification from MRI</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <name>
            <surname>Xie</surname>
            <given-names>Yuting</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Data curation" vocab-term-identifier="https://credit.niso.org/contributor-roles/data-curation/">Data curation</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing – original draft" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-original-draft/">Writing – original draft</role>
          <xref rid="af1-diagnostics-14-00997" ref-type="aff">1</xref>
          <xref rid="af2-diagnostics-14-00997" ref-type="aff">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Zaccagna</surname>
            <given-names>Fulvio</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing – review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
          <xref rid="af3-diagnostics-14-00997" ref-type="aff">3</xref>
          <xref rid="af4-diagnostics-14-00997" ref-type="aff">4</xref>
        </contrib>
        <contrib contrib-type="author">
          <contrib-id contrib-id-type="orcid" authenticated="true">https://orcid.org/0000-0003-3341-5483</contrib-id>
          <name>
            <surname>Rundo</surname>
            <given-names>Leonardo</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing – review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
          <xref rid="af5-diagnostics-14-00997" ref-type="aff">5</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Testa</surname>
            <given-names>Claudia</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing – review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
          <xref rid="af6-diagnostics-14-00997" ref-type="aff">6</xref>
          <xref rid="af7-diagnostics-14-00997" ref-type="aff">7</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Zhu</surname>
            <given-names>Ruifeng</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Methodology" vocab-term-identifier="https://credit.niso.org/contributor-roles/methodology/">Methodology</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Software" vocab-term-identifier="https://credit.niso.org/contributor-roles/software/">Software</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
          <xref rid="af8-diagnostics-14-00997" ref-type="aff">8</xref>
        </contrib>
        <contrib contrib-type="author">
          <contrib-id contrib-id-type="orcid" authenticated="true">https://orcid.org/0000-0002-0506-499X</contrib-id>
          <name>
            <surname>Tonon</surname>
            <given-names>Caterina</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing – review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
          <xref rid="af1-diagnostics-14-00997" ref-type="aff">1</xref>
          <xref rid="af2-diagnostics-14-00997" ref-type="aff">2</xref>
        </contrib>
        <contrib contrib-type="author">
          <name>
            <surname>Lodi</surname>
            <given-names>Raffaele</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Resources" vocab-term-identifier="https://credit.niso.org/contributor-roles/resources/">Resources</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Funding acquisition" vocab-term-identifier="https://credit.niso.org/contributor-roles/funding-acquisition/">Funding acquisition</role>
          <xref rid="af1-diagnostics-14-00997" ref-type="aff">1</xref>
          <xref rid="af2-diagnostics-14-00997" ref-type="aff">2</xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <contrib-id contrib-id-type="orcid" authenticated="true">https://orcid.org/0000-0002-2404-1101</contrib-id>
          <name>
            <surname>Manners</surname>
            <given-names>David Neil</given-names>
          </name>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Conceptualization" vocab-term-identifier="https://credit.niso.org/contributor-roles/conceptualization/">Conceptualization</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Formal analysis" vocab-term-identifier="https://credit.niso.org/contributor-roles/formal-analysis/">Formal analysis</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Investigation" vocab-term-identifier="https://credit.niso.org/contributor-roles/investigation/">Investigation</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Writing – review &amp; editing" vocab-term-identifier="https://credit.niso.org/contributor-roles/writing-review-editing/">Writing – review &amp; editing</role>
          <role vocab="credit" vocab-identifier="https://credit.niso.org/" vocab-term="Supervision" vocab-term-identifier="https://credit.niso.org/contributor-roles/supervision/">Supervision</role>
          <xref rid="af2-diagnostics-14-00997" ref-type="aff">2</xref>
          <xref rid="af9-diagnostics-14-00997" ref-type="aff">9</xref>
          <xref rid="c1-diagnostics-14-00997" ref-type="corresp">*</xref>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mustafa</surname>
            <given-names>Wan Azani</given-names>
          </name>
          <role>Academic Editor</role>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Alquran</surname>
            <given-names>Hiam</given-names>
          </name>
          <role>Academic Editor</role>
        </contrib>
      </contrib-group>
      <aff id="af1-diagnostics-14-00997"><label>1</label>Department of Biomedical and Neuromotor Sciences, University of Bologna, 40126 Bologna, Italy; <email>yuting.xie2@unibo.it</email> (Y.X.); <email>caterina.tonon@unibo.it</email> (C.T.); <email>raffaele.lodi@unibo.it</email> (R.L.)</aff>
      <aff id="af2-diagnostics-14-00997"><label>2</label>Functional and Molecular Neuroimaging Unit, IRCCS Istituto delle Scienze Neurologiche di Bologna, Bellaria Hospital, 40139 Bologna, Italy</aff>
      <aff id="af3-diagnostics-14-00997"><label>3</label>Department of Imaging, Cambridge University Hospitals NHS Foundation Trust, Cambridge Biomedical Campus, Cambridge CB2 0SL, UK; <email>fz247@cam.ac.uk</email></aff>
      <aff id="af4-diagnostics-14-00997"><label>4</label>Department of Radiology, University of Cambridge, Cambridge CB2 0QQ, UK</aff>
      <aff id="af5-diagnostics-14-00997"><label>5</label>Department of Information and Electrical Engineering and Applied Mathematics, University of Salerno, 84084 Fisciano, Italy; <email>lrundo@unisa.it</email></aff>
      <aff id="af6-diagnostics-14-00997"><label>6</label>INFN Bologna Division, Viale C. Berti Pichat, 6/2, 40127 Bologna, Italy</aff>
      <aff id="af7-diagnostics-14-00997"><label>7</label>Department of Physics and Astronomy, University of Bologna, 40127 Bologna, Italy</aff>
      <aff id="af8-diagnostics-14-00997"><label>8</label>Department of Engineering “Enzo Ferrari”, University of Modena and Reggio Emilia, 41125 Modena, Italy; <email>reefing.z@gmail.com</email></aff>
      <aff id="af9-diagnostics-14-00997"><label>9</label>Department for Life Quality Studies, University of Bologna, 40126 Bologna, Italy</aff>
      <author-notes>
        <corresp id="c1-diagnostics-14-00997"><label>*</label>Correspondence: <email>davidneil.manners@unibo.it</email></corresp>
      </author-notes>
      <pub-date pub-type="epub">
        <day>11</day>
        <month>05</month>
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="collection">
        <month>05</month>
        <year>2024</year>
      </pub-date>
      <volume>14</volume>
      <issue>10</issue>
      <elocation-id>997</elocation-id>
      <history>
        <date date-type="received">
          <day>18</day>
          <month>04</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>08</day>
          <month>05</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>09</day>
          <month>05</month>
          <year>2024</year>
        </date>
      </history>
      <permissions>
        <copyright-statement>© 2024 by the authors.</copyright-statement>
        <copyright-year>2024</copyright-year>
        <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>Licensee MDPI, Basel, Switzerland. This article is an open access article distributed under the terms and conditions of the Creative Commons Attribution (CC BY) license (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>).</license-p>
        </license>
      </permissions>
      <abstract>
        <p>Deep learning (DL) networks have shown attractive performance in medical image processing tasks such as brain tumor classification. However, they are often criticized as mysterious “black boxes”. The opaqueness of the model and the reasoning process make it difficult for health workers to decide whether to trust the prediction outcomes. In this study, we develop an interpretable multi-part attention network (IMPA-Net) for brain tumor classification to enhance the interpretability and trustworthiness of classification outcomes. The proposed model not only predicts the tumor grade but also provides a global explanation for the model interpretability and a local explanation as justification for the proffered prediction. Global explanation is represented as a group of feature patterns that the model learns to distinguish high-grade glioma (HGG) and low-grade glioma (LGG) classes. Local explanation interprets the reasoning process of an individual prediction by calculating the similarity between the prototypical parts of the image and a group of pre-learned task-related features. Experiments conducted on the BraTS2017 dataset demonstrate that IMPA-Net is a verifiable model for the classification task. A percentage of 86% of feature patterns were assessed by two radiologists to be valid for representing task-relevant medical features. The model shows a classification accuracy of 92.12%, of which 81.17% were evaluated as trustworthy based on local explanations. Our interpretable model is a trustworthy model that can be used for decision aids for glioma classification. Compared with black-box CNNs, it allows health workers and patients to understand the reasoning process and trust the prediction outcomes.</p>
      </abstract>
      <kwd-group>
        <kwd>decision support</kwd>
        <kwd>interpretability</kwd>
        <kwd>trustworthiness</kwd>
        <kwd>deep neural networks</kwd>
        <kwd>brain tumor classification</kwd>
        <kwd>multi-part attention</kwd>
      </kwd-group>
      <funding-group>
        <award-group>
          <funding-source>China Scholarship Council</funding-source>
          <award-id>202008320283</award-id>
        </award-group>
        <award-group>
          <funding-source>Italian Ministry of Health</funding-source>
        </award-group>
        <funding-statement>The research was funded by the China Scholarship Council (grant number: 202008320283). The publication of this article was supported by the “Ricerca Corrente” funding from the Italian Ministry of Health.</funding-statement>
      </funding-group>
    </article-meta>
  </front>
  <body>
    <sec id="sec1-diagnostics-14-00997" sec-type="intro">
      <title>1. Introduction</title>
      <p>Brain cancer is one of the ten leading causes of death globally among men and women [<xref ref-type="bibr" rid="B1-diagnostics-14-00997">1</xref>,<xref ref-type="bibr" rid="B2-diagnostics-14-00997">2</xref>]. The World Health Organization estimates the 5-year survival rate is only 21% for people aged 40 and over [<xref ref-type="bibr" rid="B2-diagnostics-14-00997">2</xref>]. In most clinical scenarios, LGGs are well-differentiated, slow-growing lesions, while HGGs are usually aggressive with dismal prognosis [<xref ref-type="bibr" rid="B3-diagnostics-14-00997">3</xref>,<xref ref-type="bibr" rid="B4-diagnostics-14-00997">4</xref>]. Survival rates differ markedly for different tumor grades. Identifying tumor grade at an early stage is a major unmet need; it contributes to formulating better treatment strategies and enhances the overall quality of life of patients.</p>
      <p>Magnetic resonance (MR) imaging is a non-invasive technique that remains the standard of care for brain tumor diagnosis and treatment planning in clinical practice [<xref ref-type="bibr" rid="B5-diagnostics-14-00997">5</xref>,<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>]. It provides a reasonably good delineation of the gliomas and conveys biological information on the tumor location, size, necrosis, edema tissue, the mass effect, and breakdown of the blood–brain barrier (which results in contrast enhancement in post-contrast-enhanced T<sub>1</sub>-weighted (ceT<sub>1</sub>w) MR images) [<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>]. In general, LGGs are less invasive. They usually have well-defined boundaries and homogeneous tumor cores without prominent mitosis, necrosis, and microvascular proliferation [<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>,<xref ref-type="bibr" rid="B7-diagnostics-14-00997">7</xref>,<xref ref-type="bibr" rid="B8-diagnostics-14-00997">8</xref>,<xref ref-type="bibr" rid="B9-diagnostics-14-00997">9</xref>]. HGGs always show more mass effect. They usually show microscopic peritumoral white matter tract invasion. The demonstration of this diffuse infiltration is an important discriminating feature for the accurate glioma diagnosis [<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>].</p>
      <p>Diagnosis of brain tumors from MR images is a time-consuming and challenging task that requires professional knowledge and careful observation. As alternatives, various automated diagnosis approaches have been developed to assist radiologists in the interpretation of the brain MR images and reduce the likelihood of misdiagnosis. Convolutional neural networks (CNNs) provide a powerful technology for medical data analysis [<xref ref-type="bibr" rid="B10-diagnostics-14-00997">10</xref>]. CNN-based deep learning architectures can extract important low-level and high-level features automatically from the given training dataset of sufficient variety and quality [<xref ref-type="bibr" rid="B11-diagnostics-14-00997">11</xref>]; they embed the phase of feature extraction and classification into a self-learning procedure, allowing fully automatic classification without human interaction, which can be applied to the problem of tumor diagnosis.</p>
      <p>Over the last decade, methods using CNNs have been extensively investigated for brain tumor classification due to their outstanding performance with very high accuracy in a research context [<xref ref-type="bibr" rid="B12-diagnostics-14-00997">12</xref>,<xref ref-type="bibr" rid="B13-diagnostics-14-00997">13</xref>]. The differential classification of HGG and LGG is a comparatively simple task that has been tackled in numerous different ways using different CNN methods, and the best-performing models have demonstrated close to 100% performance [<xref ref-type="bibr" rid="B10-diagnostics-14-00997">10</xref>]. For example, Khazaee et al. [<xref ref-type="bibr" rid="B14-diagnostics-14-00997">14</xref>] used a pre-trained EfficientNetB0 for HGG and LGG classification. The model achieved a mean classification accuracy of 98.87%. Chikhalikar et al. [<xref ref-type="bibr" rid="B15-diagnostics-14-00997">15</xref>] proposed a custom CNN model to classify the type of tumor present in MRI images, achieving an accuracy of 99.46%. The authors in [<xref ref-type="bibr" rid="B16-diagnostics-14-00997">16</xref>] used transfer learning with stacking InceptionResNetV2, DenseNet121, MobileNet, Incep-tionV3, Xception, VGG16, and VGG19 for the same classification task. The average classification accuracy for the test dataset reached 98.06%. Zhuge et al. [<xref ref-type="bibr" rid="B17-diagnostics-14-00997">17</xref>] utilized a pre-trained ResNet50. The classification accuracy of the proposed model reached 96.3%.</p>
      <p>The above CNN-based methods all achieved remarkable performance on automated HGG and LGG classification. However, MR images are unlikely to be artifact-free [<xref ref-type="bibr" rid="B18-diagnostics-14-00997">18</xref>], and the lesion signal measured by MRI is typically mixed with nuisance sources. The above-mentioned black-box CNNs may learn confounding sources from MR images for decision making, and the health outcomes cannot easily gain the trust of physicians or patients because the evidence is unknown [<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>,<xref ref-type="bibr" rid="B19-diagnostics-14-00997">19</xref>].</p>
      <p>The lack of transparency and interpretability concerning the decision-making process still limits their development into clinical practice [<xref ref-type="bibr" rid="B12-diagnostics-14-00997">12</xref>,<xref ref-type="bibr" rid="B19-diagnostics-14-00997">19</xref>,<xref ref-type="bibr" rid="B20-diagnostics-14-00997">20</xref>]. Visualizing the features that are faithful to the underlying lesion is crucial to ensuring the interpretability and trustworthiness of classification outcomes. Interpretability is the ability to provide explanations in terms understandable to a human [<xref ref-type="bibr" rid="B21-diagnostics-14-00997">21</xref>], based on their domain knowledge related to the task, or common knowledge, according to the task characteristics. The need for interpretability has already been stressed by many papers [<xref ref-type="bibr" rid="B21-diagnostics-14-00997">21</xref>,<xref ref-type="bibr" rid="B22-diagnostics-14-00997">22</xref>,<xref ref-type="bibr" rid="B23-diagnostics-14-00997">23</xref>], emphasizing cases where lack of interpretability may be harmful. Can we explain why algorithms go wrong? When things go well, do we know why and how to exploit them further?</p>
      <p>In order to deploy a system in practice, it is necessary to present classification results in such a way that they are acceptable to end users. This is only possible if users trust the decision-making process, which, as a consequence, must be transparent and interpretable. To date, a limited number of saliency-based interpretable methods have suggested different frameworks to improve the interpretability and trustworthiness of CNNs for brain tumor classifications [<xref ref-type="bibr" rid="B24-diagnostics-14-00997">24</xref>,<xref ref-type="bibr" rid="B25-diagnostics-14-00997">25</xref>,<xref ref-type="bibr" rid="B26-diagnostics-14-00997">26</xref>,<xref ref-type="bibr" rid="B27-diagnostics-14-00997">27</xref>]. We divide the previous interpretable approaches into two categories: object-level methods and pixel-level/part-level methods.</p>
      <p>At the coarsest level, there are models that have been proposed to offer object-level explanations for brain tumor classification tasks, such as a class activation mapping method GradCAM [<xref ref-type="bibr" rid="B24-diagnostics-14-00997">24</xref>,<xref ref-type="bibr" rid="B25-diagnostics-14-00997">25</xref>] that highlights that entire object as the explanation behind the tumor predictions. The authors in [<xref ref-type="bibr" rid="B25-diagnostics-14-00997">25</xref>] proposed a pre-trained ResNet-50 CNN architecture to classify three posterior fossa tumors and explained the classification decision by using GradCAM. The heatmap generated by the GradCAM technique can identify the area of emphasis and help visualize where the classification model looks for individual predictions.</p>
      <p>At a finer level, there are a few interpretable techniques that have been applied to explain the brain tumor classification results with pixel-level/part-level explanations, such as pixel-level interpretable algorithms SHAP, Guided Backpropagation (GBP) [<xref ref-type="bibr" rid="B24-diagnostics-14-00997">24</xref>], and a part-level interpretable model called LIME. Authors in [<xref ref-type="bibr" rid="B27-diagnostics-14-00997">27</xref>] explained the tumor predictions made by the CNN model with SHAP and LIME methods. The SHAP algorithm explains the individual prediction by computing the contribution of each pixel on a predicted image to the prediction using Shapley values to understand what are the main pixels that affect the output of the model [<xref ref-type="bibr" rid="B28-diagnostics-14-00997">28</xref>]. The LIME algorithm is a counterfactual explanation method that approximates the classification behavior of a complex neural network using a simpler, more understandable model without exploring the model itself [<xref ref-type="bibr" rid="B29-diagnostics-14-00997">29</xref>]. In the study, the authors segmented the input image into superpixels and made small disturbances around each superpixel to figure out the contribution/importance of each superpixel to the prediction result. Another study conducted by Pereira et al. [<xref ref-type="bibr" rid="B24-diagnostics-14-00997">24</xref>] utilized GradCAM and GBP maps to provide insights into the regions that support the prediction to perform quality assessment of tumor grade prediction between HGG and LGG. The GBP is a gradient-based visualization method that can visualize which pixels in the input image are more informative for the correct classification.</p>
      <p>The above methods identify the most important pixels or objects of an image as the explanation for the prediction outcomes. To some extent, they verify the validity of the classification models. Nevertheless, it is worth stressing that knowing the most important pixels or objects of an image that determined a specific prediction does not always amount to a good-quality explanation.</p>
      <p>Ideally, networks should be able to explain the reasoning process behind each individual decision, and this process, ideally, would be similar to that used by a radiologist, who looks at specific features of the MR image relevant to the task. For example, if a doctor classifies a tumor as HGG, this decision always relies mainly on the high-level class-representative features or properties, like the tumor’s irregularity, the necrotic area, or the enhancing ring [<xref ref-type="bibr" rid="B30-diagnostics-14-00997">30</xref>].</p>
      <p>The objectives of this study were to build an interpretable multi-part attention [<xref ref-type="bibr" rid="B31-diagnostics-14-00997">31</xref>] network (IMPA-Net) for brain tumor classification to unbox the model and the reasoning process of individual predictions with understandable MR imaging features. The proposed IMPA-Net, motivated by [<xref ref-type="bibr" rid="B32-diagnostics-14-00997">32</xref>], provides both global and local explanations for brain tumor classification on MRI images. <xref ref-type="fig" rid="diagnostics-14-00997-f001">Figure 1</xref> gives a more detailed illustration of the connections and distinctions between the two explanations. The global explanation is represented by a group of feature patterns that the model learns and uses for the classification. The quality of the feature patterns can be used to evaluate the ability and reliability of the model on the classification task. The local explanation interprets the reasoning process of an individual prediction by comparing the prototypical parts of the image with feature patterns. It can be used to evaluate the trustworthiness of individual predictions.</p>
      <p>The main contribution of this paper is that it addresses the black-box problems of CNN classification models for glioma diagnosis by developing a model with the following characteristics:<list list-type="roman-lower"><list-item><label>(i)</label><p>The first multi-part interpretable model that can provide both global and local explanations for brain tumor classification, enabling better human–machine collaboration for decision aid.</p></list-item><list-item><label>(ii)</label><p>It presents the reasoning process of individual predictions to show how the model arrives at the decision making in this context, allowing health workers to evaluate the reliability of the prediction outcomes.</p></list-item><list-item><label>(iii)</label><p>It allows the prediction results to be interpreted in a clinical context.</p></list-item><list-item><label>(iv)</label><p>It highlights the most relevant information for predictions based on medical disease-related features that can be understood and interpreted by clinicians and patients.</p></list-item></list></p>
      <p>The remainder of the paper is structured as follows. <xref ref-type="sec" rid="sec3-diagnostics-14-00997">Section 3</xref> gives a detailed introduction to the dataset, the proposed interpretable multi-part attention network, and the experimental setup. Results are given in <xref ref-type="sec" rid="sec3-diagnostics-14-00997">Section 3</xref>. <xref ref-type="sec" rid="sec4-diagnostics-14-00997">Section 4</xref> evaluates the performance of the proposed method on both aspects of its classification and explanation. <xref ref-type="sec" rid="sec5-diagnostics-14-00997">Section 5</xref> concludes the key findings of this study. <xref ref-type="sec" rid="sec6-diagnostics-14-00997">Section 6</xref> concludes the proposed work and discusses the future research directions.</p>
    </sec>
    <sec id="sec2-diagnostics-14-00997">
      <title>2. Materials and Methods</title>
      <p>The overall workflow of the development and evaluation of the proposed methodology is shown in <xref ref-type="fig" rid="diagnostics-14-00997-f002">Figure 2</xref>. Input brain MRI images are firstly pre-processed by resizing, normalization, and cropping, and then three augmentation methods, including rotation, shearing, and skewing are performed to produce the training dataset. The proposed methodology classifies the input image by comparing its prototypical patches with pre-learned feature patterns of classes HGG and LGG. In this stage, feature patterns of both classes are optimized and produced. The quality of the feature patterns is evaluated in the next step on aspects of their interpretability, class representability, and correctness, and then poor-quality feature patterns are excluded in the local explanation process. In the next stage, local explanations of individual predictions are given to illustrate how the model arrives at the final decisions, and each case will be evaluated based on whether it satisfies two basic conditions identified for reliability assessment. Finally, the proposed model is evaluated on both aspects of its performance (classification and explanation), including classifier performance, global explanation evaluation, local explanation evaluation (correctness and confidence), and user evaluation.</p>
      <sec id="sec2dot1-diagnostics-14-00997">
        <title>2.1. Data and Image Processing</title>
        <p>We trained and evaluated our network on data from the BraTS 2017 database [<xref ref-type="bibr" rid="B33-diagnostics-14-00997">33</xref>,<xref ref-type="bibr" rid="B34-diagnostics-14-00997">34</xref>,<xref ref-type="bibr" rid="B35-diagnostics-14-00997">35</xref>]. The dataset contains 285 routine-acquired 3T multimodal clinical MRI scans from multiple institutions, comprising 210 patients with pathologically confirmed HGG and 75 patients with LGG. All images from the dataset were pre-processed by co-registration to the same anatomical template, interpolation to the same resolution (1 mm<sup>3</sup>), and skull stripping [<xref ref-type="bibr" rid="B33-diagnostics-14-00997">33</xref>].</p>
        <p>Slices that contain gliomas were extracted from each patient’s MRI scan. Considering the enhancing ring in post-contrast-enhanced T<sub>1</sub>-weighted (ceT<sub>1</sub>w) MR is an important discriminating feature for accurate tumor diagnosis between HGG and LGG [<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>], in our experiments, only ceT<sub>1</sub>w MR images were considered. The dataset was then partitioned into a training dataset (70%) and a testing dataset (30%). A push dataset of 60 images was randomly selected from the training dataset (30 images for each class).</p>
        <p>All images were normalized by Z-score normalization and converted to PNG format, and then the background pixels were cropped to focus feature learning on the brain areas instead of the whole image. Moreover, the images were resized to 224 × 224 to fit the model’s training configurations.</p>
      </sec>
      <sec id="sec2dot2-diagnostics-14-00997">
        <title>2.2. Data Augmentation</title>
        <p>To increase the size and variability of the training dataset, data augmentation methods were performed, including twice rotating in the axial imaging plane by a random amount between 20° left and 20° right, shearing by a random amount between 10° left and right twice in the transverse direction, and skewing by tilting the images left/right by a random amount (magnitude = 0.2) twice. In this way, the training dataset is augmented six-fold, resulting in 6228 images (3546 HGG, 2682 LGG).</p>
      </sec>
      <sec id="sec2dot3-diagnostics-14-00997">
        <title>2.3. Interpretable Convolutional Neural Network</title>
        <p><xref ref-type="fig" rid="diagnostics-14-00997-f003">Figure 3</xref> gives an overview of the proposed IMPA-Net, which consists of a feature extractor, multi-part attention (MPA), and similarity-based classifier. Images are first propagated into convolutional layers for feature extraction, with a structure selected from VGG16. In the proposed classification model, we chose VGG16 as the feature extractor as it combines simplicity, ease of implementation, and fine-tuning capability with adequate feature extraction effectiveness and generalization ability. The pre-trained VGG16 model is suitable for transfer learning or fine-tuning as a feature extractor for brain tumor classification tasks [<xref ref-type="bibr" rid="B12-diagnostics-14-00997">12</xref>]. A non-linear activation function ReLU is used for all convolutional layers. Then, these convolutional layers are followed by a multi-part attention module for similarity calculation between CNN outputs and the feature patterns pre-learned by the model. In particular, our network tries to find evidence for an image (such as the pre-processed HGG image in <xref ref-type="fig" rid="diagnostics-14-00997-f003">Figure 3</xref>) to be of class HGG by comparing its prototypical patches with learned feature patterns of class HGG and LGG, as illustrated in the similarity correlation units. This comparison produces a map of similarity scores of each feature pattern, which is upsampled and superimposed on the input image to see which part of the input image is activated by each feature pattern. The activation maps are then propagated into a max-pooling layer, producing a single similarity score for each comparison. Finally, the model classifies the input image based on the top 10 similarity scores. The output <inline-formula><mml:math id="mm1"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> denotes the weighted sum of top-10 similarity scores generated by the multi-part attention module.</p>
        <sec id="sec2dot3dot1-diagnostics-14-00997">
          <title>2.3.1. Feature Extractor</title>
          <p>The architecture consists of a regular convolutional neural network for feature extraction with a structure selected from VGG16 (kernel size <inline-formula><mml:math id="mm2"><mml:semantics><mml:mrow><mml:mn>3</mml:mn><mml:mo>×</mml:mo><mml:mn>3</mml:mn></mml:mrow></mml:semantics></mml:math></inline-formula>), followed by two additional 1 × 1 convolutional layers. All these convolutional layers (<inline-formula><mml:math id="mm3"><mml:semantics><mml:mrow><mml:mi>f</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula> use a ReLU with a non-linear activation function.</p>
          <p>For a given pre-processed input image <inline-formula><mml:math id="mm4"><mml:semantics><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> (such as the HGG sample image in <xref ref-type="fig" rid="diagnostics-14-00997-f003">Figure 3</xref>), the convolutional layers <inline-formula><mml:math id="mm5"><mml:semantics><mml:mrow><mml:mi>f</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> extract useful features from <inline-formula><mml:math id="mm6"><mml:semantics><mml:mrow><mml:mi>x</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> to use for prediction, whose output <inline-formula><mml:math id="mm7"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:mi>x</mml:mi><mml:mo>)</mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula> have spatial dimension <inline-formula><mml:math id="mm8"><mml:semantics><mml:mrow><mml:mi>D</mml:mi><mml:mo>×</mml:mo><mml:mn>7</mml:mn><mml:mo>×</mml:mo><mml:mn>7</mml:mn></mml:mrow></mml:semantics></mml:math></inline-formula>, where D is the number of the output channels of the last convolutional layer.</p>
        </sec>
        <sec id="sec2dot3dot2-diagnostics-14-00997">
          <title>2.3.2. Multi-Part Attention</title>
          <p>In our experiments, we allocated a pre-determined number of feature patterns <inline-formula><mml:math id="mm9"><mml:semantics><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>=</mml:mo><mml:msubsup><mml:mrow><mml:mfenced open="{" close="}" separators="|"><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>, <inline-formula><mml:math id="mm10"><mml:semantics><mml:mrow><mml:mi>m</mml:mi><mml:mo>=</mml:mo><mml:mn>50</mml:mn></mml:mrow></mml:semantics></mml:math></inline-formula> for each class, where <inline-formula><mml:math id="mm11"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> (<inline-formula><mml:math id="mm12"><mml:semantics><mml:mrow><mml:mi>j</mml:mi><mml:mo>∈</mml:mo><mml:mo>{</mml:mo><mml:mi mathvariant="normal">H</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mo>}</mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula>) represents the class identity of the feature pattern and <inline-formula><mml:math id="mm13"><mml:semantics><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> is the index of that feature pattern among all feature patterns of class <inline-formula><mml:math id="mm14"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula>. So that for each class, <inline-formula><mml:math id="mm15"><mml:semantics><mml:mrow><mml:mn>50</mml:mn></mml:mrow></mml:semantics></mml:math></inline-formula> feature patterns are learned and produced by the model from a push dataset. This dataset consists of a pre-determined number of MRI images that are randomly selected from the training dataset. The shape of each pattern is <inline-formula><mml:math id="mm16"><mml:semantics><mml:mrow><mml:mi>D</mml:mi><mml:mo>×</mml:mo><mml:mi>h</mml:mi><mml:mo>×</mml:mo><mml:mi>w</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula>, where <inline-formula><mml:math id="mm17"><mml:semantics><mml:mrow><mml:mi>h</mml:mi><mml:mo>×</mml:mo><mml:mi>w</mml:mi><mml:mo>&lt;</mml:mo><mml:mn>7</mml:mn><mml:mo>×</mml:mo><mml:mn>7</mml:mn></mml:mrow></mml:semantics></mml:math></inline-formula>. In our experiments, <inline-formula><mml:math id="mm18"><mml:semantics><mml:mrow><mml:mi>h</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> and <inline-formula><mml:math id="mm19"><mml:semantics><mml:mrow><mml:mi>w</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> are set to 1. The depth of each feature pattern is the same as that of <inline-formula><mml:math id="mm20"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> but the height and width are smaller than those of the <inline-formula><mml:math id="mm21"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula>, each feature pattern will be supposed to represent some representative activation pattern in a patch of the convolutional output <inline-formula><mml:math id="mm22"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula>, which in turn will correspond to some prototypical image patch in the original training image.</p>
          <p>In our network, every feature patch can be considered as a representative pattern of one image from the push dataset, and these feature patterns are supposed to direct attention to enough medical semantic content for recognizing a class [<xref ref-type="bibr" rid="B36-diagnostics-14-00997">36</xref>]. As a schematic illustration of the multi-part attention for the HGG sample image in <xref ref-type="fig" rid="diagnostics-14-00997-f003">Figure 3</xref>, the first feature pattern <inline-formula><mml:math id="mm23"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> corresponds to the necrotic tumor core of an HGG training image, and the fourth feature pattern <inline-formula><mml:math id="mm24"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mn>4</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> enhancing tumor margin of an HGG training image, and the ninth feature pattern <inline-formula><mml:math id="mm25"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mn>9</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> the edematous area of an HGG image.</p>
          <p>The similarity correlation units <inline-formula><mml:math id="mm26"><mml:semantics><mml:mrow><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> in a multi-part attention module computes the L2 distance between the CNN outputs and the feature patterns, as shown in Equation (1). The <inline-formula><mml:math id="mm27"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> similarity correlation unit <inline-formula><mml:math id="mm28"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> of class <inline-formula><mml:math id="mm29"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mo> </mml:mo><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> calculates the squared Euclidean distances between feature patterns <inline-formula><mml:math id="mm30"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> and each patch <inline-formula><mml:math id="mm31"><mml:semantics><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover></mml:mrow></mml:semantics></mml:math></inline-formula> generated from the convolutional outputs <inline-formula><mml:math id="mm32"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">c</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="bold-italic">o</mml:mi><mml:mi mathvariant="bold-italic">u</mml:mi><mml:mi mathvariant="bold-italic">t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> and then inverts the distances to similarity scores. Mathematically, the similarity correlation unit <inline-formula><mml:math id="mm33"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> calculates the following:<disp-formula id="FD1-diagnostics-14-00997"><label>(1)</label><mml:math id="mm34" display="block"><mml:semantics><mml:mrow><mml:mi>d</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mfenced open="‖" close="‖" separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>,</mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:mover accent="true"><mml:mrow><mml:mo> </mml:mo><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>∈</mml:mo><mml:mi>p</mml:mi><mml:mi>a</mml:mi><mml:mi>t</mml:mi><mml:mi>c</mml:mi><mml:mi>h</mml:mi><mml:mi>e</mml:mi><mml:mi>s</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi mathvariant="bold-italic">c</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="bold-italic">o</mml:mi><mml:mi mathvariant="bold-italic">u</mml:mi><mml:mi mathvariant="bold-italic">t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>,</mml:mo></mml:mrow></mml:semantics></mml:math></disp-formula>
          <disp-formula id="FD2-diagnostics-14-00997"><label>(2)</label><mml:math id="mm35" display="block"><mml:semantics><mml:mrow><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mrow><mml:mrow><mml:mi mathvariant="normal">log</mml:mi></mml:mrow><mml:mo>⁡</mml:mo><mml:mrow><mml:mfenced separators="|"><mml:mrow><mml:mfrac><mml:mrow><mml:msup><mml:mrow><mml:mi>d</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msup><mml:mrow><mml:mi>d</mml:mi><mml:mi>i</mml:mi><mml:mi>s</mml:mi><mml:mi>t</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msup><mml:mo>+</mml:mo><mml:mi>ε</mml:mi></mml:mrow></mml:mfrac></mml:mrow></mml:mfenced><mml:mo>,</mml:mo></mml:mrow></mml:mrow></mml:mrow></mml:semantics></mml:math></disp-formula>
          <disp-formula id="FD3-diagnostics-14-00997"><label>(3)</label><mml:math id="mm36" display="block"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>=</mml:mo><mml:mtable><mml:mtr><mml:mtd><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">x</mml:mi></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>∈</mml:mo><mml:mi mathvariant="normal">p</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">c</mml:mi><mml:mi mathvariant="normal">h</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mo> </mml:mo><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced></mml:mtd></mml:mtr></mml:mtable><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced><mml:mo>,</mml:mo></mml:mrow></mml:semantics></mml:math></disp-formula></p>
          <p>These similarity scores calculated by Equation (2) define an activation map, which retains the spatial relation of the convolutional output <inline-formula><mml:math id="mm37"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula>. The activation map can be unsampled to the size of the input image to visualize the part of the input image that looks most similar to the feature pattern [<xref ref-type="bibr" rid="B36-diagnostics-14-00997">36</xref>]. In <xref ref-type="fig" rid="diagnostics-14-00997-f003">Figure 3</xref>, the similarity score between the first feature patterns <inline-formula><mml:math id="mm38"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>, a an HGG necrotic tumor core, and the most activated patch of the input image of a an HGG is <inline-formula><mml:math id="mm39"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>. The similarity score between the fourth feature pattern <inline-formula><mml:math id="mm40"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mn>4</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>, an HGG enhancing tumor margin, and the most activated patch of the input image is <inline-formula><mml:math id="mm41"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mn>4</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>. The third feature pattern <inline-formula><mml:math id="mm42"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mn>9</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>, an HGG edematous area, activated mostly on the edematous tissue of the HGG sample image, with a similarity score of <inline-formula><mml:math id="mm43"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mn>9</mml:mn></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>H</mml:mi><mml:mi>G</mml:mi><mml:mi>G</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>. This shows that our model finds that the necrotic tumor core of the HGG sample image has a stronger presence than that of enhancing tumor margin in the input image.</p>
          <p>Equation (2) indicates that the similarity is monotonically decreasing with respect to the squared Euclidean distance, that is, the highest similarity score of the similarity correlation unit <inline-formula><mml:math id="mm44"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> comes when <inline-formula><mml:math id="mm45"><mml:semantics><mml:mrow><mml:mover accent="true"><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>o</mml:mi><mml:mi>u</mml:mi><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mo>~</mml:mo></mml:mover></mml:mrow></mml:semantics></mml:math></inline-formula> is the closest patch to <inline-formula><mml:math id="mm46"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>. In activation maps, warmer values indicate higher similarity between the learned feature patterns and the parts of the input image activated by the feature pattern, which is enclosed in the yellow rectangles on the superimposed source images. Then, the activation maps produced by similarity scores are max pooled to reduce to a single similarity score <inline-formula><mml:math id="mm47"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> for each feature pattern <inline-formula><mml:math id="mm48"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>. Hence, if the similarity score of the <inline-formula><mml:math id="mm49"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> similarity correlation unit <inline-formula><mml:math id="mm50"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> is high, it indicates that there is a patch in the input image that is very similar to the <inline-formula><mml:math id="mm51"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> feature pattern of class <inline-formula><mml:math id="mm52"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mo> </mml:mo><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> in the latent space, and that the activated patch contains a similar pattern to that represented in the <inline-formula><mml:math id="mm53"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mi>t</mml:mi><mml:mi>h</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> feature pattern.</p>
        </sec>
        <sec id="sec2dot3dot3-diagnostics-14-00997">
          <title>2.3.3. Similarity-Based Classifier</title>
          <p>Finally, in the classifier block, the top 10 ranking similarity scores are multiplied by the class-connection weight matrix <inline-formula><mml:math id="mm54"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> to produce the output logit to class <inline-formula><mml:math id="mm55"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula>. The matrix <inline-formula><mml:math id="mm56"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> represents the relationship between feature patterns and the logit of the class. Higher class-connection values refer to higher representability of the feature pattern to its class.
          <disp-formula id="FD4-diagnostics-14-00997"><label>(4)</label><mml:math id="mm57" display="block"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>S</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mrow><mml:msubsup><mml:mo stretchy="false">∑</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mn>10</mml:mn></mml:mrow></mml:msubsup><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mrow><mml:mo>·</mml:mo><mml:msubsup><mml:mrow><mml:mi>s</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup><mml:mo>,</mml:mo><mml:mi>j</mml:mi><mml:mo>∈</mml:mo><mml:mfenced open="{" close="}" separators="|"><mml:mrow><mml:mi mathvariant="normal">H</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mi mathvariant="normal">G</mml:mi></mml:mrow></mml:mfenced></mml:mrow></mml:semantics></mml:math></disp-formula></p>
        </sec>
      </sec>
      <sec id="sec2dot4-diagnostics-14-00997">
        <title>2.4. Model Training</title>
        <p>The training of the proposed model is divided into three stages: stochastic gradient descent (SGD) of layers before the classifier layer, projection and optimization of feature patterns, and optimization of class-connection weights.</p>
        <sec id="sec2dot4dot1-diagnostics-14-00997">
          <title>2.4.1. Stochastic Gradient Descent (SGD) of Layers before the Classifier Layer</title>
          <p>The architecture aims to learn meaningful and teak-relevant features that can be used to distinguish between HGG and LGG, where the most important patches for the classification task are clustered (in Euclidean distance) around similar feature patterns of the ‘correct’ class and separated from feature patterns from a different class [<xref ref-type="bibr" rid="B36-diagnostics-14-00997">36</xref>]. To learn these features, an iterative algorithm SGD is used to simultaneously optimize the parameters of the convolutional layers <inline-formula><mml:math id="mm58"><mml:semantics><mml:mrow><mml:mi>f</mml:mi></mml:mrow></mml:semantics></mml:math></inline-formula> (<inline-formula><mml:math id="mm59"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mi>f</mml:mi></mml:mrow><mml:mrow><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>n</mml:mi><mml:mi>v</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula>) in the feature extractor and the feature pattern <inline-formula><mml:math id="mm60"><mml:semantics><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi><mml:mo>=</mml:mo><mml:msubsup><mml:mrow><mml:mfenced open="{" close="}" separators="|"><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>m</mml:mi></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> in the multi-part attention module via back propagation. In this step, the weight matrix (class connection values) <inline-formula><mml:math id="mm61"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> of the last layer in the classifier block is frozen.</p>
          <p>Formally, let <inline-formula><mml:math id="mm62"><mml:semantics><mml:mrow><mml:mi>X</mml:mi><mml:mo>=</mml:mo><mml:mo>{</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mo>…</mml:mo><mml:mo>,</mml:mo><mml:mo> </mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub><mml:mo>}</mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula> be a set of training images, <inline-formula><mml:math id="mm63"><mml:semantics><mml:mrow><mml:mi>Y</mml:mi><mml:mo>=</mml:mo><mml:mo>{</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:mo>…</mml:mo><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub><mml:mo>}</mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula> be the set of the corresponding labels. The optimization problem to be solved here is to minimize the defined loss function that incorporates the cross-entropy loss (CELoss), cluster loss (ClstLoss), and separation loss (SepLoss):<disp-formula id="FD5-diagnostics-14-00997"><label>(5)</label><mml:math id="mm64" display="block"><mml:semantics><mml:mrow><mml:mi>L</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mfrac><mml:mrow><mml:msubsup><mml:mo stretchy="false">∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msubsup><mml:mrow><mml:mi mathvariant="normal">C</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">s</mml:mi></mml:mrow></mml:mrow><mml:mfenced separators="|"><mml:mrow><mml:mi>f</mml:mi><mml:mo>∘</mml:mo><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi><mml:mo>∘</mml:mo><mml:mi>f</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>+</mml:mo><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mi mathvariant="normal">l</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mo>+</mml:mo><mml:msub><mml:mrow><mml:mi>r</mml:mi></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mi mathvariant="normal">S</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">p</mml:mi><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">s</mml:mi></mml:mrow></mml:semantics></mml:math></disp-formula>
          where ClstLoss and SepLoss are
          <disp-formula id="FD6-diagnostics-14-00997"><label>(6)</label><mml:math id="mm65" display="block"><mml:semantics><mml:mrow><mml:mi mathvariant="normal">C</mml:mi><mml:mi mathvariant="normal">l</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mfrac><mml:mrow><mml:munderover><mml:mo stretchy="false">∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:munderover><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">n</mml:mi></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mi>i</mml:mi><mml:mo>:</mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup><mml:mo>∈</mml:mo><mml:msup><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:mtd></mml:mtr></mml:mtable><mml:mtable><mml:mtr><mml:mtd><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">n</mml:mi></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mo> </mml:mo><mml:mover accent="true"><mml:mrow><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>∈</mml:mo><mml:mi mathvariant="normal">p</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">c</mml:mi><mml:mi mathvariant="normal">h</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mo>(</mml:mo><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo><mml:mo>)</mml:mo></mml:mtd></mml:mtr></mml:mtable><mml:msubsup><mml:mrow><mml:mfenced open="‖" close="‖" separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>−</mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup></mml:mrow></mml:mrow></mml:mrow></mml:semantics></mml:math></disp-formula>
          <disp-formula id="FD7-diagnostics-14-00997"><label>(7)</label><mml:math id="mm66" display="block"><mml:semantics><mml:mrow><mml:mi mathvariant="normal">S</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">p</mml:mi><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mo>=</mml:mo><mml:mo>−</mml:mo><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mfrac><mml:mrow><mml:munderover><mml:mo stretchy="false">∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:munderover><mml:mrow><mml:mtable><mml:mtr><mml:mtd><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">n</mml:mi></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mi>i</mml:mi><mml:mo>:</mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup><mml:mo>∉</mml:mo><mml:msup><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup><mml:mo> </mml:mo></mml:mtd></mml:mtr></mml:mtable><mml:mtable><mml:mtr><mml:mtd><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">n</mml:mi></mml:mtd></mml:mtr><mml:mtr><mml:mtd><mml:mover accent="true"><mml:mrow><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>∈</mml:mo><mml:mi mathvariant="normal">p</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">c</mml:mi><mml:mi mathvariant="normal">h</mml:mi><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">s</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>f</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced></mml:mrow></mml:mfenced></mml:mtd></mml:mtr></mml:mtable><mml:msubsup><mml:mrow><mml:mfenced open="‖" close="‖" separators="|"><mml:mrow><mml:mover accent="true"><mml:mrow><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mo>~</mml:mo></mml:mover><mml:mo>−</mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msubsup></mml:mrow></mml:mrow><mml:mo>,</mml:mo></mml:mrow></mml:semantics></mml:math></disp-formula></p>
          <p>The CELoss penalizes misclassification during the training process, and the aim is to minimize CELoss to give better classifications. The ClstLoss is minimized to encourage the prototypical parts to cluster around the correct class, see Equation (6), whereas the SepLoss is minimized to separate the prototypical parts from the incorrect class; see Equation (7).</p>
        </sec>
        <sec id="sec2dot4dot2-diagnostics-14-00997">
          <title>2.4.2. Projection of Feature Patterns</title>
          <p>To visualize which parts of the training images from the push dataset are used as feature patterns, the network projects every feature pattern <inline-formula><mml:math id="mm67"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> onto the closest patch of the output <inline-formula><mml:math id="mm68"><mml:semantics><mml:mrow><mml:mi>f</mml:mi><mml:mo>(</mml:mo><mml:msup><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup><mml:mo>)</mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula> that has the smallest distance from <inline-formula><mml:math id="mm69"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula>, and the closest patch has the same class <inline-formula><mml:math id="mm70"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mo> </mml:mo><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></inline-formula> as that of <inline-formula><mml:math id="mm71"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> [<xref ref-type="bibr" rid="B32-diagnostics-14-00997">32</xref>]. The reason is that the patch of training image <inline-formula><mml:math id="mm72"><mml:semantics><mml:mrow><mml:msup><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:mrow></mml:semantics></mml:math></inline-formula> that corresponds to <inline-formula><mml:math id="mm73"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> should be the one that <inline-formula><mml:math id="mm74"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> activates most strongly on. We can visualize the part of <inline-formula><mml:math id="mm75"><mml:semantics><mml:mrow><mml:msup><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:mrow></mml:semantics></mml:math></inline-formula> on which <inline-formula><mml:math id="mm76"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> has the strongest activation by forwarding <inline-formula><mml:math id="mm77"><mml:semantics><mml:mrow><mml:msup><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:mrow></mml:semantics></mml:math></inline-formula> through a trained network. Mathematically, for feature pattern <inline-formula><mml:math id="mm78"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> of class <inline-formula><mml:math id="mm79"><mml:semantics><mml:mrow><mml:msub><mml:mrow><mml:mo> </mml:mo><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo> </mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula>(<inline-formula><mml:math id="mm80"><mml:semantics><mml:mrow><mml:mi>j</mml:mi><mml:mo>∈</mml:mo><mml:mo>{</mml:mo><mml:mi mathvariant="normal">H</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="normal">L</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mi mathvariant="normal">G</mml:mi><mml:mo>}</mml:mo></mml:mrow></mml:semantics></mml:math></inline-formula>), the network performs the following update:<disp-formula id="FD8-diagnostics-14-00997"><label>(8)</label><mml:math id="mm81" display="block"><mml:semantics><mml:mrow><mml:mi>f</mml:mi><mml:msubsup><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup><mml:mo>=</mml:mo><mml:munder><mml:mrow><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">g</mml:mi><mml:mi mathvariant="normal">m</mml:mi><mml:mi mathvariant="normal">i</mml:mi><mml:mi mathvariant="normal">n</mml:mi></mml:mrow><mml:mrow><mml:mi mathvariant="italic">patch</mml:mi><mml:mo>,</mml:mo><mml:mi mathvariant="italic">patch</mml:mi><mml:mo>∈</mml:mo><mml:mi mathvariant="italic">patches</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>f</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:msup><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:mrow></mml:mfenced></mml:mrow></mml:mfenced></mml:mrow></mml:munder><mml:mo>∥</mml:mo><mml:mi mathvariant="italic">patch</mml:mi><mml:mo>−</mml:mo><mml:mi>f</mml:mi><mml:msubsup><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup><mml:msub><mml:mrow><mml:mo>∥</mml:mo></mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:semantics></mml:math></disp-formula></p>
        </sec>
        <sec id="sec2dot4dot3-diagnostics-14-00997">
          <title>2.4.3. Optimization of Class-Connection Weights</title>
          <p>In this stage, all the parameters from the convolutional layers and multi-part attention blocks are frozen, and a convex optimization on the class-connection weight matrix <inline-formula><mml:math id="mm82"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> of the last layer is performed. To rely only on positive connections between feature patterns and logits, the negative connection <inline-formula><mml:math id="mm83"><mml:semantics><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:semantics></mml:math></inline-formula> is set to 0 for all to reduce the reliance of the model on a negative reasoning process of the form “this image is of class HGG because it is not of class LGG.”. Mathematically, we perform this step to optimize
          <disp-formula id="FD9-diagnostics-14-00997"><label>(9)</label><mml:math id="mm84" display="block"><mml:semantics><mml:mrow><mml:mrow><mml:mrow><mml:munder><mml:mrow><mml:mi mathvariant="normal">min</mml:mi></mml:mrow><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup></mml:mrow></mml:munder></mml:mrow><mml:mo>⁡</mml:mo><mml:mrow><mml:mfrac><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mfrac><mml:mrow><mml:munderover><mml:mo stretchy="false">∑</mml:mo><mml:mrow><mml:mi>k</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:munderover><mml:mrow><mml:mi>C</mml:mi><mml:mi>E</mml:mi><mml:mi>L</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:mi>s</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:mi>f</mml:mi><mml:mo>∘</mml:mo><mml:mi>S</mml:mi><mml:mi>C</mml:mi><mml:mi>U</mml:mi><mml:mo>∘</mml:mo><mml:mi>f</mml:mi><mml:mfenced separators="|"><mml:mrow><mml:msub><mml:mrow><mml:mi>x</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:mfenced><mml:mo>+</mml:mo><mml:mi>λ</mml:mi><mml:mrow><mml:munder><mml:mo stretchy="false">∑</mml:mo><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>:</mml:mo><mml:msubsup><mml:mrow><mml:mi>f</mml:mi><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msubsup><mml:mo>∉</mml:mo><mml:msup><mml:mrow><mml:mi>F</mml:mi><mml:mi>P</mml:mi></mml:mrow><mml:mrow><mml:msub><mml:mrow><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mi>k</mml:mi></mml:mrow></mml:msub></mml:mrow></mml:msup></mml:mrow></mml:munder><mml:mrow><mml:mfenced open="|" close="|" separators="|"><mml:mrow><mml:msubsup><mml:mrow><mml:mi>ω</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi>k</mml:mi><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>c</mml:mi></mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow></mml:msubsup></mml:mrow></mml:mfenced></mml:mrow></mml:mrow></mml:mrow></mml:mrow></mml:mrow></mml:mrow><mml:mo>,</mml:mo></mml:mrow></mml:semantics></mml:math></disp-formula></p>
        </sec>
      </sec>
      <sec id="sec2dot5-diagnostics-14-00997">
        <title>2.5. Experimental Setup</title>
        <p>All the experiments were conducted on a PC with an Intel Core i7-6700K 4.00 GHz processor running Ubuntu 18.04.6 with one NVIDIA GeForce RTX 2060, using Python 3.9.7 and PyTorch 1.10.1.</p>
        <p>The parameters of the convolutional layers from the VGG16 model were pre-trained on ImageNet [<xref ref-type="bibr" rid="B37-diagnostics-14-00997">37</xref>], and the parameters of the additional convolutional layers were initialized with Kaiming uniform methods [<xref ref-type="bibr" rid="B38-diagnostics-14-00997">38</xref>]. The parameters of the two additional convolutional layers are trained and optimized with the learning rate <inline-formula><mml:math id="mm85"><mml:semantics><mml:mrow><mml:mn>3</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mrow><mml:mn>10</mml:mn></mml:mrow><mml:mrow><mml:mo>−</mml:mo><mml:mn>3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:semantics></mml:math></inline-formula> for 5 epochs, while the pre-trained parameters and biases are fixed. In the following joint training stage, the parameters of all convolutional layers are optimized from epoch 6, and the model performs feature pattern projection every 20 epochs, that is, epochs 20, 40, 60, 80, and 100, and the convex optimization of the last layer is performed after each feature pattern projection process for 20 iterations with learning rate <inline-formula><mml:math id="mm86"><mml:semantics><mml:mrow><mml:msup><mml:mrow><mml:mn>10</mml:mn></mml:mrow><mml:mrow><mml:mo>−</mml:mo><mml:mn>4</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:semantics></mml:math></inline-formula>.</p>
        <p>The other hyperparameters are learning rate for layers pre-trained on ImageNet: <inline-formula><mml:math id="mm87"><mml:semantics><mml:mrow><mml:msup><mml:mrow><mml:mn>10</mml:mn></mml:mrow><mml:mrow><mml:mo>−</mml:mo><mml:mn>4</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:semantics></mml:math></inline-formula> and learning rate for feature pattern optimization: <inline-formula><mml:math id="mm88"><mml:semantics><mml:mrow><mml:mn>3</mml:mn><mml:mo>×</mml:mo><mml:msup><mml:mrow><mml:mn>10</mml:mn></mml:mrow><mml:mrow><mml:mo>−</mml:mo><mml:mn>3</mml:mn></mml:mrow></mml:msup></mml:mrow></mml:semantics></mml:math></inline-formula>. For VGG16, we set <inline-formula><mml:math id="mm89"><mml:semantics><mml:mrow><mml:mi>D</mml:mi><mml:mo>=</mml:mo><mml:mn>128</mml:mn></mml:mrow></mml:semantics></mml:math></inline-formula> as the number of channels in a similarity correlation unit.</p>
      </sec>
    </sec>
    <sec id="sec3-diagnostics-14-00997" sec-type="results">
      <title>3. Results</title>
      <sec id="sec3dot1-diagnostics-14-00997">
        <title>3.1. Global Explanation</title>
        <p>Global explanation can be interpreted as the class-representative features the entire model uses to distinguish two classes. <xref ref-type="fig" rid="diagnostics-14-00997-f004">Figure 4</xref> shows six learned feature patterns and their activation maps for each class. It can be seen that all feature patterns localize important distinguishing features of both classes. The feature patterns of HGG that have higher responses in contrast-enhancing tumors as a classification feature agrees with the actual imaging characteristics of HGG [<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>]; the feature patterns that focus on the necrotic tumor core that present heterogeneous high signal and the edematous areas are also important disease-representative features of HGG [<xref ref-type="bibr" rid="B6-diagnostics-14-00997">6</xref>]; the feature patterns of LGG present higher responses on the homogeneous tumor cores and the non-enhancing tumor margins [<xref ref-type="bibr" rid="B7-diagnostics-14-00997">7</xref>,<xref ref-type="bibr" rid="B8-diagnostics-14-00997">8</xref>,<xref ref-type="bibr" rid="B9-diagnostics-14-00997">9</xref>]. It is worth mentioning that those localized medical features can be understood and interpreted by the users, and thus, our framework can help provide global explanations in a human-understandable manner.</p>
      </sec>
      <sec id="sec3dot2-diagnostics-14-00997">
        <title>3.2. Local Explanation: Individual Predictions</title>
        <p>The local explanation of individual predictions has to satisfy two conditions in order for its prediction explanations to be considered trustworthy and reliable; that is, all feature patterns that present the 10 highest similarity scores are from the class of the test image, and the concept of each top-10 feature pattern is consistent with that of the activated prototypical patch.</p>
        <p><xref ref-type="fig" rid="diagnostics-14-00997-f005">Figure 5</xref> shows the reasoning process of our interpretable model in reaching a prediction on a test image of an HGG. As shown in the activation maps, the highest responses were found on the tumor core activated by the top and 2nd ranked feature patterns of class HGG (with similarity scores 8.143 and 8.105, respectively), the 3rd ranked feature pattern on the tumor enhancing margins, the 6th, 8th, and 9th ranked feature patterns on the edematous tissues.</p>
        <p>The network correctly classifies the tumor as an HGG according to the ground truth. Furthermore, it provides the evidence of this prediction outcome with multi-part attention between patches of the test image and feature patterns as the tumor is classified as an HGG because prototypical patches of the test image, including its necrotic tumor core, enhancing margins, and edematous tissue was found to have higher similarity (top 10) with feature patterns from HGG class. The evidence is evaluated to be trustworthy according to the two reliability criteria, that is, all top-10 feature patterns are from the HGG class, and the concept of each top-10 feature pattern is consistent with that of the localized prototypical patch.</p>
        <p><xref ref-type="fig" rid="diagnostics-14-00997-f006">Figure 6</xref> shows the reasoning process for reaching a classification decision on a test image of an LGG. As shown in the third column, the highest responses were found on the tumor core of the LGG image activated by two ‘tumor core’ feature patterns (similarity score of 7.420 and 7.332, respectively), the 3rd and 4th ranked feature patterns on the tumor margins. The network correctly classifies the tumor as an LGG. The explanation is the network classifies the tumor as an LGG because prototypical patches of the test image, including its homogeneous tumor core and non-enhancing tumor margins, were found to have higher similarity (top 10) with feature patterns from the LGG class. Those medical feature patterns can be understood and interpreted by the users, and thus, our framework can help provide global explanations in a human-understandable manner. The evidence for the prediction is evaluated to be trustworthy according to the two reliability criteria.</p>
      </sec>
    </sec>
    <sec id="sec4-diagnostics-14-00997">
      <title>4. Performance Evaluation</title>
      <sec id="sec4dot1-diagnostics-14-00997">
        <title>4.1. Classification Performance</title>
        <p>Statistic metrics for classification performance, including accuracy (ACC), precision (PRE), specificity (SPE), sensitivity (SEN), and F<sub>1</sub>-score, were calculated both for the interpretable decision-aid system described in this work and the baseline model, whose architecture consisted of the same convolutional layers without the intermediate multi-part attention module and similarity-based classifier. Correct predictions were further evaluated on their reliability based on local explanations to obtain reliable prediction accuracy to assess the trustworthiness of the model.</p>
        <p><xref ref-type="table" rid="diagnostics-14-00997-t001">Table 1</xref> presents the comparison of the classification performance of our interpretable model (before and after the exclusion of ‘background’ feature patterns) with the baseline model trained on the same dataset. Results show that the interpretable model is slightly less accurate than the baseline model and that the exclusion of the ‘background’ feature patterns improved the classification accuracy by 6.53%.</p>
      </sec>
      <sec id="sec4dot2-diagnostics-14-00997">
        <title>4.2. Explanation Performance</title>
        <sec id="sec4dot2dot1-diagnostics-14-00997">
          <title>4.2.1. Global Explanation Evaluation</title>
          <p>Once trained, the system provides global explanations in the form of a set of feature patterns that identify image features characteristic of the classes to be predicted. Each of the feature patterns learned by the system was evaluated on whether it corresponds to a feature of the class (HGG or LGG) that it is supposed to represent and whether the area with the highest response (red) is located within the tumor or tissue altered by the presence of the tumor. A feature pattern is considered invalid if its most activated area is situated in the background regions, namely healthy tissue, ventricles, non-brain tissue, or image background.</p>
          <p>Within all feature patterns, two apparent duplicates were found of the LGG class. Thirteen invalid ‘background’ feature patterns (6 HGG and 7 LGG) were found to have higher responses in regions irrelevant to the classification task (e.g., low-signal ventricles and high-intensity background areas). The accuracy of global explanation, defined as the fraction of learned feature patterns that focus on task-relevant regions, was 86%. The initial assessment process was conducted by one author (Y.T.X). In cases of ambiguity, feature patterns were reviewed by other authors (F.Z, L.R), and the final evaluation was arrived at by consensus. Considering the impact of invalid feature patterns on local explanation, those ‘background’ feature patterns were excluded in the further local analysis process.</p>
          <p><xref ref-type="fig" rid="diagnostics-14-00997-f007">Figure 7</xref> evaluates the representability of two feature patterns that have the largest class connection weight of each class. The similarity score between the feature pattern (class connection of 0.737 to HGG) and the prototypical patch from the tumor core of the first HGG sample image ranks #2 with a similarity of 8.020 (max. 8.782) and #4 with a similarity of 7.653 (max. 8.379) with the prototypical patch from the tumor core of the second sample image, showing its high representativity of class HGG. The feature pattern of LGG with the highest class-connection value (1.311) also shows high representativity of class LGG; the similarity scores with the localized patches rank first among 10 feature patterns for two LGG sample images.</p>
        </sec>
        <sec id="sec4dot2dot2-diagnostics-14-00997">
          <title>4.2.2. Local Explanation Evaluation</title>
          <p>The reliability of an individual prediction was evaluated based on whether its local explanation satisfies two basic reliability conditions, namely that the reasoning process should be both confident and correct.</p>
          <p><italic>Confidence in the reasoning process</italic>. Confidence in the reasoning process can be evaluated by examining the output of the local explanation. For each case in the test set, the number of feature patterns corresponding to a correctly or incorrectly identified tumor type was counted among those with the 10 highest similarity scores. The results were averaged and summarized in <xref ref-type="table" rid="diagnostics-14-00997-t002">Table 2</xref>. Results demonstrate that the inconsistency of the feature patterns with the class of test images has a high impact on the classification performance of the model (comparison between wrong predictions and correct predictions, mean 8.62, 0.34, respectively) and a small impact on the reliability of the predictions (comparison between correct predictions and unreliable predictions).</p>
          <p><italic>Correctness of the reasoning process.</italic> A correct reasoning process is defined as one in which the concept of the activated prototypical patch is consistent with that of the feature pattern. <xref ref-type="table" rid="diagnostics-14-00997-t003">Table 3</xref> summarizes the number of incorrectly activated background patches by top 10 feature patterns among all test images, unreliable predictions, wrong predictions, and correct predictions.</p>
          <p>Wilcoxon Signed-Ranks tests were used to assess the effect of incorrectly activated background patches on the number of mismatched feature patterns among the top 10 ranked, an indicator of prediction reliability, comparing image background areas and brain background (i.e., healthy tissue or CSF), for each classification class both separately and jointly.</p>
          <p>Considering all test images, image background showed a significantly lower influence (<italic>p</italic>-value &lt; 0.05) on reliability compared to brain background (W = 1244.5, <italic>p</italic>-value &lt; 0.001), and the same pattern was repeated considering only the HGG test images (W = 411.0, <italic>p</italic>-value = 0.002) or the LGG test images (W = 214.0, <italic>p</italic>-value = 0.005). Dividing the test images based on correct predictions (reliable predictions and unreliable predictions, HGG: W = 171.5, <italic>p</italic>-value = 0.011; LGG: W = 114.5, <italic>p</italic>-value = 0.003), wrong predictions (HGG: W = 53.5, <italic>p</italic>-value = 0.095 (<italic>p</italic> &gt; 0.05), LGG: W = 17.5, <italic>p</italic>-value = 0.943 (<italic>p</italic> &gt; 0.05)) and unreliable predictions (same values as correct predictions), only in the second group did these two sources of error show no difference in their effect.</p>
          <p><xref ref-type="table" rid="diagnostics-14-00997-t002">Table 2</xref> and <xref ref-type="table" rid="diagnostics-14-00997-t003">Table 3</xref> indicate the necessity and importance of unboxing the inference process of CNN models for brain tumor classification. This allows health workers to screen out unreliable ‘correct’ predictions that might have been learned from irrelevant regions for decision making.</p>
        </sec>
      </sec>
    </sec>
    <sec id="sec5-diagnostics-14-00997" sec-type="discussion">
      <title>5. Discussion</title>
      <p>This work proposed an interpretable multi-part attention network for brain tumor classification. In detail, the widely used VGG16 was built with a specific interpretable architecture to ensure good enough classification performance for the BRATS 2017 dataset. The model was evaluated in terms of both classification and explainability perspectives. Results demonstrated the model produced accurate tumor classification, and the classification accuracy is on par with some of the best-performing CNN models. Furthermore, the proposed framework is able to provide higher quality explanations for HGG and LGG classification, including global explanation and local explanation.</p>
      <p>In detail, global explanation is interpreted as a set of feature patterns the model learns from to classify HGG and LGG. The quality of the feature patterns in terms of their validity and representativity was evaluated by radiologists to see if they were valid evidence for decision aids. Results demonstrated the model learns from the class-representative features of both classes for the classification task, and the HGG feature patterns have higher responses in the contrast-enhancing tumor, necrotic tumor core, and the edematous areas as classification evidence; this agrees with the actual imaging characteristics of HGG. The LGG feature patterns present higher responses on the homogeneous tumor cores and the non-enhancing tumor margins.</p>
      <p>Another important advantage of the proposed model is the local explanation it presents for individual predictions. Background areas, such as the ventricles, were found to be activated by the ‘tumor core’ feature patterns of the LGG class. These background patches are not faithful features to the underlying lesion. Therefore, unboxing the reasoning process is necessary; it allows the clinicians and patients to screen out ‘unreliable’ correct predictions.</p>
      <p>The local explanation of individual explanations was also evaluated by radiologists to see if it is reliable and acceptable for decision-making support. This form of reliability evaluation and model tuning is not available in the development of “black box” networks or the interpretable models mentioned above. According to the findings, the developed solution provided positive outcomes regarding the brain tumor classification and explanation targeted in this study.</p>
      <p>Considering the limitations of the present study, these can be divided into methodological limitations in the construction of the network and limitations in the contextualization of the results.</p>
      <p>It is reasonable to suppose that network construction limitations contribute to the lower classification accuracy of the proposed interpretable model compared with the baseline model. This discrepancy could be attributed to the model’s classification inference process, which is greatly influenced by the feature patterns obtained from the randomly generated push dataset. In future work, optimizing the selection of the push dataset may help to improve the classification accuracy of the model. It is also possible that the training data augmentation process could be optimized, as some recent evidence suggests that, even though we used very widely used augmentation methods, the inclusion of image orientations not found in the testing set does not improve the generalizing ability of the model [<xref ref-type="bibr" rid="B39-diagnostics-14-00997">39</xref>].</p>
      <p>Regarding interpretation of the results, we did not find other interpretable deep learning methods applied to brain tumor classification based on the same dataset, and we cannot confirm the degree to which the 86% reliability obtained by the model would be considered acceptable by the health workers. Further collaboration with medical practitioners is important for the practical assessment of our model. Considering possible future developments or our work, several possible extensions are clear. The data modalities could be extended to incorporate a greater variety of structural images, such as T1w, T2w, and FLAIR, as well as more targeted sequences, including amide proton transfer [<xref ref-type="bibr" rid="B40-diagnostics-14-00997">40</xref>] and MR spectroscopy [<xref ref-type="bibr" rid="B41-diagnostics-14-00997">41</xref>]. It is also important to consider whether findings in the BraTS2017 dataset carry over into other datasets. For example, many clinical scanners continue to use lower field strengths. Publicly available data sets such as MNIBITE [<xref ref-type="bibr" rid="B42-diagnostics-14-00997">42</xref>] and the recent ReMIND [<xref ref-type="bibr" rid="B43-diagnostics-14-00997">43</xref>] could be leveraged to test IMPA-Net with 1.5-T data.</p>
    </sec>
    <sec id="sec6-diagnostics-14-00997" sec-type="conclusions">
      <title>6. Conclusions</title>
      <p>An interpretable classification model based on CNN was developed for brain tumor classification to enhance the interpretability and trustworthiness of the model and the health outcomes. The proposed model visualizes the features the model learns and uses for the classification task. It unboxes the reasoning process of individual predictions and explains the outcomes in a human-understandable manner, allowing clinicians and patients to understand and evaluate the reliability of predictions.</p>
      <p>In future investigations, alternative datasets encompassing a greater variety of sequences and settings, will be included to improve the classification performance and the generality of the work. Further discussions on the quality of decision aids are also necessary to determine whether they improved decision making and outcomes for patients facing treatment or screening decisions and to explore the applicability of IMPA-Net in other medical imaging tasks.</p>
    </sec>
  </body>
  <back>
    <notes>
      <title>Author Contributions</title>
      <p>Conceptualization, C.T. (Claudia Testa), D.N.M., R.Z., F.Z., L.R. and Y.X.; methodology, R.Z. and Y.X.; hardware and software, R.Z. and Y.X.; formal analysis, C.T. (Caterina Tonon), C.T. (Claudia Testa), D.N.M., F.Z. and L.R.; investigation, C.T. (Claudia Testa), D.N.M., F.Z. and L.R.; resources, C.T. (Caterina Tonon), R.Z. and R.L.; data curation, D.N.M. and Y.X.; writing—original draft preparation, Y.X.; writing—review and editing, C.T. (Caterina Tonon), C.T. (Claudia Testa), D.N.M., F.Z., L.R. and R.Z.; supervision, C.T. (Caterina Tonon), C.T. (Claudia Testa) and D.N.M.; funding acquisition, C.T. (Caterina Tonon), R.L. and D.N.M. All authors have read and agreed to the published version of the manuscript.</p>
    </notes>
    <notes>
      <title>Institutional Review Board Statement</title>
      <p>Not applicable.</p>
    </notes>
    <notes>
      <title>Informed Consent Statement</title>
      <p>Not applicable.</p>
    </notes>
    <notes>
      <title>Data Availability Statement</title>
      <p>The first author takes full responsibility for the analyses, interpretation, and conduct of the research. The underlying codes are available from the first author upon reasonable request. The data are publicly available at <uri>https://www.med.upenn.edu/sbia/brats2017/data.html</uri> (accessed on 10 May 2024).</p>
    </notes>
    <notes notes-type="COI-statement">
      <title>Conflicts of Interest</title>
      <p>The authors declare no conflicts of interest.</p>
    </notes>
    <ref-list>
      <title>References</title>
      <ref id="B1-diagnostics-14-00997">
        <label>1.</label>
        <element-citation publication-type="web">
          <person-group person-group-type="author">
            <collab>Cancer Research UK</collab>
          </person-group>
          <article-title>Brain, Other CNS and Intracranial Tumours Statistics</article-title>
          <comment>Available online: <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="https://www.cancerresearchuk.org/health-professional/cancer-statistics/statistics-by-cancer-type/brain-other-cns-and-intracranial-tumours/incidence%23collapseTen#heading-One" ext-link-type="uri">https://www.cancerresearchuk.org/health-professional/cancer-statistics/statistics-by-cancer-type/brain-other-cns-and-intracranial-tumours/incidence%23collapseTen#heading-One</ext-link></comment>
          <date-in-citation content-type="access-date" iso-8601-date="2023-12-06">(accessed on 6 December 2023)</date-in-citation>
        </element-citation>
      </ref>
      <ref id="B2-diagnostics-14-00997">
        <label>2.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Louis</surname>
              <given-names>D.N.</given-names>
            </name>
            <name>
              <surname>Perry</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Wesseling</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Brat</surname>
              <given-names>D.J.</given-names>
            </name>
            <name>
              <surname>Cree</surname>
              <given-names>I.A.</given-names>
            </name>
            <name>
              <surname>Figarella-Branger</surname>
              <given-names>D.</given-names>
            </name>
            <name>
              <surname>Hawkins</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Ng</surname>
              <given-names>H.K.</given-names>
            </name>
            <name>
              <surname>Pfister</surname>
              <given-names>S.M.</given-names>
            </name>
            <name>
              <surname>Reifenberger</surname>
              <given-names>G.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>The 2021 WHO Classification of Tumors of the Central Nervous System: A Summary</article-title>
          <source>Neuro. Oncol.</source>
          <year>2021</year>
          <volume>23</volume>
          <fpage>1231</fpage>
          <lpage>1251</lpage>
          <pub-id pub-id-type="doi">10.1093/neuonc/noab106</pub-id>
          <pub-id pub-id-type="pmid">34185076</pub-id>
        </element-citation>
      </ref>
      <ref id="B3-diagnostics-14-00997">
        <label>3.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Norden</surname>
              <given-names>A.D.</given-names>
            </name>
            <name>
              <surname>Drappatz</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Wen</surname>
              <given-names>P.Y.</given-names>
            </name>
          </person-group>
          <article-title>Malignant Gliomas in Adults</article-title>
          <source>Blue Books Neurol.</source>
          <year>2010</year>
          <volume>36</volume>
          <fpage>99</fpage>
          <lpage>120</lpage>
          <pub-id pub-id-type="doi">10.1016/B978-0-7506-7516-1.00005-0</pub-id>
        </element-citation>
      </ref>
      <ref id="B4-diagnostics-14-00997">
        <label>4.</label>
        <element-citation publication-type="book">
          <person-group person-group-type="author">
            <name>
              <surname>Wirsching</surname>
              <given-names>H.G.</given-names>
            </name>
            <name>
              <surname>Weller</surname>
              <given-names>M.</given-names>
            </name>
          </person-group>
          <article-title>Glioblastoma</article-title>
          <source>Malignant Brain Tumors: State-of-the-Art Treatment</source>
          <publisher-name>Springer International Publishing</publisher-name>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <year>2016</year>
          <fpage>265</fpage>
          <lpage>288</lpage>
          <isbn>3319498649</isbn>
        </element-citation>
      </ref>
      <ref id="B5-diagnostics-14-00997">
        <label>5.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Fink</surname>
              <given-names>J.R.</given-names>
            </name>
            <name>
              <surname>Muzi</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Peck</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Krohn</surname>
              <given-names>K.A.</given-names>
            </name>
          </person-group>
          <article-title>Multimodality Brain Tumor Imaging: MR Imaging, PET, and PET/MR Imaging</article-title>
          <source>J. Nucl. Med.</source>
          <year>2015</year>
          <volume>56</volume>
          <fpage>1554</fpage>
          <lpage>1561</lpage>
          <pub-id pub-id-type="doi">10.2967/jnumed.113.131516</pub-id>
          <pub-id pub-id-type="pmid">26294301</pub-id>
        </element-citation>
      </ref>
      <ref id="B6-diagnostics-14-00997">
        <label>6.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Villanueva-Meyer</surname>
              <given-names>J.E.</given-names>
            </name>
            <name>
              <surname>Mabray</surname>
              <given-names>M.C.</given-names>
            </name>
            <name>
              <surname>Cha</surname>
              <given-names>S.</given-names>
            </name>
          </person-group>
          <article-title>Current Clinical Brain Tumor Imaging</article-title>
          <source>Clin. Neurosurg.</source>
          <year>2017</year>
          <volume>81</volume>
          <fpage>397</fpage>
          <lpage>415</lpage>
          <pub-id pub-id-type="doi">10.1093/neuros/nyx103</pub-id>
          <pub-id pub-id-type="pmid">28486641</pub-id>
        </element-citation>
      </ref>
      <ref id="B7-diagnostics-14-00997">
        <label>7.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Grier</surname>
              <given-names>J.T.</given-names>
            </name>
            <name>
              <surname>Batchelor</surname>
              <given-names>T.</given-names>
            </name>
          </person-group>
          <article-title>Low-Grade Gliomas in Adults</article-title>
          <source>Oncologist</source>
          <year>2006</year>
          <volume>6</volume>
          <fpage>681</fpage>
          <lpage>693</lpage>
          <pub-id pub-id-type="doi">10.1634/theoncologist.11-6-681</pub-id>
          <pub-id pub-id-type="pmid">16794247</pub-id>
        </element-citation>
      </ref>
      <ref id="B8-diagnostics-14-00997">
        <label>8.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ganz</surname>
              <given-names>J.C.</given-names>
            </name>
          </person-group>
          <article-title>Low Grade Gliomas</article-title>
          <source>Prog. Brain Res.</source>
          <year>2022</year>
          <volume>268</volume>
          <fpage>271</fpage>
          <lpage>277</lpage>
          <pub-id pub-id-type="doi">10.1016/bs.pbr.2021.10.036</pub-id>
          <pub-id pub-id-type="pmid">35074085</pub-id>
        </element-citation>
      </ref>
      <ref id="B9-diagnostics-14-00997">
        <label>9.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Forst</surname>
              <given-names>D.A.</given-names>
            </name>
            <name>
              <surname>Nahed</surname>
              <given-names>B.V.</given-names>
            </name>
            <name>
              <surname>Loeffler</surname>
              <given-names>J.S.</given-names>
            </name>
            <name>
              <surname>Batchelor</surname>
              <given-names>T.T.</given-names>
            </name>
          </person-group>
          <article-title>Low-Grade Gliomas</article-title>
          <source>Oncologist</source>
          <year>2014</year>
          <volume>19</volume>
          <fpage>403</fpage>
          <lpage>413</lpage>
          <pub-id pub-id-type="doi">10.1634/theoncologist.2013-0345</pub-id>
        </element-citation>
      </ref>
      <ref id="B10-diagnostics-14-00997">
        <label>10.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Shen</surname>
              <given-names>D.</given-names>
            </name>
            <name>
              <surname>Wu</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Suk</surname>
              <given-names>H.-I.</given-names>
            </name>
          </person-group>
          <article-title>Deep Learning in Medical Image Analysis</article-title>
          <source>J. Imaging</source>
          <year>2021</year>
          <volume>7</volume>
          <elocation-id>74</elocation-id>
          <pub-id pub-id-type="doi">10.3390/jimaging7040074</pub-id>
          <pub-id pub-id-type="pmid">34460524</pub-id>
        </element-citation>
      </ref>
      <ref id="B11-diagnostics-14-00997">
        <label>11.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Yasaka</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Akai</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Kunimatsu</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Kiryu</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Abe</surname>
              <given-names>O.</given-names>
            </name>
          </person-group>
          <article-title>Deep Learning with Convolutional Neural Network in Radiology</article-title>
          <source>Jpn. J. Radiol.</source>
          <year>2018</year>
          <volume>36</volume>
          <fpage>257</fpage>
          <lpage>272</lpage>
          <pub-id pub-id-type="doi">10.1007/s11604-018-0726-3</pub-id>
        </element-citation>
      </ref>
      <ref id="B12-diagnostics-14-00997">
        <label>12.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Xie</surname>
              <given-names>Y.</given-names>
            </name>
            <name>
              <surname>Zaccagna</surname>
              <given-names>F.</given-names>
            </name>
            <name>
              <surname>Rundo</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Testa</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Agati</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Lodi</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Manners</surname>
              <given-names>D.N.</given-names>
            </name>
            <name>
              <surname>Tonon</surname>
              <given-names>C.</given-names>
            </name>
          </person-group>
          <article-title>Convolutional Neural Network Techniques for Brain Tumor Classification (from 2015 to 2022): Review, Challenges, and Future Perspectives</article-title>
          <source>Diagnostics</source>
          <year>2022</year>
          <volume>12</volume>
          <elocation-id>1850</elocation-id>
          <pub-id pub-id-type="doi">10.3390/diagnostics12081850</pub-id>
        </element-citation>
      </ref>
      <ref id="B13-diagnostics-14-00997">
        <label>13.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Nazir</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Shakil</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Khurshid</surname>
              <given-names>K.</given-names>
            </name>
          </person-group>
          <article-title>Role of Deep Learning in Brain Tumor Detection and Classification (2015 to 2020): A Review</article-title>
          <source>Comput. Med. Imaging Graph.</source>
          <year>2021</year>
          <volume>91</volume>
          <fpage>101940</fpage>
          <pub-id pub-id-type="doi">10.1016/j.compmedimag.2021.101940</pub-id>
          <pub-id pub-id-type="pmid">34293621</pub-id>
        </element-citation>
      </ref>
      <ref id="B14-diagnostics-14-00997">
        <label>14.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Khazaee</surname>
              <given-names>Z.</given-names>
            </name>
            <name>
              <surname>Langarizadeh</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Ahmadabadi</surname>
              <given-names>M.E.S.</given-names>
            </name>
          </person-group>
          <article-title>Developing an Artificial Intelligence Model for Tumor Grading and Classification, Based on MRI Sequences of Human Brain Gliomas</article-title>
          <source>Int. J. Cancer Manag.</source>
          <year>2022</year>
          <volume>15</volume>
          <fpage>e120638</fpage>
          <pub-id pub-id-type="doi">10.5812/ijcm.120638</pub-id>
        </element-citation>
      </ref>
      <ref id="B15-diagnostics-14-00997">
        <label>15.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chikhalikar</surname>
              <given-names>A.M.</given-names>
            </name>
            <name>
              <surname>Dharwadkar</surname>
              <given-names>N.V.</given-names>
            </name>
          </person-group>
          <article-title>Model for Enhancement and Segmentation of Magnetic Resonance Images for Brain Tumor Classification</article-title>
          <source>Pattern Recognit. Image Anal.</source>
          <year>2021</year>
          <volume>31</volume>
          <fpage>49</fpage>
          <lpage>59</lpage>
          <pub-id pub-id-type="doi">10.1134/S1054661821010065</pub-id>
        </element-citation>
      </ref>
      <ref id="B16-diagnostics-14-00997">
        <label>16.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>El Hamdaoui</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Benfares</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Boujraf</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>El Houda Chaoui</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Alami</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Maaroufi</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Qjidaa</surname>
              <given-names>H.</given-names>
            </name>
          </person-group>
          <article-title>High Precision Brain Tumor Classification Model Based on Deep Transfer Learning and Stacking Concepts</article-title>
          <source>Indones. J. Electr. Eng. Comput. Sci.</source>
          <year>2021</year>
          <volume>24</volume>
          <fpage>167</fpage>
          <lpage>177</lpage>
          <pub-id pub-id-type="doi">10.11591/ijeecs.v24.i1.pp167-177</pub-id>
        </element-citation>
      </ref>
      <ref id="B17-diagnostics-14-00997">
        <label>17.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhuge</surname>
              <given-names>Y.</given-names>
            </name>
            <name>
              <surname>Ning</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Mathen</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Cheng</surname>
              <given-names>J.Y.</given-names>
            </name>
            <name>
              <surname>Krauze</surname>
              <given-names>A.V.</given-names>
            </name>
            <name>
              <surname>Camphausen</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Miller</surname>
              <given-names>R.W.</given-names>
            </name>
          </person-group>
          <article-title>Automated Glioma Grading on Conventional MRI Images Using Deep Convolutional Neural Networks</article-title>
          <source>Med. Phys.</source>
          <year>2020</year>
          <volume>47</volume>
          <fpage>3044</fpage>
          <lpage>3053</lpage>
          <pub-id pub-id-type="doi">10.1002/mp.14168</pub-id>
        </element-citation>
      </ref>
      <ref id="B18-diagnostics-14-00997">
        <label>18.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Kaufman</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Kramer</surname>
              <given-names>D.M.</given-names>
            </name>
            <name>
              <surname>Crooks</surname>
              <given-names>L.E.</given-names>
            </name>
            <name>
              <surname>Ortendahl</surname>
              <given-names>D.A.</given-names>
            </name>
          </person-group>
          <article-title>Measuring Signal-to-Noise Ratios in MR Imaging</article-title>
          <source>Radiology</source>
          <year>1989</year>
          <volume>173</volume>
          <fpage>265</fpage>
          <lpage>267</lpage>
          <pub-id pub-id-type="doi">10.1148/radiology.173.1.2781018</pub-id>
          <pub-id pub-id-type="pmid">2781018</pub-id>
        </element-citation>
      </ref>
      <ref id="B19-diagnostics-14-00997">
        <label>19.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Antoniadi</surname>
              <given-names>A.M.</given-names>
            </name>
            <name>
              <surname>Du</surname>
              <given-names>Y.</given-names>
            </name>
            <name>
              <surname>Guendouz</surname>
              <given-names>Y.</given-names>
            </name>
            <name>
              <surname>Wei</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Mazo</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Becker</surname>
              <given-names>B.A.</given-names>
            </name>
            <name>
              <surname>Mooney</surname>
              <given-names>C.</given-names>
            </name>
          </person-group>
          <article-title>Current Challenges and Future Opportunities for Xai in Machine Learning-Based Clinical Decision Support Systems: A Systematic Review</article-title>
          <source>Appl. Sci.</source>
          <year>2021</year>
          <volume>11</volume>
          <elocation-id>5088</elocation-id>
          <pub-id pub-id-type="doi">10.3390/app11115088</pub-id>
        </element-citation>
      </ref>
      <ref id="B20-diagnostics-14-00997">
        <label>20.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Salahuddin</surname>
              <given-names>Z.</given-names>
            </name>
            <name>
              <surname>Woodruff</surname>
              <given-names>H.C.</given-names>
            </name>
            <name>
              <surname>Chatterjee</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Lambin</surname>
              <given-names>P.</given-names>
            </name>
          </person-group>
          <article-title>Transparency of Deep Neural Networks for Medical Image Analysis: A Review of Interpretability Methods</article-title>
          <source>Comput. Biol. Med.</source>
          <year>2022</year>
          <volume>140</volume>
          <elocation-id>105111</elocation-id>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2021.105111</pub-id>
        </element-citation>
      </ref>
      <ref id="B21-diagnostics-14-00997">
        <label>21.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Zhang</surname>
              <given-names>Y.</given-names>
            </name>
            <name>
              <surname>Tino</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Leonardis</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Tang</surname>
              <given-names>K.</given-names>
            </name>
          </person-group>
          <article-title>A Survey on Neural Network Interpretability</article-title>
          <source>IEEE Trans. Emerg. Top. Comput. Intell.</source>
          <year>2021</year>
          <volume>5</volume>
          <fpage>726</fpage>
          <lpage>742</lpage>
          <pub-id pub-id-type="doi">10.1109/TETCI.2021.3100641</pub-id>
        </element-citation>
      </ref>
      <ref id="B22-diagnostics-14-00997">
        <label>22.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Tjoa</surname>
              <given-names>E.</given-names>
            </name>
            <name>
              <surname>Guan</surname>
              <given-names>C.</given-names>
            </name>
          </person-group>
          <article-title>A Survey on Explainable Artificial Intelligence (XAI): Toward Medical XAI</article-title>
          <source>IEEE Trans. Neural Networks Learn. Syst.</source>
          <year>2021</year>
          <volume>32</volume>
          <fpage>4793</fpage>
          <lpage>4813</lpage>
          <pub-id pub-id-type="doi">10.1109/TNNLS.2020.3027314</pub-id>
        </element-citation>
      </ref>
      <ref id="B23-diagnostics-14-00997">
        <label>23.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Vellido</surname>
              <given-names>A.</given-names>
            </name>
          </person-group>
          <article-title>The Importance of Interpretability and Visualization in Machine Learning for Applications in Medicine and Health Care</article-title>
          <source>Neural Comput. Appl.</source>
          <year>2020</year>
          <volume>32</volume>
          <fpage>18069</fpage>
          <lpage>18083</lpage>
          <pub-id pub-id-type="doi">10.1007/s00521-019-04051-w</pub-id>
        </element-citation>
      </ref>
      <ref id="B24-diagnostics-14-00997">
        <label>24.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pereira</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Meier</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Alves</surname>
              <given-names>V.</given-names>
            </name>
            <name>
              <surname>Reyes</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Silva</surname>
              <given-names>C.A.</given-names>
            </name>
          </person-group>
          <article-title>Automatic Brain Tumor Grading from MRI Data Using Convolutional Neural Networks and Quality Assessment</article-title>
          <source>Lect. Notes Comput. Sci. (Incl. Subser. Lect. Notes Artif. Intell. Lect. Notes Bioinform.)</source>
          <year>2018</year>
          <volume>11038</volume>
          <fpage>106</fpage>
          <lpage>114</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-02628-8_12</pub-id>
          <pub-id pub-id-type="pmid">38370860</pub-id>
        </element-citation>
      </ref>
      <ref id="B25-diagnostics-14-00997">
        <label>25.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Artzi</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Redmard</surname>
              <given-names>E.</given-names>
            </name>
            <name>
              <surname>Tzemach</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Zeltser</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Gropper</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Roth</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Shofty</surname>
              <given-names>B.</given-names>
            </name>
            <name>
              <surname>Kozyrev</surname>
              <given-names>D.A.</given-names>
            </name>
            <name>
              <surname>Constantini</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Ben-Sira</surname>
              <given-names>L.</given-names>
            </name>
          </person-group>
          <article-title>Classification of Pediatric Posterior Fossa Tumors Using Convolutional Neural Network and Tabular Data</article-title>
          <source>IEEE Access</source>
          <year>2021</year>
          <volume>9</volume>
          <fpage>91966</fpage>
          <lpage>91973</lpage>
          <pub-id pub-id-type="doi">10.1109/ACCESS.2021.3085771</pub-id>
        </element-citation>
      </ref>
      <ref id="B26-diagnostics-14-00997">
        <label>26.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Marmolejo-Saucedo</surname>
              <given-names>J.A.</given-names>
            </name>
            <name>
              <surname>Kose</surname>
              <given-names>U.</given-names>
            </name>
          </person-group>
          <article-title>Numerical Grad-Cam Based Explainable Convolutional Neural Network for Brain Tumor Diagnosis</article-title>
          <source>Mob. Networks Appl.</source>
          <year>2022</year>
          <pub-id pub-id-type="doi">10.1007/s11036-022-02021-6</pub-id>
        </element-citation>
      </ref>
      <ref id="B27-diagnostics-14-00997">
        <label>27.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Gaur</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Bhandari</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Razdan</surname>
              <given-names>T.</given-names>
            </name>
            <name>
              <surname>Mallik</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Zhao</surname>
              <given-names>Z.</given-names>
            </name>
          </person-group>
          <article-title>Explanation-Driven Deep Learning Model for Prediction of Brain Tumour Status Using MRI Image Data</article-title>
          <source>Front. Genet.</source>
          <year>2022</year>
          <volume>13</volume>
          <fpage>822666</fpage>
          <pub-id pub-id-type="doi">10.3389/fgene.2022.822666</pub-id>
        </element-citation>
      </ref>
      <ref id="B28-diagnostics-14-00997">
        <label>28.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Thomson</surname>
              <given-names>W.</given-names>
            </name>
            <name>
              <surname>Roth</surname>
              <given-names>A.E.</given-names>
            </name>
          </person-group>
          <article-title>The Shapley Value: Essays in Honor of Lloyd S. Shapley</article-title>
          <source>Economica</source>
          <year>1991</year>
          <volume>58</volume>
          <fpage>123</fpage>
          <lpage>124</lpage>
          <pub-id pub-id-type="doi">10.2307/2554979</pub-id>
        </element-citation>
      </ref>
      <ref id="B29-diagnostics-14-00997">
        <label>29.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ribeiro</surname>
              <given-names>M.T.</given-names>
            </name>
            <name>
              <surname>Singh</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Guestrin</surname>
              <given-names>C.</given-names>
            </name>
          </person-group>
          <article-title>“Why Should i Trust You?” Explaining the Predictions of Any Classifier</article-title>
          <source>Proc. ACM SIGKDD Int. Conf. Knowl. Discov. Data Min.</source>
          <year>2016</year>
          <volume>13</volume>
          <fpage>1135</fpage>
          <lpage>1144</lpage>
          <pub-id pub-id-type="doi">10.1145/2939672.2939778</pub-id>
        </element-citation>
      </ref>
      <ref id="B30-diagnostics-14-00997">
        <label>30.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Pintelas</surname>
              <given-names>E.</given-names>
            </name>
            <name>
              <surname>Liaskos</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Livieris</surname>
              <given-names>I.E.</given-names>
            </name>
            <name>
              <surname>Kotsiantis</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Pintelas</surname>
              <given-names>P.</given-names>
            </name>
          </person-group>
          <article-title>Explainable Machine Learning Framework for Image Classification Problems: Case Study on Glioma Cancer Prediction</article-title>
          <source>J. Imaging</source>
          <year>2020</year>
          <volume>6</volume>
          <elocation-id>37</elocation-id>
          <pub-id pub-id-type="doi">10.3390/JIMAGING6060037</pub-id>
          <pub-id pub-id-type="pmid">34460583</pub-id>
        </element-citation>
      </ref>
      <ref id="B31-diagnostics-14-00997">
        <label>31.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Niu</surname>
              <given-names>Z.</given-names>
            </name>
            <name>
              <surname>Zhong</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Yu</surname>
              <given-names>H.</given-names>
            </name>
          </person-group>
          <article-title>A Review on the Attention Mechanism of Deep Learning</article-title>
          <source>Neurocomputing</source>
          <year>2021</year>
          <volume>452</volume>
          <fpage>48</fpage>
          <lpage>62</lpage>
          <pub-id pub-id-type="doi">10.1016/j.neucom.2021.03.091</pub-id>
        </element-citation>
      </ref>
      <ref id="B32-diagnostics-14-00997">
        <label>32.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Chen</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Li</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Tao</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Barnett</surname>
              <given-names>A.J.</given-names>
            </name>
            <name>
              <surname>Su</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Rudin</surname>
              <given-names>C.</given-names>
            </name>
          </person-group>
          <article-title>This Looks like That: Deep Learning for Interpretable Image Recognition</article-title>
          <source>Adv. Neural Inf. Process. Syst.</source>
          <year>2019</year>
          <volume>32</volume>
          <fpage>1</fpage>
          <lpage>12</lpage>
        </element-citation>
      </ref>
      <ref id="B33-diagnostics-14-00997">
        <label>33.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Menze</surname>
              <given-names>B.H.</given-names>
            </name>
            <name>
              <surname>Jakab</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Bauer</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Kalpathy-Cramer</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Farahani</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Kirby</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Burren</surname>
              <given-names>Y.</given-names>
            </name>
            <name>
              <surname>Porz</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Slotboom</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Wiest</surname>
              <given-names>R.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>The Multimodal Brain Tumor Image Segmentation Benchmark (BRATS)</article-title>
          <source>IEEE Trans. Med. Imaging</source>
          <year>2015</year>
          <volume>34</volume>
          <fpage>1993</fpage>
          <lpage>2024</lpage>
          <pub-id pub-id-type="doi">10.1109/TMI.2014.2377694</pub-id>
          <pub-id pub-id-type="pmid">25494501</pub-id>
        </element-citation>
      </ref>
      <ref id="B34-diagnostics-14-00997">
        <label>34.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bakas</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Akbari</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Sotiras</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Bilello</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Rozycki</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Kirby</surname>
              <given-names>J.S.</given-names>
            </name>
            <name>
              <surname>Freymann</surname>
              <given-names>J.B.</given-names>
            </name>
            <name>
              <surname>Farahani</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Davatzikos</surname>
              <given-names>C.</given-names>
            </name>
          </person-group>
          <article-title>Advancing The Cancer Genome Atlas Glioma MRI Collections with Expert Segmentation Labels and Radiomic Features</article-title>
          <source>Sci. Data</source>
          <year>2017</year>
          <volume>4</volume>
          <fpage>170117</fpage>
          <pub-id pub-id-type="doi">10.1038/sdata.2017.117</pub-id>
          <pub-id pub-id-type="pmid">28872634</pub-id>
        </element-citation>
      </ref>
      <ref id="B35-diagnostics-14-00997">
        <label>35.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Bakas</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Reyes</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Jakab</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Bauer</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Rempfler</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Crimi</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Shinohara</surname>
              <given-names>R.T.</given-names>
            </name>
            <name>
              <surname>Berger</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Ha</surname>
              <given-names>S.M.</given-names>
            </name>
            <name>
              <surname>Rozycki</surname>
              <given-names>M.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>Identifying the Best Machine Learning Algorithms for Brain Tumor Segmentation, Progression Assessment, and Overall Survival Prediction in the BRATS Challenge</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <pub-id pub-id-type="arxiv">1811.02629</pub-id>
        </element-citation>
      </ref>
      <ref id="B36-diagnostics-14-00997">
        <label>36.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Singh</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Yow</surname>
              <given-names>K.C.</given-names>
            </name>
          </person-group>
          <article-title>These Do Not Look like Those: An Interpretable Deep Learning Model for Image Recognition</article-title>
          <source>IEEE Access</source>
          <year>2021</year>
          <volume>9</volume>
          <fpage>41482</fpage>
          <lpage>41493</lpage>
          <pub-id pub-id-type="doi">10.1109/ACCESS.2021.3064838</pub-id>
        </element-citation>
      </ref>
      <ref id="B37-diagnostics-14-00997">
        <label>37.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Russakovsky</surname>
              <given-names>O.</given-names>
            </name>
            <name>
              <surname>Deng</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Su</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>Krause</surname>
              <given-names>J.</given-names>
            </name>
            <name>
              <surname>Satheesh</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Ma</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Huang</surname>
              <given-names>Z.</given-names>
            </name>
            <name>
              <surname>Karpathy</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Khosla</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Bernstein</surname>
              <given-names>M.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>ImageNet Large Scale Visual Recognition Challenge</article-title>
          <source>Int. J. Comput. Vis.</source>
          <year>2015</year>
          <volume>115</volume>
          <fpage>211</fpage>
          <lpage>252</lpage>
          <pub-id pub-id-type="doi">10.1007/s11263-015-0816-y</pub-id>
        </element-citation>
      </ref>
      <ref id="B38-diagnostics-14-00997">
        <label>38.</label>
        <element-citation publication-type="confproc">
          <person-group person-group-type="author">
            <name>
              <surname>He</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Zhang</surname>
              <given-names>X.</given-names>
            </name>
            <name>
              <surname>Ren</surname>
              <given-names>S.</given-names>
            </name>
            <name>
              <surname>Sun</surname>
              <given-names>J.</given-names>
            </name>
          </person-group>
          <article-title>Delving Deep into Rectifiers: Surpassing Human-Level Performance on ImageNet Classification</article-title>
          <source>Proceedings of the 2015 IEEE International Conference on Computer Vision (ICCV)</source>
          <conf-loc>Santiago, Chile</conf-loc>
          <conf-date>7–13 December 2015</conf-date>
          <fpage>1026</fpage>
          <lpage>1034</lpage>
          <pub-id pub-id-type="doi">10.1109/ICCV.2015.123</pub-id>
        </element-citation>
      </ref>
      <ref id="B39-diagnostics-14-00997">
        <label>39.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Reyes</surname>
              <given-names>D.</given-names>
            </name>
            <name>
              <surname>Sánchez</surname>
              <given-names>J.</given-names>
            </name>
          </person-group>
          <article-title>Performance of Convolutional Neural Networks for the Classification of Brain Tumors Using Magnetic Resonance Imaging</article-title>
          <source>Heliyon</source>
          <year>2024</year>
          <volume>10</volume>
          <fpage>e25468</fpage>
          <pub-id pub-id-type="doi">10.1016/j.heliyon.2024.e25468</pub-id>
          <pub-id pub-id-type="pmid">38352765</pub-id>
        </element-citation>
      </ref>
      <ref id="B40-diagnostics-14-00997">
        <label>40.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Guo</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Unberath</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Heo</surname>
              <given-names>H.Y.</given-names>
            </name>
            <name>
              <surname>Eberhart</surname>
              <given-names>C.G.</given-names>
            </name>
            <name>
              <surname>Lim</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Blakeley</surname>
              <given-names>J.O.</given-names>
            </name>
            <name>
              <surname>Jiang</surname>
              <given-names>S.</given-names>
            </name>
          </person-group>
          <article-title>Learning-Based Analysis of Amide Proton Transfer-Weighted MRI to Identify True Progression in Glioma Patients</article-title>
          <source>NeuroImage Clin.</source>
          <year>2022</year>
          <volume>35</volume>
          <fpage>103121</fpage>
          <pub-id pub-id-type="doi">10.1016/j.nicl.2022.103121</pub-id>
          <pub-id pub-id-type="pmid">35905666</pub-id>
        </element-citation>
      </ref>
      <ref id="B41-diagnostics-14-00997">
        <label>41.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Ranjith</surname>
              <given-names>G.</given-names>
            </name>
            <name>
              <surname>Parvathy</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Vikas</surname>
              <given-names>V.</given-names>
            </name>
            <name>
              <surname>Chandrasekharan</surname>
              <given-names>K.</given-names>
            </name>
            <name>
              <surname>Nair</surname>
              <given-names>S.</given-names>
            </name>
          </person-group>
          <article-title>Machine Learning Methods for the Classification of Gliomas: Initial Results Using Features Extracted from MR Spectroscopy</article-title>
          <source>Neuroradiol. J.</source>
          <year>2015</year>
          <volume>28</volume>
          <fpage>106</fpage>
          <lpage>111</lpage>
          <pub-id pub-id-type="doi">10.1177/1971400915576637</pub-id>
          <pub-id pub-id-type="pmid">25923676</pub-id>
        </element-citation>
      </ref>
      <ref id="B42-diagnostics-14-00997">
        <label>42.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Laurence</surname>
              <given-names>M.</given-names>
            </name>
            <name>
              <surname>Rolando</surname>
              <given-names>F.D.M.</given-names>
            </name>
            <name>
              <surname>Kevin</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>David</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Claire</surname>
              <given-names>H.</given-names>
            </name>
            <name>
              <surname>D Louis</surname>
              <given-names>C.</given-names>
            </name>
          </person-group>
          <article-title>Online Database of Clinical MR and Ultrasound Images of Brain Tumors</article-title>
          <source>Med. Phys.</source>
          <year>2012</year>
          <volume>39</volume>
          <fpage>3253</fpage>
          <lpage>3261</lpage>
          <pub-id pub-id-type="doi">10.1118/1.4709600</pub-id>
        </element-citation>
      </ref>
      <ref id="B43-diagnostics-14-00997">
        <label>43.</label>
        <element-citation publication-type="journal">
          <person-group person-group-type="author">
            <name>
              <surname>Juvekar</surname>
              <given-names>P.</given-names>
            </name>
            <name>
              <surname>Dorent</surname>
              <given-names>R.</given-names>
            </name>
            <name>
              <surname>Ogl</surname>
              <given-names>F.K.</given-names>
            </name>
            <name>
              <surname>Torio</surname>
              <given-names>E.</given-names>
            </name>
            <name>
              <surname>Barr</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Rigolo</surname>
              <given-names>L.</given-names>
            </name>
            <name>
              <surname>Galvin</surname>
              <given-names>C.</given-names>
            </name>
            <name>
              <surname>Jowkar</surname>
              <given-names>N.</given-names>
            </name>
            <name>
              <surname>Kazi</surname>
              <given-names>A.</given-names>
            </name>
            <name>
              <surname>Haouchine</surname>
              <given-names>N.</given-names>
            </name>
            <etal/>
          </person-group>
          <article-title>ReMIND: The Brain Resection Multimodal Imaging Database</article-title>
          <source>medRxiv</source>
          <year>2023</year>
          <pub-id pub-id-type="doi">10.1101/2023.09.14.23295596</pub-id>
        </element-citation>
      </ref>
    </ref-list>
    <sec sec-type="display-objects">
      <title>Figures and Tables</title>
      <fig id="diagnostics-14-00997-f001" position="float">
        <label>Figure 1</label>
        <caption>
          <p>Global and local explanations provided by the proposed IMPA-Net. (<bold>a</bold>) Research context illustrates the importance and basic ideas of global and local explanations for deep learning-based brain tumor classification. It outlines the problems in this research field that the proposed IMPA-Net attempts to address; (<bold>b</bold>) local explanation: given an input image, IMPA-Net compares the activated parts of the input image with the feature patterns and thereby predicts the tumor grade; (<bold>c</bold>) global explanation can be interpreted as the class-representative features the entire model learns to distinguish two classes.</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="diagnostics-14-00997-g001.tif"/>
      </fig>
      <fig id="diagnostics-14-00997-f002" position="float">
        <label>Figure 2</label>
        <caption>
          <p>The overall workflow of the development and evaluation of the proposed methodology.</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="diagnostics-14-00997-g002.tif"/>
      </fig>
      <fig id="diagnostics-14-00997-f003" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Schematic diagram of the proposed IMPA-Net. It consists of three modules: a feature extractor, a multi-part attention block, and a similarity-based classifier. The feature patterns within the multi-part attention block are learned from the push dataset during the training phase.</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="diagnostics-14-00997-g003.tif"/>
      </fig>
      <fig id="diagnostics-14-00997-f004" position="float">
        <label>Figure 4</label>
        <caption>
          <p>Six learned feature patterns and activation maps of HGG (<bold>a</bold>) and LGG (<bold>b</bold>) selected to represent different clinically relevant discriminative features of each class learned by the model. Training image where feature pattern comes from (feature pattern in box); Activation map (warmer colors indicate higher activation).</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="diagnostics-14-00997-g004.tif"/>
      </fig>
      <fig id="diagnostics-14-00997-f005" position="float">
        <label>Figure 5</label>
        <caption>
          <p>The reasoning process of our network for deciding the grade of a tumor. There are ten rows, split into two groups for ease of presentation: (<bold>a</bold>) top 1~#5th part attention between a patch of the test image and feature pattern, (<bold>b</bold>) #6th~#10th part attention between a patch of the test image and feature pattern. Each row is organized as follows: in the leftmost column a yellow rectangle generated by the proposed model is superimposed on the test image, showing a part that looks like a feature pattern; second column, an enlargement of the part of the test image considered by the model to look similar to the feature pattern (shown in col. 4); third column: activation maps indicating how similar each featured pattern resembles part of the test image, in which warmer color indicates higher responses; fifth column: training images where feature pattern comes from; sixth column: corresponding activation maps. The final columns quantify the result of the comparison. Column 7: similarity score between the localized prototypical part of the test image (col. 2) and the feature pattern (col. 4). Column 8: class connection values generated by the proposed model correspond to the class-connection weight connection between the feature patterns and the logit of class. Column 9: weighted similarity scores between the localized prototypical patches of the test image with top-10 feature patterns.</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="diagnostics-14-00997-g005.tif"/>
      </fig>
      <fig id="diagnostics-14-00997-f006" position="float">
        <label>Figure 6</label>
        <caption>
          <p>Example output showing the reasoning process of our network in deciding the grade of an LGG tumor, (<bold>a</bold>) top 1~#5th part attention between a patch of the test image and feature pattern, (<bold>b</bold>) #6th~#10th part attention between a patch of the test image and feature pattern.</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="diagnostics-14-00997-g006.tif"/>
      </fig>
      <fig id="diagnostics-14-00997-f007" position="float">
        <label>Figure 7</label>
        <caption>
          <p>Representability of the feature patterns. The explanations on two input MR images are shown for the feature pattern that has the largest class-connection weight on each class.</p>
        </caption>
        <graphic xmlns:xlink="http://www.w3.org/1999/xlink" xlink:href="diagnostics-14-00997-g007.tif"/>
      </fig>
      <table-wrap id="diagnostics-14-00997-t001" position="float">
        <object-id pub-id-type="pii">diagnostics-14-00997-t001_Table 1</object-id>
        <label>Table 1</label>
        <caption>
          <p>Comparison of the classification performance of our interpretable model with the baseline model.</p>
        </caption>
        <table>
          <thead>
            <tr>
              <th rowspan="2" align="center" valign="middle" style="border-top:solid thin;border-bottom:solid thin">Model
              </th>
              <th colspan="5" align="center" valign="middle" style="border-top:solid thin;border-bottom:solid thin">Performance Metrics</th>
            </tr>
            <tr>
              <th align="center" valign="middle" style="border-bottom:solid thin">ACC</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">PRE</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">SPE</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">SEN</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">F<sub>1</sub> Score</th>
            </tr>
          </thead>
          <tbody>
            <tr>
              <td align="center" valign="middle">Baseline model</td>
              <td align="center" valign="middle">97.30%</td>
              <td align="center" valign="middle">99.18%</td>
              <td align="center" valign="middle">98.96%</td>
              <td align="center" valign="middle">96.03%</td>
              <td align="center" valign="middle">0.9758</td>
            </tr>
            <tr>
              <td align="center" valign="middle">Our model before exclusion</td>
              <td align="center" valign="middle">85.59%</td>
              <td align="center" valign="middle">89.17%</td>
              <td align="center" valign="middle">86.46%</td>
              <td align="center" valign="middle">84.92%</td>
              <td align="center" valign="middle">0.8699</td>
            </tr>
            <tr>
              <td align="center" valign="middle" style="border-bottom:solid thin">Our model after exclusion</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">92.12%</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">94.65%</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">93.23%</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">91.27%</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">0.9293</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap id="diagnostics-14-00997-t002" position="float">
        <object-id pub-id-type="pii">diagnostics-14-00997-t002_Table 2</object-id>
        <label>Table 2</label>
        <caption>
          <p>Summary of the number of feature patterns (top 10) consistent or inconsistent with the actual class of test images among all test cases, unreliable predictions, wrong predictions, and correct predictions (TP and TN predictions), summarized as mean (standard deviation) of the fraction of feature patterns among the top 10 that match or mismatch to the actual class of test images.</p>
        </caption>
        <table>
          <thead>
            <tr>
              <th rowspan="2" align="center" valign="middle" style="border-top:solid thin">Class of Feature Pattern
              </th>
              <th colspan="8" align="center" valign="middle" style="border-top:solid thin;border-bottom:solid thin">Class of Test Image
              </th>
            </tr>
            <tr>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">All Test Cases</th>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">Unreliable Predictions <sup>1</sup></th>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">Wrong Predictions <sup>2</sup></th>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">Correct Predictions <sup>3</sup></th>
            </tr>
            <tr>
              <th align="center" valign="middle" style="border-bottom:solid thin"> </th>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
            </tr>
          </thead>
          <tbody>
            <tr>
              <td align="center" valign="middle">
              HGG
              </td>
              <td align="center" valign="middle">9.29 (2.27)</td>
              <td align="center" valign="middle">0.90 (2.26)</td>
              <td align="center" valign="middle">9.87 (0.41)</td>
              <td align="center" valign="middle">1.56 (1.17)</td>
              <td align="center" valign="middle">2.09 (1.27)</td>
              <td align="center" valign="middle">8.62 (1.26)</td>
              <td align="center" valign="middle">9.98 (0.17)</td>
              <td align="center" valign="middle">0.34 (0.84)</td>
            </tr>
            <tr>
              <td align="center" valign="middle" style="border-bottom:solid thin">
              LGG
              </td>
              <td align="center" valign="middle" style="border-bottom:solid thin">0.71 (2.27)</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">9.10 (2.26)</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">0.13 (0.41)</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">8.44 (1.17)</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">7.91 (1.27)</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">1.38 (1.26)</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">0.02 (0.17)</td>
              <td align="center" valign="middle" style="border-bottom:solid thin">9.66 (0.84)</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn>
            <p>Note: <sup>1</sup> Unreliable predictions are cases among {TP, TN} predictions that are evaluated to be unreliable according to the two identified reliability criteria. <sup>2</sup> Wrong predictions are {FP, FN}. <sup>3</sup> Correct predictions are {unreliable predictions, reliable predictions}.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap id="diagnostics-14-00997-t003" position="float">
        <object-id pub-id-type="pii">diagnostics-14-00997-t003_Table 3</object-id>
        <label>Table 3</label>
        <caption>
          <p>The numbers of incorrectly activated background patches by the top 10 feature patterns were given as mean (standard deviation) of the fraction of feature patterns among the top 10 that mismatched the actual class of test images.</p>
        </caption>
        <table>
          <thead>
            <tr>
              <th rowspan="3" align="center" valign="middle" style="border-top:solid thin;border-bottom:solid thin">
            Concept of Activated Patch
              </th>
              <th colspan="8" align="center" valign="middle" style="border-top:solid thin;border-bottom:solid thin">
           Class of Test Image
              </th>
            </tr>
            <tr>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">All Test Images</th>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">Unreliable Predictions</th>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">Wrong Predictions</th>
              <th colspan="2" align="center" valign="middle" style="border-bottom:solid thin">Correct Predictions</th>
            </tr>
            <tr>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">HGG</th>
              <th align="center" valign="middle" style="border-bottom:solid thin">LGG</th>
            </tr>
          </thead>
          <tbody>
            <tr>
              <td rowspan="2" align="center" valign="middle" style="border-bottom:solid thin">Image<break/>background area
              </td>
              <td align="center" valign="middle">0.33 (0.89)</td>
              <td align="center" valign="middle">0.46 (1.40)</td>
              <td align="center" valign="middle">1.37 (1.34)</td>
              <td align="center" valign="middle">1.85 (2.41)</td>
              <td align="center" valign="middle">1.46 (1.44)</td>
              <td align="center" valign="middle">1.23 (1.83)</td>
              <td align="center" valign="middle">0.23 (0.74)</td>
              <td align="center" valign="middle">0.40 (1.35)</td>
            </tr>
            <tr>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">0.39 (1.14)</td>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">1.61 (1.96)</td>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">1.37 (1.57)</td>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">0.30 (1.06)</td>
            </tr>
            <tr>
              <td rowspan="2" align="center" valign="middle" style="border-bottom:solid thin">Brain<break/>background area
              </td>
              <td align="center" valign="middle">0.65 (1.55)</td>
              <td align="center" valign="middle">0.97 (3.19)</td>
              <td align="center" valign="middle">2.61 (2.07)</td>
              <td align="center" valign="middle">4.46 (3.67)</td>
              <td align="center" valign="middle">2.32 (2.30)</td>
              <td align="center" valign="middle">1.00 (0.71)</td>
              <td align="center" valign="middle">0.43 (1.28)</td>
              <td align="center" valign="middle">0.97 (2.51)</td>
            </tr>
            <tr>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">0.75 (11.96)</td>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">3.55 (3.11)</td>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">1.83 (1.96)</td>
              <td colspan="2" align="center" valign="middle" style="border-bottom:solid thin">0.67 (1.93)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
    </sec>
    <fn-group>
      <fn>
        <p><bold>Disclaimer/Publisher’s Note:</bold> The statements, opinions and data contained in all publications are solely those of the individual author(s) and contributor(s) and not of MDPI and/or the editor(s). MDPI and/or the editor(s) disclaim responsibility for any injury to people or property resulting from any ideas, methods, instructions or products referred to in the content.</p>
      </fn>
    </fn-group>
  </back>
</article>
