<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e50328</article-id>
      <article-id pub-id-type="pmid">37955948</article-id>
      <article-id pub-id-type="doi">10.2196/50328</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Mobile App That Addresses Interpretability Challenges in Machine Learning–Based Diabetes Predictions: Survey-Based User Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Fotopoulos</surname>
            <given-names>Dimitris</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Xiaoying</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Hendawi</surname>
            <given-names>Rasha</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5828-2651</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Li</surname>
            <given-names>Juan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>North Dakota State University</institution>
            <addr-line>1340 Administration Ave</addr-line>
            <addr-line>Fargo, ND, 58105</addr-line>
            <country>United States</country>
            <phone>1 (701) 231 8011</phone>
            <email>j.li@ndsu.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7668-5996</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Roy</surname>
            <given-names>Souradip</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2917-9705</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>North Dakota State University</institution>
        <addr-line>Fargo, ND</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Juan Li <email>j.li@ndsu.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>13</day>
        <month>11</month>
        <year>2023</year>
      </pub-date>
      <volume>7</volume>
      <elocation-id>e50328</elocation-id>
      <history>
        <date date-type="received">
          <day>27</day>
          <month>6</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>22</day>
          <month>8</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>12</day>
          <month>9</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>8</day>
          <month>10</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Rasha Hendawi, Juan Li, Souradip Roy. Originally published in JMIR Formative Research (https://formative.jmir.org), 13.11.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2023/1/e50328" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Machine learning approaches, including deep learning, have demonstrated remarkable effectiveness in the diagnosis and prediction of diabetes. However, these approaches often operate as opaque black boxes, leaving health care providers in the dark about the reasoning behind predictions. This opacity poses a barrier to the widespread adoption of machine learning in diabetes and health care, leading to confusion and eroding trust.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to address this critical issue by developing and evaluating an explainable artificial intelligence (AI) platform, XAI4Diabetes, designed to empower health care professionals with a clear understanding of AI-generated predictions and recommendations for diabetes care. XAI4Diabetes not only delivers diabetes risk predictions but also furnishes easily interpretable explanations for complex machine learning models and their outcomes.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>XAI4Diabetes features a versatile multimodule explanation framework that leverages machine learning, knowledge graphs, and ontologies. The platform comprises the following four essential modules: (1) knowledge base, (2) knowledge matching, (3) prediction, and (4) interpretation. By harnessing AI techniques, XAI4Diabetes forecasts diabetes risk and provides valuable insights into the prediction process and outcomes. A structured, survey-based user study assessed the app’s usability and influence on participants’ comprehension of machine learning predictions in real-world patient scenarios.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>A prototype mobile app was meticulously developed and subjected to thorough usability studies and satisfaction surveys. The evaluation study findings underscore the substantial improvement in medical professionals’ comprehension of key aspects, including the (1) diabetes prediction process, (2) data sets used for model training, (3) data features used, and (4) relative significance of different features in prediction outcomes. Most participants reported heightened understanding of and trust in AI predictions following their use of XAI4Diabetes. The satisfaction survey results further revealed a high level of overall user satisfaction with the tool.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>This study introduces XAI4Diabetes, a versatile multi-model explainable prediction platform tailored to diabetes care. By enabling transparent diabetes risk predictions and delivering interpretable insights, XAI4Diabetes empowers health care professionals to comprehend the AI-driven decision-making process, thereby fostering transparency and trust. These advancements hold the potential to mitigate biases and facilitate the broader integration of AI in diabetes care.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>disease prediction</kwd>
        <kwd>explainable AI</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>knowledge graph</kwd>
        <kwd>machine learning</kwd>
        <kwd>ontology</kwd>
        <kwd>diabetes</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec>
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Diabetes is a prevalent chronic disease with severe health implications, affecting millions of individuals around the world. According to the Centers for Disease Control and Prevention, over 37 million Americans (approximately 1 in 10) are affected by diabetes, with type 2 diabetes accounting for 90% to 95% of the cases [<xref ref-type="bibr" rid="ref1">1</xref>]. Artificial intelligence (AI) has brought about transformative advancements in the field of diabetes diagnosis and management. Expert systems using logical rules have been developed to model medical experts’ knowledge, specifically for prediabetes diagnosis [<xref ref-type="bibr" rid="ref2">2</xref>]. Machine learning–based approaches have also been used to construct predictive models for diabetes risk and its associated complications [<xref ref-type="bibr" rid="ref3">3</xref>]. In recent years, deep learning methods have gained prominence in diabetes prediction systems [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Although machine learning models, particularly deep learning models, have demonstrated remarkable predictive performance in predictive analytics [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref11">11</xref>] they often lack transparency in their decision-making process. The ability of health care professionals to comprehend and trust the predictive analyses generated by these models is crucial, as they directly impact human lives. Thus, there is a growing need for explainability or interpretability in machine learning models.</p>
        <p>Existing methods for explaining machine learning model predictions have been extensively studied, such as in the studies by Pintelas et al [<xref ref-type="bibr" rid="ref12">12</xref>], Tasin et al [<xref ref-type="bibr" rid="ref13">13</xref>], Davagdorj et al [<xref ref-type="bibr" rid="ref14">14</xref>], Abdulsalam et al [<xref ref-type="bibr" rid="ref15">15</xref>], Gao et al [<xref ref-type="bibr" rid="ref16">16</xref>], Joseph et al [<xref ref-type="bibr" rid="ref17">17</xref>], Ibrahim et al [<xref ref-type="bibr" rid="ref18">18</xref>], Du et al [<xref ref-type="bibr" rid="ref19">19</xref>], Nagaraj et al [<xref ref-type="bibr" rid="ref20">20</xref>], Maillot and Thonnat [<xref ref-type="bibr" rid="ref21">21</xref>], Icarte et al [<xref ref-type="bibr" rid="ref22">22</xref>], Daniels et al [<xref ref-type="bibr" rid="ref23">23</xref>], Zafar and Khan [<xref ref-type="bibr" rid="ref24">24</xref>], Srinivasu et al [<xref ref-type="bibr" rid="ref25">25</xref>], Gerlings et al [<xref ref-type="bibr" rid="ref26">26</xref>], and Dave et al [<xref ref-type="bibr" rid="ref27">27</xref>]. However, these methods often have limitations in providing comprehensive and easily understandable insights into the decision-making process [<xref ref-type="bibr" rid="ref28">28</xref>]. Although explainable models such as local interpretable model-agnostic explanations (LIME) and Shapley additive explanations (SHAP) have made progress in increasing transparency, their explanations can still be challenging for nonexperts, including health care providers, to comprehend [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Moreover, these methods primarily focus on explaining the results without diving into the underlying mechanisms, specific machine learning techniques, or training data sets and features.</p>
        <p>Therefore, there is a need to enhance the clarity and comprehensibility of explanations regarding how machine learning models arrive at their predictions, including the entire process from data use to model generation, as well as to interpret the results accurately. This comprehensive understanding is crucial for health care providers to trust and effectively use the predictions provided by these models. By addressing these limitations, we can bridge the gap between complex machine learning models and their practical applicability in health care and other domains.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The primary objective of our study was to address the pressing need for improving the interpretability of machine learning predictions in the context of diabetes risk assessment. Specifically, we aimed to overcome the limitations of existing approaches by developing and evaluating a comprehensive explanation framework that encompasses the entire prediction process, from data use to model generation to diabetes risk prediction results. This framework was designed to bridge the gap between complex machine learning models and their practical applicability in health care and other domains.</p>
        <p>Our study sought to achieve the following specific objectives:</p>
        <list list-type="order">
          <list-item>
            <p>Develop a robust and comprehensive explanation framework that enhances the transparency and interpretability of machine learning–based diabetes risk predictions.</p>
          </list-item>
          <list-item>
            <p>Create an AI platform, XAI4Diabetes, that incorporates the explanation framework and facilitates easy comprehension of the prediction process by health care professionals.</p>
          </list-item>
          <list-item>
            <p>Evaluate the usability and effectiveness of XAI4Diabetes through rigorous usability studies and satisfaction surveys among health care providers.</p>
          </list-item>
        </list>
        <p>By addressing the limitations of existing methods and providing clear, interpretable insights into how machine learning models arrive at their predictions, we aimed to empower health care providers to trust and effectively use the predictions generated by these models. Ultimately, our research contributed to the broader goal of fostering transparency and trust in AI applications in health care, with the potential to improve diabetes care and, by extension, health care in general.</p>
      </sec>
    </sec>
    <sec>
      <title>Methods</title>
      <sec>
        <title>Ethics Approval</title>
        <p>This study was approved by the institutional review board of North Dakota State University (IRB0004513).</p>
      </sec>
      <sec>
        <title>System Overview</title>
        <p>The proposed framework, shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>, consists of the following 4 key modules: the knowledge base, knowledge matching, prediction, and interpretation modules.</p>
        <p>The knowledge base module serves as the foundation of the platform and uses a knowledge graph (KG) constructed from ontologies, semantic rules, and external knowledge sources. It provides machine-interpretable representations of the entire prediction process, capturing relevant information for the task. Within the prediction module, machine learning algorithms are trained and tested on diabetes-related data sets to predict the associated risks. The knowledge matching module plays a vital role in mapping data sets, machine learning algorithms, and their properties (such as hyperparameters) to the entities within the KG. The interpretation module is pivotal for providing comprehensive explanations. It elucidates data set features, underlying machine learning models, and prediction results. By offering these explanations, our platform aims to enhance the understanding of health care stakeholders regarding the functioning of the models and insights derived from the prediction process. In the subsequent subsections, we provide detailed explanations of each module within the framework.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>The architecture of the system. KG: knowledge graph; SNOMED CT: Systematized Nomenclature of Medicine Clinical Terms.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Knowledge Base Module</title>
        <p>The knowledge base module serves as a foundational component of our platform, providing a comprehensive understanding of the key concepts, relationships, and rules necessary for explaining the machine learning model. To achieve this, we leveraged 2 primary ontologies: the diabetes ontology and machine learning ontology. These ontologies serve as formalized and standardized representations of their respective domains, facilitating a structured and organized approach to knowledge representation.</p>
        <p>We began by defining top-level concepts and relationships within the diabetes ontology, which acts as the core knowledge representation for diabetes-related concepts and relationships in our system. In this ontology, we built upon existing ontologies, such as the Diabetes Mellitus Diagnosis Ontology [<xref ref-type="bibr" rid="ref31">31</xref>], which captures various aspects of diabetes, including its clinical presentation, diagnosis, treatment, and complications. We extended this ontology by incorporating additional classes and properties to encompass lifestyle interventions, complications, and health care providers. For instance, classes such as physical activity, diet, smoking status, and alcohol consumption were added to capture crucial lifestyle factors that influence diabetes management. <xref rid="figure2" ref-type="fig">Figure 2</xref> provides an overview of the major concepts and relationships within the high-level diabetes ontology. The top-level classes of the diabetes ontology include “DiabetesComplication,” “Drug,” “Symptom,” “Diagnosis,” “Disease,” “DemographicInfo,” “Examination,” “LaboratoryTests,” “Intervention,” “Patient,” “PhysicalFinding,” and “RiskFactor.” This enriched diabetes ontology acts as the bedrock upon which the KG is built.</p>
        <p>The KG is an integral part of our platform. The KG, represented in a graph format, further extends the semantic layer of the diabetes ontology. In the KG, nodes represent entities such as diabetes complications, diabetes medications, diabetes symptoms, and other relevant elements. The edges within the KG symbolize the relationships connecting these entities. For instance, the diabetes ontology may include a concept such as <italic>diabetes</italic>, which forms relationships with other concepts such as <italic>complications</italic>, <italic>insulin therapy</italic>, and <italic>medications</italic>. Each of these concepts is represented as nodes within the KG, with edges establishing connections among them to reflect their associations. To enrich the semantic layer and enhance the depth and breadth of diabetes-related information, we incorporated external knowledge sources such as UMLS (Unified Medical Language System) [<xref ref-type="bibr" rid="ref32">32</xref>], SNOWMED CT (Systematized Nomenclature of Medicine Clinical Terms) [<xref ref-type="bibr" rid="ref33">33</xref>], and Wikidata [<xref ref-type="bibr" rid="ref34">34</xref>] into the KG. Through this integration, a broader knowledge base can be drawn upon. The connections between our locally defined knowledge and external sources are established through KG links. This interconnected approach enables access to external knowledge on demand, providing a more comprehensive knowledge representation.</p>
        <p>In addition, the KG is designed to be dynamic and adaptable, allowing for the incorporation of new knowledge and concepts as they emerge.</p>
        <p>The KG plays a pivotal role in the explanation process within our platform. It provides a structured framework for generating explanations by connecting relevant concepts and relationships, making the AI-driven predictions more transparent and interpretable for health care professionals.</p>
        <p>By contrast, we developed a dedicated ontology that offers a structured representation of the machine learning domain, primarily based on the MLOnto ontology [<xref ref-type="bibr" rid="ref35">35</xref>]. This ontology encompasses various aspects of machine learning, including algorithms, applications, and types. We extended the ontology by introducing classes and properties specific to evaluation metrics and machine learning purposes. The machine learning ontology helps our platform understand and interpret machine learning model behaviors and results. <xref rid="figure3" ref-type="fig">Figure 3</xref> illustrates a segment of the high-level machine learning ontology, highlighting key concepts such as algorithms, applications, and application purposes.</p>
        <p>The integration of these ontologies into our platform enables it to bridge the gap between complex machine learning models and the practical needs of health care professionals. By leveraging the structured knowledge from these ontologies, our platform provides clear and coherent explanations for AI-driven predictions, fostering transparency and trust among users.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Part of the high-level diabetes ontology (produced by Protégé [version 5.5.0; Stanford University]) [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Part of the high-level machine learning ontology (produced by Protégé [version 5.5.0; Stanford University]) [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Knowledge Matching Module</title>
        <p>The knowledge matching module assumes a pivotal role in our platform, serving as the vital link between data items, such as features extracted from a training data set, and the entities present within the KG. This module’s functionality is rooted in a sophisticated semantic matching process [<xref ref-type="bibr" rid="ref37">37</xref>] that assesses the semantic distances between data items and the semantic entities within the KG.</p>
        <p>To address the challenge of entity ambiguity, wherein a single data item may correspond to multiple candidate entries in the KG, we used advanced techniques grounded in word embeddings. These word embeddings represent words as low-dimensional vectors, effectively capturing their semantics and intricate relationships. Specifically, we leveraged a meticulously pretrained embedding model known as BioWordVec [<xref ref-type="bibr" rid="ref38">38</xref>], which excels in accurately capturing the nuanced meanings of entities within the medical and health care domains. Notably, BioWordVec was constructed using a wealth of data from authoritative sources, including PubMed and clinical notes from the MIMIC-III Clinical Database [<xref ref-type="bibr" rid="ref39">39</xref>]. Contextual information forms another crucial aspect of entity disambiguation within the knowledge matching module. In our case, the context of a data item encompasses other closely related features. By considering the broader context in which a data item appears, our platform significantly enhances its ability to pinpoint the most appropriate entity within the KG.</p>
        <p>Furthermore, the knowledge matching module intelligently explores the relationships among the entities contained within the KG. This examination of entity relationships serves as an additional source of information for disambiguation purposes. When 2 entities exhibit a close and meaningful relationship, it is more likely that the text references the entity that is the most relevant to the given context. This multifaceted approach to entity disambiguation ensures that our platform consistently delivers accurate and contextually appropriate explanations, thereby enhancing the interpretability of AI-driven diabetes predictions for health care professionals.</p>
      </sec>
      <sec>
        <title>Prediction Module</title>
        <p>The prediction module plays a crucial role in our system by using machine learning algorithms for diabetes risk prediction. We carefully selected the algorithms based on several factors, including problem understanding, data analysis, algorithm suitability, and performance evaluation. For our prototype, we worked with 2 data sets: the Pima Indians Diabetes Database [<xref ref-type="bibr" rid="ref40">40</xref>] and the early-stage diabetes risk prediction data set [<xref ref-type="bibr" rid="ref41">41</xref>]. After thorough analysis and testing, we selected 3 models: deep neural network (DNN), random forest (RF), and decision tree (DT).</p>
        <p>To ensure compatibility and consistency in the training process, we applied the <italic>z</italic> score scaling method to normalize the data sets. In addition, we addressed the issue of imbalanced data in the Pima data set using the synthetic minority oversampling technique [<xref ref-type="bibr" rid="ref42">42</xref>] to balance the classes. We then used Tomek links [<xref ref-type="bibr" rid="ref43">43</xref>] to remove any introduced noise. The DNN model consists of 3 hidden layers, with 16 and 8 neurons in the first 2 layers, respectively, using the Sigmoid activation function. The final layer consists of 2 neurons using the SoftMax activation function for multiclass classification. By contrast, both the RF and DT models use entropy as a metric to measure the impurity or uncertainty within a group of observations.</p>
        <p>By leveraging these diverse models, our system aims to improve the accuracy and robustness of diabetes risk predictions. The combination of different algorithms allows the consideration of various aspects and perspectives of the data, leading to a comprehensive and well-rounded approach to prediction.</p>
      </sec>
      <sec>
        <title>Explanation Module</title>
        <p>The explanation model explains machine learning prediction on the following three levels: (1) the machine learning model used for diabetes prediction, (2) data used to train and test the machine learning model, and (3) prediction results generated by the machine learning model.</p>
        <sec>
          <title>Machine Learning Model and Data Set Explanation</title>
          <p>When data scientists create diabetes prediction models using machine learning approaches, instances of the machine learning model will be generated based on the machine learning ontology defined in the previous section. All the metadata about the machine learning model, such as the machine learning algorithm and parameters, are stored in the knowledge in the format of an ontology. Querying and reasoning can be performed on the knowledge base for explanatory purposes.</p>
          <p>To explain the data used for the training and testing of the diabetes prediction model, data features from the data set are mapped to the KG of diabetes. Information in the KG can be used to explain the data features, thus improving the user’s understanding of the training and testing data. A SPARQL [<xref ref-type="bibr" rid="ref44">44</xref>] query is used to query the KG to obtain appropriate information, for example, <italic>what machine learning algorithm and dataset are used to train the prediction model?</italic> This question can be translated into the following SPARQL query:</p>
          <disp-formula>
            <graphic xlink:href="formative_v7i1e50328_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </disp-formula>
          <p>The system retrieves the algorithm and data set information from the machine learning ontology and returns them to the user.</p>
          <p>Moreover, data items (features) are explained by leveraging entities from external KGs such as the Unified Medical Language System, Systematized Nomenclature of Medicine Clinical Terms, and Wikidata. These KGs provide a rich source of information and definitions that can assist in understanding unfamiliar data features. For instance, if a data feature is not known by health care providers, they can access the KG to retrieve the definition and even figures related to that feature, facilitating comprehension. In the <italic>Results</italic> section, we provide detailed examples of how the KG enhances the explanation of data items. These examples demonstrate how the system retrieves relevant information from the KG to help users understand and interpret data features in the context of diabetes risk prediction.</p>
        </sec>
        <sec>
          <title>Prediction Result Explanation</title>
          <sec>
            <title>Overview</title>
            <p>In our prediction result explanation, we adopt 2 perspectives: global explanations and local explanations. Global explanations aim to provide an understanding of the diabetes prediction model as a whole by identifying the data set features (eg, specific symptoms) that have the most substantial influence on the predictions. This perspective helps uncover the overarching patterns and relationships between the features and predictions. By contrast, local explanations focus on explaining how the different input features impact the diabetes prediction for an individual patient. This perspective is particularly valuable for complex models that exhibit varied responses to different combinations of features. By analyzing local explanations, we can gain insights into the specific factors that contribute to a patient’s prediction, enabling personalized interpretations and interventions.</p>
            <p>By incorporating both global and local explanation techniques, we covered a comprehensive range of insights from the macrolevel understanding of the model to the microlevel understanding of individual predictions. This approach provides a holistic view of the model’s behavior and empowers health care providers to make informed decisions based on the explanations tailored to their specific needs.</p>
          </sec>
          <sec>
            <title>Global Explanation</title>
            <p>We adopt the SHAP technique [<xref ref-type="bibr" rid="ref45">45</xref>] to explain the overall prediction model because of its effectiveness in providing interpretable and reliable insights. SHAP offers a game-theoretical approach to attribute the contribution of each feature in the data set to the model’s predictions [<xref ref-type="bibr" rid="ref46">46</xref>]. By quantifying the impact of individual features, SHAP helps understand the relative importance and influence of different factors with regard to the overall predictions. This technique allows for a comprehensive understanding of the prediction model’s behavior and facilitates the communication of these explanations to health care providers. The importance of feature j is defined by the Shapley value [<xref ref-type="bibr" rid="ref46">46</xref>] in the following equation:</p>
            <disp-formula>
              <graphic xlink:href="formative_v7i1e50328_fig12.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
            </disp-formula>
            <p>, which is calculated by averaging its contributions across all possible permutations of feature sets. This allows for the assessment of the individual impact of features on the model’s output and determination of their significance in the prediction process.</p>
          </sec>
          <sec>
            <title>Local Explanation</title>
            <p>For local explanations, we used LIME [<xref ref-type="bibr" rid="ref47">47</xref>]. LIME was chosen for its ability to provide insights into the behavior of the prediction function f(x) in the vicinity of a specific instance. LIME achieves this by generating a new data set of perturbed instances and their corresponding predictions from the black-box model. These perturbations involve the modification of feature values, such as introducing noise to continuous features or removing words from text data. The weighted interpretable model is then trained using this data set, where the weights are assigned based on the proximity of the samples to the original instance being explained. Instances closer to the original have higher weights, whereas those farther away have lower weights. The trained interpretable model estimates the probability of the instances belonging to a specific class, providing a localized explanation for the prediction of a particular instance. LIME may suffer from inherent instability arising from its perturbation technique. Stabilized-LIME for Model Explanation (S-LIME) [<xref ref-type="bibr" rid="ref48">48</xref>] can be used to tackle the problem of instability. S-LIME incorporates a hypothesis testing framework based on the central limit theorem to determine the number of perturbation points required to ensure the stability of the resulting explanations. By quantifying the necessary number of perturbations, S-LIME aims to provide explanations that are more consistent and less prone to fluctuations caused by small data variations.</p>
          </sec>
        </sec>
      </sec>
    </sec>
    <sec>
      <title>Results</title>
      <sec>
        <title>Prototype System</title>
        <p>We developed a mobile app, XAI4Diabetes, based on the proposed approach for predicting diabetes and explaining the prediction. The target users of the mobile app are health care providers who treat patients with diabetes. To use the app, a user can input patient information, such as the patient’s basic information (<xref rid="figure4" ref-type="fig">Figure 4</xref> [left]), examination information (<xref rid="figure4" ref-type="fig">Figure 4</xref> [right]), symptoms (<xref rid="figure5" ref-type="fig">Figure 5</xref>), and family history. Then, the patient’s risk of having diabetes is predicted (<xref rid="figure6" ref-type="fig">Figures 6</xref> [left] and 7 [left]) by the machine learning model. In addition, how this prediction is made by the machine learning model is explained using human-understandable language and figures (<xref rid="figure6" ref-type="fig">Figures 6</xref> [right] and 7 [right]).</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Screenshots of a patient’s basic information (left) and examination information (right).</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Screenshots of patients’ symptom input.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Screenshots of prediction result (left) and explanation based on a patient’s examination (right).</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Screenshots of prediction result (left) and explanation based on patients’ symptoms (right).</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Use Case Study</title>
        <p>In our research, we adopted use case studies to comprehensively evaluate the capabilities and performance of the XAI4Diabetes mobile app. A use case study is a research method commonly used in software development and system evaluation to understand the practical application of a system or technology in real-world scenarios. By creating various use cases, we aimed to simulate different scenarios and interactions that health care providers may encounter when using the app. This approach allowed us to examine the system’s functionality in a practical context and assess its effectiveness in supporting diabetes prediction and explanation tasks.</p>
        <p>In <xref rid="figure4" ref-type="fig">Figure 4</xref>, a user inputs the basic and examination information of a female patient aged 60 years. On the basis of this information, a prediction is made about whether she may have diabetes. The prediction result is shown in <xref rid="figure6" ref-type="fig">Figure 6</xref> (left). As shown in <xref rid="figure6" ref-type="fig">Figure 6</xref> (left), the machine learning model predicts that the patient has an 83% chance of being diagnosed with diabetes. <xref rid="figure6" ref-type="fig">Figure 6</xref> (right) explains why the machine learning model makes this prediction. It shows that the user’s BMI has a huge impact on this decision; the second factor is her blood glucose level. The figure lists some major factors impacting the machine learning model used to make the decision. For different patients, the factors may be quite different.</p>
        <p>The feature importance shown on the mobile app was generated using LIME, as it is suitable for local explanations of individual predictions. The output is a list of features and their corresponding weights, indicating their contribution to the prediction. This provides a better understanding of the model’s behavior for a specific data sample and allows for the identification of the most important features for a prediction. Our system illustrates feature importance in a user-friendly figure that can be interpreted without the need for an expert. To ensure the stability of the explanations, we conducted experiments using S-LIME. Fortunately, the outcomes of these experiments indicated that our explanations remain consistent and reliable, despite the potential instability of LIME.</p>
        <p>In <xref rid="figure5" ref-type="fig">Figure 5</xref>, the user inputs the symptoms of a female patient. The prediction module uses the patient’s symptoms to predict whether she is diabetic (<xref rid="figure7" ref-type="fig">Figure 7</xref> [left]) and to provide an explanation for why the model made this prediction (<xref rid="figure7" ref-type="fig">Figure 7</xref> [right]). As shown in <xref rid="figure7" ref-type="fig">Figure 7</xref> (left), the machine learning model predicts that the patient has a 100% chance of being diagnosed with diabetes. <xref rid="figure7" ref-type="fig">Figure 7</xref> (right) explains why the machine learning model makes this prediction. It shows that the patient has polyuria and that this symptom has the greatest contribution to the prediction result; polydipsia is the second most important factor that impacts the prediction The figure lists the factors with the highest effects on the machine learning prediction.</p>
        <p><xref rid="figure8" ref-type="fig">Figure 8</xref> shows the explanation of one of the features of the data set. The machine learning prediction model was trained using data sets. Users may not be familiar with the data items used in the training data sets. The app provides an explanation interface to help the user understand each data feature of the training and testing data. In the case of <xref rid="figure8" ref-type="fig">Figure 8</xref>, the user may not understand the meaning of the feature <italic>alopecia</italic> used in the data set. Alopecia is one of the common symptoms of diabetes, along with polyuria, polydipsia, polyphagia, weakness, obesity, irritability, genital thrush, and other data set attributes [<xref ref-type="bibr" rid="ref49">49</xref>]. Patients with diabetes are more likely to have alopecia areata [<xref ref-type="bibr" rid="ref50">50</xref>].</p>
        <p>The user can click on a feature, and its explanation is shown, as in <xref rid="figure8" ref-type="fig">Figure 8</xref> (left). More details from external links are provided, as in <xref rid="figure8" ref-type="fig">Figure 8</xref> (right). The knowledge matching module and the interpretation module link this feature to the corresponding KG entity and provide the symptom definition and a link to a trustworthy source for more information (<xref rid="figure8" ref-type="fig">Figure 8</xref> [right]).</p>
        <p>Besides the functions shown in <xref rid="figure4" ref-type="fig">Figures 4</xref>-<xref rid="figure8" ref-type="fig">8</xref>, XAI4Diabetes provides more services, such as detailed information about the data sets used to train the models, for instance, their source, the number of patient cases, and the features. In addition, XAI4Diabetes explains the machine learning model used to make the prediction such as its parameters and algorithms<italic>.</italic> XAI4Diabetes also gives general insight into the importance of each feature that influenced the predictive model. All these functions were evaluated in our user study.</p>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Screenshot of the explanation of one of the data set features (left) [<xref ref-type="bibr" rid="ref51">51</xref>] and detailed information from an external knowledge source (right) [<xref ref-type="bibr" rid="ref52">52</xref>]. CTCAE: Common Terminology Criteria for Adverse Events; FDA: Food and Drug Administration; NCI: National Cancer Institute; NCI-GLOSS: National Cancer Institute-Dictionary of Cancer Terms; NHI: National Institutes of Health.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Prediction Model Evaluation</title>
        <p>The prediction model was evaluated using 2 data sets: the Pima Indians Diabetes Dataset and early-stage diabetes risk prediction data set. The Pima Indians Diabetes Database is a widely used data set consisting of 768 instances representing female patients of Pima Indian heritage. The early-stage diabetes risk prediction data set includes data obtained from 520 individuals, 200 healthy individuals and 320 patients with diabetes, at Sylhet Diabetes Hospital. Our system used 3 models for diabetes risk prediction: DNN, RF, and DT. Our approaches yielded highly competitive results compared with state-of-the-art approaches, demonstrating the effectiveness of our framework.</p>
        <p>We evaluated our framework based on the metrics of accuracy, precision, recall, <italic>F</italic><sub>1</sub>-score, and precision-recall curve. <xref ref-type="table" rid="table1">Table 1</xref> lists the performance of the 3 algorithms on the Pima data set. We also compared our approaches with existing approaches, including naive Bayes [<xref ref-type="bibr" rid="ref53">53</xref>], sequential minimal optimization [<xref ref-type="bibr" rid="ref54">54</xref>], Java 48 [<xref ref-type="bibr" rid="ref55">55</xref>], k-nearest neighbor (KNN) [<xref ref-type="bibr" rid="ref56">56</xref>], deep learning [<xref ref-type="bibr" rid="ref5">5</xref>], and linear regression [<xref ref-type="bibr" rid="ref57">57</xref>]. <xref rid="figure9" ref-type="fig">Figure 9</xref> shows the receiver operating characteristic curves of the 3 algorithms on the Pima data set.</p>
        <p>Similarly, <xref ref-type="table" rid="table2">Table 2</xref> depicts the performance of the 3 algorithms and 2 other approaches, KNN [<xref ref-type="bibr" rid="ref56">56</xref>]and linear regression [<xref ref-type="bibr" rid="ref56">56</xref>], on the early-stage data set. <xref rid="figure10" ref-type="fig">Figure 10</xref> shows the ROC curves of the 3 algorithms on this data set.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Comparison of model performance for the Pima data set.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="310"/>
            <col width="190"/>
            <col width="190"/>
            <col width="170"/>
            <col width="140"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td>Accuracy</td>
                <td>Precision</td>
                <td>Recall</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Random forest</td>
                <td>0.851</td>
                <td>0.847</td>
                <td>0.846</td>
                <td>0.845</td>
              </tr>
              <tr valign="top">
                <td>Decision tree</td>
                <td>0.785</td>
                <td>0.797</td>
                <td>0.796</td>
                <td>0.793</td>
              </tr>
              <tr valign="top">
                <td>Deep neural network</td>
                <td>0.825</td>
                <td>0.808</td>
                <td>0.816</td>
                <td>0.825</td>
              </tr>
              <tr valign="top">
                <td>Naive Bayes [<xref ref-type="bibr" rid="ref52">52</xref>]</td>
                <td>0.779</td>
                <td>0.776</td>
                <td>0.77</td>
                <td>0.767</td>
              </tr>
              <tr valign="top">
                <td>Sequential minimal optimization [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>N/A<sup>a</sup></td>
                <td>0.769</td>
                <td>0.776</td>
                <td>0.764</td>
              </tr>
              <tr valign="top">
                <td>Java 48 [<xref ref-type="bibr" rid="ref54">54</xref>]</td>
                <td>N/A</td>
                <td>0.804</td>
                <td>0.780</td>
                <td>0.792</td>
              </tr>
              <tr valign="top">
                <td>Deep learning [<xref ref-type="bibr" rid="ref5">5</xref>]</td>
                <td>0.981</td>
                <td>0.952</td>
                <td>0.985</td>
                <td>0.968</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure9" position="float">
          <label>Figure 9</label>
          <caption>
            <p>Receiver operating characteristic curves of different approaches on the Pima data set. AUC: area under receiver operating characteristic curve.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Comparison of model performance for the early-stage data set.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="260"/>
            <col width="170"/>
            <col width="190"/>
            <col width="190"/>
            <col width="190"/>
            <thead>
              <tr valign="top">
                <td>Model</td>
                <td>Accuracy</td>
                <td>Precision</td>
                <td>Recall</td>
                <td><italic>F</italic><sub>1</sub>-score</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Random forest</td>
                <td>0.99</td>
                <td>0.993</td>
                <td>0.985</td>
                <td>0.989</td>
              </tr>
              <tr valign="top">
                <td>Decision tree</td>
                <td>0.952</td>
                <td>0.965</td>
                <td>0.946</td>
                <td>0.947</td>
              </tr>
              <tr valign="top">
                <td>Deep neural network</td>
                <td>0.991</td>
                <td>0.986</td>
                <td>0.985</td>
                <td>0.989</td>
              </tr>
              <tr valign="top">
                <td>K-nearest neighbor [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>0.925</td>
                <td>N/A<sup>a</sup></td>
                <td>N/A</td>
                <td>0.934</td>
              </tr>
              <tr valign="top">
                <td>Linear regression [<xref ref-type="bibr" rid="ref53">53</xref>]</td>
                <td>0.925</td>
                <td>N/A</td>
                <td>N/A</td>
                <td>0.936</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>N/A: not applicable.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure10" position="float">
          <label>Figure 10</label>
          <caption>
            <p>Receiver Operating Characteristic curves of different approaches on the early-stage data set. AUC: area under receiver operating characteristic curve.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e50328_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Usability Evaluation</title>
        <p>We conducted a preliminary user study to evaluate the technical viability and effectiveness of the mobile app. We invited health care professionals specializing in internal medicine, general surgery, and endocrinology to participate, and 10 physicians completed the survey. As the sample size was relatively small, it could provide only a preliminary assessment of the framework’s viability and effectiveness.</p>
        <p>The survey consisted of 12 questions measured on a 5-point Likert scale. The participants evaluated the app’s performance in 4 patient cases. The results, shown in <xref ref-type="table" rid="table3">Table 3</xref>, indicate that all the participants agreed that the machine learning prediction results were reasonable and that the app provided sufficient and helpful information. They also agreed that the app adequately explained complex medical features. Most participants (9/10,90 %) found the prediction result explanation reasonable, and the global explanations aligned with their medical opinions. In addition, 60% (6/10) of the participants strongly agreed that the app helped them understand how the machine learning model made the predictions and could assist data scientists in reproducing the model.</p>
        <p>Lower ratings were observed for the questions related to the explanation of the machine learning model. This may have been due to the physicians’ limited background in data science or machine learning, resulting in difficulty in understanding the technical details. The lack of familiarity with terminologies such as <italic>feature</italic> and <italic>hyperparameters</italic> could have also contributed to the challenge. The physicians may have had limited exposure to formal training in machine learning concepts, making it harder for them to comprehend how the model works.</p>
        <p>To assess the overall satisfaction, the participants were asked to provide feedback on their experience using the mobile app. As shown in <xref ref-type="table" rid="table4">Table 4</xref>, most participants (8/10,80 %) expressed satisfaction, stating that the app helped them trust AI predictions better and (10/10, 100%) stated that it was easy to use. Most participants (8/10,80 %) agreed that they would use the system more frequently and felt confident about using it. (10/10, 100%) participants found the predictions made by the machine learning model consistent with their medical opinions. All the participants (10/10, 100%) disagreed that the app required technical support to be used.</p>
        <p>These findings provide valuable insights into user satisfaction and highlight areas for improvement in explaining machine learning models to health care professionals.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Survey responses from health care professionals.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="320"/>
            <col width="130"/>
            <col width="110"/>
            <col width="180"/>
            <col width="140"/>
            <col width="120"/>
            <thead>
              <tr valign="top">
                <td>Survey question</td>
                <td colspan="5">Rating, n (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Strongly agree</td>
                <td>Agree</td>
                <td>Neither agree nor disagree</td>
                <td>Disagree</td>
                <td>Strongly disagree</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>The predicted result is reasonable</td>
                <td>9 (90)</td>
                <td>1 (10)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The explanation of the prediction is clear and reasonable</td>
                <td>8 (80)</td>
                <td>1 (10)</td>
                <td>1 (10)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The explanation helps me comprehend how machine learning generates the prediction</td>
                <td>6 (60)</td>
                <td>0 (0)</td>
                <td>2 (20)</td>
                <td>2 (20)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The data set explanation assists me in understanding the data set used by the machine learning model for prediction</td>
                <td>9 (90)</td>
                <td>1 (10)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The machine learning model explanation aids data scientists in reproducing the model</td>
                <td>6 (60)</td>
                <td>0 (0)</td>
                <td>4 (40)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The order of feature importance is logical</td>
                <td>9 (90)</td>
                <td>0 (0)</td>
                <td>1 (10)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The explanation for complex medical features is sufficient</td>
                <td>8 (80)</td>
                <td>2 (20)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Overall feedback regarding the use of the mobile app.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="400"/>
            <col width="120"/>
            <col width="100"/>
            <col width="150"/>
            <col width="120"/>
            <col width="110"/>
            <thead>
              <tr valign="top">
                <td>Survey question</td>
                <td colspan="5">Rating, n (%)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Strongly agree</td>
                <td>Agree</td>
                <td>Neither agree nor disagree</td>
                <td>Disagree</td>
                <td>Strongly disagree</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>The application enhances my trust in AI<sup>a</sup> predictions</td>
                <td>7 (70)</td>
                <td>1 (10)</td>
                <td>2 (20)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The application is user-friendly and easy to navigate</td>
                <td>10 (100)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>I feel very confident about using the system</td>
                <td>7 (70)</td>
                <td>1 (10)</td>
                <td>0 (0)</td>
                <td>2 (20)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>The AI predictions align with my medical opinion</td>
                <td>8 (80)</td>
                <td>2 (20)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>I believe I would require technical assistance to use this system effectively</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>0 (0)</td>
                <td>2 (20)</td>
                <td>8 (80)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>AI: artificial intelligence.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Explanation Evaluation</title>
        <p>For the assessment of attribution explanation faithfulness qualities, we applied the monotonicity [<xref ref-type="bibr" rid="ref58">58</xref>] and implementation invariance [<xref ref-type="bibr" rid="ref59">59</xref>] quantitative metrics on the 2 data sets, and the results are shown in <xref ref-type="table" rid="table5">Table 5</xref>. We used the monotonicity explanation metric to measure the strength and direction of association between attributes and explanations. Monotonicity indicates how faithful a feature attribution explanation is. We applied Spearman correlation coefficient (ρ) between the feature’s absolute performance measure of interest and corresponding expectations. As can be seen in <xref ref-type="table" rid="table5">Table 5</xref>, the ρ value is positive and close to 1, which indicates a strong positive monotonic relationship between the LIME explanation features and true outcomes. In other words, the attributions are monotonic, and LIME assigns the correct importance.</p>
        <p>To assess explanation consistency, we used the implementation invariance quantitative metric by computing the Jaccard similarity between feature importance scores across random initializations of the predictive model. The Jaccard coefficient is a similarity and diversity measure among finite sets. It computes the similarity between 2 sets of data points by dividing the number of elements in an intersection by the number of elements in union. When the Jaccard index is between 0 and 1, there is some degree of overlap between the sets. The high Jaccard similarity coefficients that we achieved suggest that LIME consistently selects similar sets of features across data points, indicating consistency in the explanation.</p>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Quantitative metrics for measuring explanation faithfulness qualities.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="480"/>
            <col width="180"/>
            <col width="310"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Data set and model</td>
                <td>Monotonicity</td>
                <td>Implementation invariance</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Early-stage diabetes risk prediction data set</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Random forest</td>
                <td>0.97</td>
                <td>0.93</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Decision tree</td>
                <td>0.93</td>
                <td>0.91</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Deep neural network</td>
                <td>0.96</td>
                <td>0.93</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Pima Indians Diabetes Database</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Random forest</td>
                <td>0.86</td>
                <td>0.78</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Decision tree</td>
                <td>0.80</td>
                <td>0.76</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Deep neural network</td>
                <td>0.90</td>
                <td>.74</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Our research objectives focused on addressing the need for explaining machine learning predictions in the context of diabetes risk and developing a comprehensive framework to enhance their practical applicability in health care. By achieving these objectives, we aimed to enable health care providers to trust and effectively use the predictions generated by these models.</p>
        <p>To accomplish these objectives, we designed and developed the XAI4Diabetes mobile app, which leverages ontologies, a KG, and external knowledge sources. Our approach involves KG embedding and semantic similarity measurement to link concepts such as data sets and machine learning models to the entities in the KG. It uses both global and local result explanation mechanisms to deliver clear and understandable explanations of the diabetes prediction results. The app covers the entire prediction process, from data use to model generation, and presents diabetes prediction results in an understandable manner.</p>
        <p>The results of our research demonstrate the effectiveness of the XAI4Diabetes app in achieving our objectives. Through a user study and user satisfaction survey, we obtained valuable insights into the impact and usability of the app. The survey results revealed that the explanations provided by the app were instrumental in helping medical providers understand the prediction mechanism, predicted results, and features used in the training data. This comprehensive understanding of the predictions enhances trust in AI prediction in the field of diabetes risk assessment.</p>
        <p>Furthermore, the user satisfaction survey highlighted areas for improvement, particularly in explaining machine learning models. The participants expressed the need for more context, a simpler language, and additional training or resources to enhance their understanding of the technology. These results indicate that further enhancements to the explanation framework of the app are necessary to meet the specific needs of health care providers.</p>
        <p>In conclusion, the results of our study are strongly connected with our research objectives. The development of the XAI4Diabetes app successfully addressed the need for explaining machine learning predictions in diabetes risk assessment. By providing comprehensive and understandable explanations, the app supports health care providers in trusting and effectively using these predictions. However, the survey results also provide valuable feedback for future improvements, emphasizing the importance of refining the explanations of machine learning models to enhance their interpretability and usability in health care settings.</p>
      </sec>
      <sec>
        <title>Comparison With Existing Work</title>
        <p>Various machine learning techniques have been used in health care and disease prediction. Some studies used simple shallow models [<xref ref-type="bibr" rid="ref60">60</xref>], whereas others used deep learning models [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref61">61</xref>]. Hybrid techniques have been developed to improve the model’s outcomes [<xref ref-type="bibr" rid="ref10">10</xref>]. However, all the earlier studies focused on improving the model’s performance while neglecting the interpretability concerns. They lack the transparency required by physicians to trust AI systems [<xref ref-type="bibr" rid="ref62">62</xref>].</p>
        <p>Recently, there has been a surge in research focused on explainable AI [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref49">49</xref>] to provide explanations for machine learning results. For example, the study by Tiddi et al [<xref ref-type="bibr" rid="ref63">63</xref>] proposed a framework in which an inductive logic-based graph search is performed to generate explanations for data output by unsupervised learning algorithms (clusters, association rules, and time series). In addition, using structured knowledge for machine learning–based visual explanations was the subject of the image recognition tasks in the studies by Maillot and Thonnat [<xref ref-type="bibr" rid="ref21">21</xref>] and Icarte et al [<xref ref-type="bibr" rid="ref22">22</xref>]. Similarly, Daniels et al [<xref ref-type="bibr" rid="ref23">23</xref>] integrate a generic DNN architecture with WordNet for the scene classification task. Here, object types from WordNet are aligned with objects in the ADE20K data set, and the WordNet hierarchy is then used to train an object identification module, which is then input into a linear regression model capable of providing explanations automatically.</p>
        <p>A new paradigm of intelligent health care systems has begun to explore how to deliver understandable results along with transparent, reliable explanations. For example, in the study by Zafar and Khan [<xref ref-type="bibr" rid="ref24">24</xref>], the authors used agglomerative hierarchical clustering to group the training data and KNN to select the relevant cluster of the new instance that was being explained. Then, a linear model was trained over the selected cluster to generate explanations. The system was tested on 3 medical data sets. In the study by Caruana et al [<xref ref-type="bibr" rid="ref64">64</xref>], Microsoft presented 2 case studies based on real medical data, in which high-performance generalized additive models with pairwise interactions achieved state-of-the-art accuracy.</p>
        <p>Systems in the health care domain often integrate classification tasks with taxonomical knowledge found in medical diagnosis metathesaurus or medical ontologies [<xref ref-type="bibr" rid="ref65">65</xref>]. For example, the study by Vavpetič et al [<xref ref-type="bibr" rid="ref66">66</xref>] used the gene ontology and Kyoto Encyclopedia of Genes and Genomes ontology for subgroup discovery, with the sense that the constructed rules describing subgroups are good explanations for their formation. Moreover, the study by Che et al [<xref ref-type="bibr" rid="ref67">67</xref>] proposed a health diagnosis prediction system that uses medical ontologies to learn (embedded) representations for medical nodes in the KG and their parent codes. These are then used to learn the input representations of patient data, which are then loaded into a neural network architecture. The system uses an attention mechanism that learns weights to improve the prediction accuracy and allow the interpretation of the importance of various pieces of information. In the study by Phan et al [<xref ref-type="bibr" rid="ref68">68</xref>], a domain ontology was integrated into a neuro-symbolic architecture with a restricted Boltzmann machine model to predict and explain human behaviors for health care intervention systems in health social networks.</p>
        <p>Despite the advancements highlighted in the aforementioned studies, they primarily focus on explaining the predictive outcomes. The inner workings of the machine learning process, such as the training methodologies, used data sets, and selected data features, remain obscured. In addition, the explanations predominantly cater to data scientists and technical experts, requiring specialized knowledge for interpretation. Notably, these studies lack user-centric evaluations, neglecting feedback from potential end users.</p>
        <p>By contrast, XAI4Diabetes provides users with a thorough explanation from multiple aspects, thus improving their understanding of the predictions. The explanation is provided by an easy-to-use interface using natural language and straightforward figures.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>There are limitations to our current framework. In addition, there are several avenues for future work and improvements, addressing which can enhance the usability and effectiveness of the system.</p>
        <p>One of the major limitations is the small sample size of the user study conducted during the evaluation of the XAI4Diabetes app. Although the initial user study provided valuable insights, a larger and more diverse participant pool is necessary to obtain a more comprehensive understanding of the system’s performance and user satisfaction. In the future, we plan to conduct a long-term, extensive user study with a larger number of participants, including health care professionals and patients, to gather more robust feedback and validate the effectiveness of the framework.</p>
        <p>Another limitation is that our current prototype is only a proof of concept and not a mature product. Although it demonstrates the feasibility of the proposed framework, there is room for improvement in terms of user interface design and functionality. To address this, we will perform a comprehensive requirement analysis by surveying medical professionals and patients as the final users. This analysis will help us better understand their needs and preferences, leading to the development of a more refined and user-friendly interface.</p>
        <p>Furthermore, the current system primarily targets health care providers, and additional work is needed to ensure that it can effectively serve patients as well. In the future, we will focus on enhancing the patient-centric features of the app to provide personalized explanations and support for individuals managing their diabetes risk. This includes tailoring the system’s functionalities to better meet the needs of patients. We plan to incorporate the use of resources such as MedlinePlus [<xref ref-type="bibr" rid="ref69">69</xref>] to make knowledge more accessible to the general public. In addition, we plan to integrate patient feedback mechanisms.</p>
        <p>In terms of explanation representation and presentation, there is ongoing research for exploring better ways of conveying explanations. We will investigate techniques such as animation and graph-based explanations to enhance the visual and interactive aspects of the app. These approaches have the potential to further improve the interpretability and understandability of the machine learning predictions for both health care providers and patients.</p>
        <p>In addition, the current version of the app lacks a user feedback mechanism. To foster continuous improvement, we recognize the importance of incorporating health care stakeholders’ feedback. Therefore, in future iterations, we will integrate a feedback feature that will allow users to provide their insights, suggestions, and concerns. This feedback will be invaluable for enhancing the interoperability, interpretability, and overall performance of the system.</p>
        <p>In summary, although our framework has demonstrated promising results, it is important to acknowledge its limitations and outline future directions for improvement. By addressing these limitations and conducting further research, we aim to develop a more mature and user-centric system that effectively explains machine learning predictions, empowers health care providers and patients, and ultimately enhances trust in AI-assisted diabetes risk assessment.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In conclusion, our study developed the XAI4Diabetes framework, addressing the need for explaining machine learning predictions in diabetes risk assessment. Our framework provides transparent and interpretable explanations for the diabetes prediction process and prediction results, enhancing the understanding of health care providers and stakeholders. This improves trust in AI predictions and supports informed decision-making in medical research.</p>
        <p>By incorporating ontologies and a KG, we created a user-friendly tool that bridges the gap between complex machine learning models and their practical applicability in health care. The framework’s multiaspect explanations link input features, machine learning algorithms, and external knowledge sources.</p>
        <p>Future works include conducting extensive user studies, refining the user interface based on feedback from health care professionals and patients, and exploring advanced presentation techniques such as animation and graph explanations. Our research has broader implications for transparent and explainable AI, enabling the adoption of machine learning models in various industries.</p>
        <p>Overall, our study contributes to the understanding and trustworthiness of machine learning predictions in health care, laying the foundation for reliable and transparent applications in medical decision-making processes.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AI</term>
          <def>
            <p>artificial intelligence</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">DNN</term>
          <def>
            <p>deep neural network</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">DT</term>
          <def>
            <p>decision tree</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">KG</term>
          <def>
            <p>knowledge graph</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">KNN</term>
          <def>
            <p>k-nearest neighbor</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">LIME</term>
          <def>
            <p>local interpretable model-agnostic explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ROC</term>
          <def>
            <p>receiver operating characteristic</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">RF</term>
          <def>
            <p>random forest</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">SHAP</term>
          <def>
            <p>Shapley additive explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">S-LIME</term>
          <def>
            <p>Stabilized-LIME for Model Explanation</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was supported by the National Science Foundation (NSF; awards 1722913 and 2218046).</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data sets generated and analyzed during this study are not publicly available. However, the data are available from the corresponding author upon reasonable request.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Type 2 diabetes</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <access-date>2023-11-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/diabetes/basics/type2.html">https://www.cdc.gov/diabetes/basics/type2.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zeki</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Malakooti</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Ataeipoor</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tabibi</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>An expert system for diabetes diagnosis</article-title>
          <source>Am Acad Scholar Res J</source>
          <year>2012</year>
          <month>09</month>
          <volume>4</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>13</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Keshavjee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Guergachi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Predictive models for diabetes mellitus using machine learning techniques</article-title>
          <source>BMC Endocr Disord</source>
          <year>2019</year>
          <month>10</month>
          <day>15</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>101</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcendocrdisord.biomedcentral.com/articles/10.1186/s12902-019-0436-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12902-019-0436-6</pub-id>
          <pub-id pub-id-type="medline">31615566</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12902-019-0436-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC6794897</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Myrzashova</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Diabetes prediction model based on an enhanced deep neural network</article-title>
          <source>J Wireless Com Network</source>
          <year>2020</year>
          <month>07</month>
          <day>17</day>
          <volume>2020</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1186/s13638-020-01765-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ahuja</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Deep learning approach for diabetes prediction using PIMA Indian dataset</article-title>
          <source>J Diabetes Metab Disord</source>
          <year>2020</year>
          <month>04</month>
          <day>14</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>391</fpage>
          <lpage>403</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32550190"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40200-020-00520-5</pub-id>
          <pub-id pub-id-type="medline">32550190</pub-id>
          <pub-id pub-id-type="pii">520</pub-id>
          <pub-id pub-id-type="pmcid">PMC7270283</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>LaFreniere</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zulkernine</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Barber</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Using machine learning to predict hypertension from a clinical dataset</article-title>
          <source>Proceedings of the IEEE Symposium Series on Computational Intelligence (SSCI)</source>
          <year>2016</year>
          <conf-name>IEEE Symposium Series on Computational Intelligence (SSCI)</conf-name>
          <conf-date>December 6-9, 2016</conf-date>
          <conf-loc>Athens, Greece</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ssci.2016.7849886</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Attaluri</surname>
              <given-names>PK</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Applying neural networks to classify influenza virus antigenic types and hosts</article-title>
          <source>Proceedings of the IEEE Symposium on Computational Intelligence in Bioinformatics and Computational Biology</source>
          <year>2010</year>
          <conf-name>IEEE Symposium on Computational Intelligence in Bioinformatics and Computational Biology</conf-name>
          <conf-date>May 2-5, 2010</conf-date>
          <conf-loc>Montreal, QC</conf-loc>
          <pub-id pub-id-type="doi">10.1109/cibcb.2010.5510726</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Barnes</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>HCNN: heterogeneous convolutional neural networks for comorbid risk prediction with electronic health records</article-title>
          <source>Proceedings of the IEEE/ACM International Conference on Connected Health: Applications, Systems and Engineering Technologies (CHASE)</source>
          <year>2017</year>
          <conf-name>IEEE/ACM International Conference on Connected Health: Applications, Systems and Engineering Technologies (CHASE)</conf-name>
          <conf-date>July 17-19, 2017</conf-date>
          <conf-loc>Philadelphia, PA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/chase.2017.80</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ayon</surname>
              <given-names>SI</given-names>
            </name>
            <name name-style="western">
              <surname>Milon Islam</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Diabetes prediction: a deep learning approach</article-title>
          <source>Int J Inf Eng Electron Bus</source>
          <year>2019</year>
          <month>03</month>
          <day>08</day>
          <volume>11</volume>
          <issue>2</issue>
          <fpage>21</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.5815/ijieeb.2019.02.03</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yahyaoui</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jamil</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rasheed</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Yesiltepe</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A decision support system for diabetes prediction using machine learning and deep learning techniques</article-title>
          <source>Proceedings of the 1st International Informatics and Software Engineering Conference (UBMYK)</source>
          <year>2019</year>
          <conf-name>1st International Informatics and Software Engineering Conference (UBMYK)</conf-name>
          <conf-date>November 6-7, 2019</conf-date>
          <conf-loc>Ankara, Turkey</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ubmyk48245.2019.8965556</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ramesh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Caytiles</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Iyenga</surname>
              <given-names>NC</given-names>
            </name>
          </person-group>
          <article-title>A deep learning approach to identify diabetes</article-title>
          <source>Adv Sci Technol Letters</source>
          <year>2017</year>
          <volume>145</volume>
          <fpage>44</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.14257/astl.2017.145.09</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pintelas</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Liaskos</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Livieris</surname>
              <given-names>IE</given-names>
            </name>
            <name name-style="western">
              <surname>Kotsiantis</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pintelas</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A novel explainable image classification framework: case study on skin cancer and plant disease prediction</article-title>
          <source>Neural Comput Applic</source>
          <year>2021</year>
          <month>06</month>
          <day>04</day>
          <volume>33</volume>
          <issue>22</issue>
          <fpage>15171</fpage>
          <lpage>89</lpage>
          <pub-id pub-id-type="doi">10.1007/s00521-021-06141-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tasin</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Nabil</surname>
              <given-names>TU</given-names>
            </name>
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Diabetes prediction using machine learning and explainable AI techniques</article-title>
          <source>Healthc Technol Lett</source>
          <year>2023</year>
          <month>12</month>
          <day>14</day>
          <volume>10</volume>
          <issue>1-2</issue>
          <fpage>1</fpage>
          <lpage>10</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37077883"/>
          </comment>
          <pub-id pub-id-type="doi">10.1049/htl2.12039</pub-id>
          <pub-id pub-id-type="medline">37077883</pub-id>
          <pub-id pub-id-type="pii">HTL212039</pub-id>
          <pub-id pub-id-type="pmcid">PMC10107388</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davagdorj</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Bae</surname>
              <given-names>J-W</given-names>
            </name>
            <name name-style="western">
              <surname>Pham</surname>
              <given-names>V-H</given-names>
            </name>
            <name name-style="western">
              <surname>Theera-Umpon</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>Explainable artificial intelligence based framework for non-communicable diseases prediction</article-title>
          <source>IEEE Access</source>
          <year>2021</year>
          <month>09</month>
          <day>03</day>
          <volume>9</volume>
          <fpage>123672</fpage>
          <lpage>88</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2021.3110336</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdulsalam</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Meshoul</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shaiba</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Explainable heart disease prediction using ensemble-quantum machine learning approach</article-title>
          <source>Intell Autom Soft Comput</source>
          <year>2022</year>
          <month>9</month>
          <day>29</day>
          <volume>36</volume>
          <issue>1</issue>
          <fpage>761</fpage>
          <lpage>79</lpage>
          <pub-id pub-id-type="doi">10.32604/iasc.2023.032262</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>XR</given-names>
            </name>
            <name name-style="western">
              <surname>Chiariglione</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Qin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nuytemans</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Scharre</surname>
              <given-names>DW</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y-J</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>ER</given-names>
            </name>
          </person-group>
          <article-title>Explainable machine learning aggregates polygenic risk scores and electronic health records for Alzheimer's disease prediction</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <month>01</month>
          <day>09</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>450</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-27551-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-27551-1</pub-id>
          <pub-id pub-id-type="medline">36624143</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-27551-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC9829871</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Joseph</surname>
              <given-names>LP</given-names>
            </name>
            <name name-style="western">
              <surname>Joseph</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Prasad</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Explainable diabetes classification using hybrid Bayesian-optimized TabNet architecture</article-title>
          <source>Comput Biol Med</source>
          <year>2022</year>
          <month>12</month>
          <volume>151</volume>
          <issue>Pt A</issue>
          <fpage>106178</fpage>
          <pub-id pub-id-type="doi">10.1016/j.compbiomed.2022.106178</pub-id>
          <pub-id pub-id-type="medline">36306578</pub-id>
          <pub-id pub-id-type="pii">S0010-4825(22)00886-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ibrahim</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mesinovic</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>K-W</given-names>
            </name>
            <name name-style="western">
              <surname>Eid</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Explainable prediction of acute myocardial infarction using machine learning and shapley values</article-title>
          <source>IEEE Access</source>
          <year>2020</year>
          <month>11</month>
          <day>24</day>
          <volume>8</volume>
          <fpage>210410</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2020.3040166</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Du</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rafferty</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>McAuliffe</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mooney</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>An explainable machine learning-based clinical decision support system for prediction of gestational diabetes mellitus</article-title>
          <source>Sci Rep</source>
          <year>2022</year>
          <month>01</month>
          <day>21</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>1170</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-022-05112-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-022-05112-2</pub-id>
          <pub-id pub-id-type="medline">35064173</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-022-05112-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8782851</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nagaraj</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Muneeswaran</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Dharanidharan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Balananthanan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Arunkumar</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A prediction and recommendation system for diabetes mellitus using XAI-based lime explainer</article-title>
          <source>Proceedings of the International Conference on Sustainable Computing and Data Communication Systems (ICSCDS)</source>
          <year>2022</year>
          <conf-name>International Conference on Sustainable Computing and Data Communication Systems (ICSCDS)</conf-name>
          <conf-date>April 7-9, 2022</conf-date>
          <conf-loc>Erode, India</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icscds53736.2022.9760847</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Maillot</surname>
              <given-names>NE</given-names>
            </name>
            <name name-style="western">
              <surname>Thonnat</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Ontology based complex object recognition</article-title>
          <source>Image Vis Comput</source>
          <year>2008</year>
          <month>1</month>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>102</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1016/j.imavis.2005.07.027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Icarte</surname>
              <given-names>RT</given-names>
            </name>
            <name name-style="western">
              <surname>Baier</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Ruz</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Soto</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>How a general-purpose commonsense ontology can improve performance of learning-based image retrieval</article-title>
          <source>Proceedings of the 26th International Joint Conference on Artificial Intelligence</source>
          <year>2017</year>
          <conf-name>IJCAI'17: Proceedings of the 26th International Joint Conference on Artificial Intelligence</conf-name>
          <conf-date>August 19-25, 2017</conf-date>
          <conf-loc>Melbourne, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.24963/ijcai.2017/178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Daniels</surname>
              <given-names>ZA</given-names>
            </name>
            <name name-style="western">
              <surname>Frank</surname>
              <given-names>LD</given-names>
            </name>
            <name name-style="western">
              <surname>Menart</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Raymer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hitzler</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>A framework for explainable deep neural models using external knowledge graphs</article-title>
          <source>Proceedings of the SPIE</source>
          <year>2020</year>
          <conf-name>Proceedings of the SPIE</conf-name>
          <conf-date>December 14-18, 2020</conf-date>
          <conf-loc>Online</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ui.adsabs.harvard.edu/abs/2020SPIE11413E..1CD/abstract"/>
          </comment>
          <pub-id pub-id-type="doi">10.1117/12.2558083</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zafar</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>NM</given-names>
            </name>
          </person-group>
          <article-title>DLIME: a deterministic local interpretable model-agnostic explanations approach for computer-aided diagnosis systems</article-title>
          <source>Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &#38; Data Mining</source>
          <year>2019</year>
          <conf-name>KDD '19</conf-name>
          <conf-date>August 4-8, 2019</conf-date>
          <conf-loc>Anchorage, AK</conf-loc>
          <pub-id pub-id-type="doi">10.32920/22734359.v1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Srinivasu</surname>
              <given-names>PN</given-names>
            </name>
            <name name-style="western">
              <surname>Sandhya</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Jhaveri</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Raut</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>From Blackbox to explainable AI in healthcare: existing tools and case studies</article-title>
          <source>Mob Inf Syst</source>
          <year>2022</year>
          <month>6</month>
          <day>13</day>
          <volume>2022</volume>
          <fpage>1</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1155/2022/8167821</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gerlings</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jensen</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Shollo</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>YW</given-names>
            </name>
            <name name-style="western">
              <surname>Vaidya</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mahorkar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>LC</given-names>
            </name>
          </person-group>
          <article-title>Explainable AI, but explainable to whom? An exploratory case study of xAI in healthcare</article-title>
          <source>Handbook of Artificial Intelligence in Healthcare</source>
          <year>2021</year>
          <month>11</month>
          <day>27</day>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dave</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Naik</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Singhal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Patel</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Explainable AI meets healthcare: a study on heart disease dataset</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online November 6, 2020</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2011.03195v1"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>QV</given-names>
            </name>
            <name name-style="western">
              <surname>Varshney</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>Human-centered explainable AI (XAI): from algorithms to user experiences</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online October 20, 2021</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2110.10790v5"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chromik</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Making SHAP rap: bridging local and global insights through interaction and narratives</article-title>
          <source>Proceedings of the 18th IFIP TC 13 International Conference</source>
          <year>2021</year>
          <conf-name>18th IFIP TC 13 International Conference</conf-name>
          <conf-date>August 30-September 3, 2021</conf-date>
          <conf-loc>Bari, Italy</conf-loc>
          <pub-id pub-id-type="doi">10.1007/978-3-030-85616-8_37</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dieber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kirrane</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Why model why? Assessing the strengths and limitations of LIME</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online November 30, 2020</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2012.00093v1"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>El-Sappagh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>DDO: a diabetes mellitus diagnosis ontology</article-title>
          <source>Appl Inform</source>
          <year>2016</year>
          <month>8</month>
          <day>25</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>28</lpage>
          <pub-id pub-id-type="doi">10.1186/s40535-016-0021-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>UMLS glossary</article-title>
          <source>National Institutes of Health National Library of Medicine</source>
          <access-date>2022-11-17</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/research/umls/new_users/glossary.html">https://www.nlm.nih.gov/research/umls/new_users/glossary.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <article-title>SNOMED CT</article-title>
          <source>National Institutes of Health National Library of Medicine</source>
          <access-date>2022-01-23</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nlm.nih.gov/healthit/snomedct/index.html">https://www.nlm.nih.gov/healthit/snomedct/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vrandečić</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Krötzsch</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Wikidata: a free collaborative knowledgebase</article-title>
          <source>Commun ACM</source>
          <year>2014</year>
          <month>10</month>
          <volume>57</volume>
          <issue>10</issue>
          <fpage>78</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1145/2629489</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Braga</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Regateiro</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Dias</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Machine Learning Ontology (MLOnto) repository</article-title>
          <source>OSF Home</source>
          <year>2020</year>
          <access-date>2023-10-21</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://osf.io/chu5q/">https://osf.io/chu5q/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Musen</surname>
              <given-names>Mark A</given-names>
            </name>
            <collab>Protégé Team</collab>
          </person-group>
          <article-title>The Protégé Project: A Look Back and a Look Forward</article-title>
          <source>AI Matters</source>
          <year>2015</year>
          <month>06</month>
          <volume>1</volume>
          <issue>4</issue>
          <fpage>4</fpage>
          <lpage>12</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27239556"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2757001.2757003</pub-id>
          <pub-id pub-id-type="medline">27239556</pub-id>
          <pub-id pub-id-type="pmcid">PMC4883684</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hendawi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A smart mobile app to simplify medical documents and improve health literacy: system design and feasibility validation</article-title>
          <source>JMIR Form Res</source>
          <year>2022</year>
          <month>04</month>
          <day>01</day>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>e35069</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2022/4/e35069/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/35069</pub-id>
          <pub-id pub-id-type="medline">35363142</pub-id>
          <pub-id pub-id-type="pii">v6i4e35069</pub-id>
          <pub-id pub-id-type="pmcid">PMC9015750</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>BioWordVec, improving biomedical word embeddings with subword information and MeSH</article-title>
          <source>Sci Data</source>
          <year>2019</year>
          <month>05</month>
          <day>10</day>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>52</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41597-019-0055-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41597-019-0055-0</pub-id>
          <pub-id pub-id-type="medline">31076572</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41597-019-0055-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6510737</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Islam</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Ferdousi</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rahman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bushra</surname>
              <given-names>HY</given-names>
            </name>
          </person-group>
          <article-title>Likelihood prediction of diabetes at early stage using data mining techniques</article-title>
          <source>Proceedings of the First International Symposium on Computer Vision and Machine Intelligence in Medical Image Analysis</source>
          <year>2019</year>
          <conf-name>ISCMM 2019</conf-name>
          <conf-date>February 26-27, 2019</conf-date>
          <conf-loc>Sikkim, India</conf-loc>
          <pub-id pub-id-type="doi">10.1007/978-981-13-8798-2_12</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
          <article-title>Pima Indians diabetes</article-title>
          <source>data.world</source>
          <access-date>2022-05-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://data.world/uci/pima-indians-diabetes">https://data.world/uci/pima-indians-diabetes</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="web">
          <article-title>Early stage diabetes risk prediction dataset</article-title>
          <source>UCI Irvine Machine Learning Repository</source>
          <year>2020</year>
          <month>11</month>
          <day>7</day>
          <access-date>2023-02-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://archive.ics.uci.edu/ml/datasets/Early+stage+diabetes+risk+prediction+dataset">https://archive.ics.uci.edu/ml/datasets/Early+stage+diabetes+risk+prediction+dataset</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chawla</surname>
              <given-names>NV</given-names>
            </name>
            <name name-style="western">
              <surname>Bowyer</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>Hall</surname>
              <given-names>LO</given-names>
            </name>
            <name name-style="western">
              <surname>Kegelmeyer</surname>
              <given-names>WP</given-names>
            </name>
          </person-group>
          <article-title>SMOTE: synthetic minority over-sampling technique</article-title>
          <source>J Artif Intell Res</source>
          <year>2002</year>
          <month>06</month>
          <day>01</day>
          <volume>16</volume>
          <fpage>321</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.1613/jair.953</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sasada</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Baba</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hatano</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>A resampling method for imbalanced datasets considering noise and overlap</article-title>
          <source>Procedia Comput Sci</source>
          <year>2020</year>
          <volume>176</volume>
          <fpage>420</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/j.procs.2020.08.043</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="web">
          <article-title>SPARQL query language for RDF</article-title>
          <source>The World Wide Web Consortium</source>
          <year>2018</year>
          <month>1</month>
          <day>15</day>
          <access-date>2023-09-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.w3.org/TR/rdf-sparql-query/">https://www.w3.org/TR/rdf-sparql -query/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S-I</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <source>Proceedings of the 31st International Conference on Neural Information Processing Systems</source>
          <year>2017</year>
          <conf-name>NIPS'17</conf-name>
          <conf-date>December 4-9, 2017</conf-date>
          <conf-loc>Long Beach, CA</conf-loc>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/proceedings/10.5555/3295222"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Winter</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Chapter 53 The Shapley value</article-title>
          <source>Handbook of Game Theory with Economic Applications Volume 2</source>
          <year>2002</year>
          <publisher-loc>Amsterdam, Netherlands</publisher-loc>
          <publisher-name>Elsevier</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Anchors: high-precision model-agnostic explanations</article-title>
          <source>Proc AAAI Conf Artif Intell</source>
          <year>2018</year>
          <volume>32</volume>
          <issue>1</issue>
          <pub-id pub-id-type="doi">10.1609/aaai.v32i1.11491</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hooker</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>S-LIME: stabilized-LIME for model explanation</article-title>
          <source>Proceedings of the 27th ACM SIGKDD Conference on Knowledge Discovery &#38; Data Mining</source>
          <year>2021</year>
          <conf-name>KDD '21</conf-name>
          <conf-date>August 14-18, 2021</conf-date>
          <conf-loc>Virtual Event, Singapore</conf-loc>
          <pub-id pub-id-type="doi">10.1145/3447548.3467274</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kibria</surname>
              <given-names>HB</given-names>
            </name>
            <name name-style="western">
              <surname>Nahiduzzaman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Goni</surname>
              <given-names>MO</given-names>
            </name>
            <name name-style="western">
              <surname>Ahsan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Haider</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>An ensemble approach for the prediction of diabetes mellitus using a soft voting classifier with an explainable AI</article-title>
          <source>Sensors (Basel)</source>
          <year>2022</year>
          <month>09</month>
          <day>25</day>
          <volume>22</volume>
          <issue>19</issue>
          <fpage>7268</fpage>
          <pub-id pub-id-type="doi">10.3390/s22197268</pub-id>
          <pub-id pub-id-type="medline">36236367</pub-id>
          <pub-id pub-id-type="pii">s22197268</pub-id>
          <pub-id pub-id-type="pmcid">PMC9571784</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="web">
          <article-title>Does diabetes cause hair loss?</article-title>
          <source>Healthline</source>
          <access-date>2023-09-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.healthline.com/health/does-diabetes-cause-hair-loss">https://www.healthline.com/health/does-diabetes-cause-hair-loss</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="web">
          <article-title>Alopecia areata</article-title>
          <source>Wikidata</source>
          <access-date>2023-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.wikidata.org/wiki/Q2697787#/media/File:Allopecia_areata.JPG">https://www.wikidata.org/wiki/Q2697787#/media/File:Allopecia_areata.JPG</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <article-title>NCI Thesaurus</article-title>
          <source>National Cancer Institute</source>
          <access-date>2023-11-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ncit.nci.nih.gov/ncitbrowser/ConceptReport.jsp?dictionary=NCI_Thesaurus&#38;code=C50575">https://ncit.nci.nih.gov/ncitbrowser/ConceptReport.jsp?dictionary=NCI_The saurus&#38;code=C50575</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choubey</surname>
              <given-names>DK</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Classification of Pima Indian diabetes dataset using naive bayes with genetic algorithm as an attribute selection</article-title>
          <source>Proceedings of the International Conference on Communication and Computing Systems (ICCCS-2016)</source>
          <year>2016</year>
          <conf-name>The International Conference on Communication and Computing Systems (ICCCS-2016)</conf-name>
          <conf-date>September 9-11, 2016</conf-date>
          <conf-loc>Gurgaon, India</conf-loc>
          <pub-id pub-id-type="doi">10.1201/9781315364094-82</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Howsalya Devi</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nagarajan</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>A novel hybrid approach for diagnosing diabetes mellitus using farthest first and support vector machine algorithms</article-title>
          <source>Obesity Med</source>
          <year>2020</year>
          <month>03</month>
          <volume>17</volume>
          <fpage>100152</fpage>
          <pub-id pub-id-type="doi">10.1016/j.obmed.2019.100152</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Posania</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Vigneshwari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jamuna Rani</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Machine learning based diabetes prediction using decision tree J48</article-title>
          <source>Proceedings of the 3rd International Conference on Intelligent Sustainable Systems (ICISS)</source>
          <year>2020</year>
          <conf-name>3rd International Conference on Intelligent Sustainable Systems (ICISS)</conf-name>
          <conf-date>December 03-05, 2020</conf-date>
          <conf-loc>Thoothukudi, India</conf-loc>
          <pub-id pub-id-type="doi">10.1109/iciss49785.2020.9316001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sadhu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Jadli</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Early-stage diabetes risk prediction: a comparative analysis of classification algorithms</article-title>
          <source>Int Adv Res J Sci Eng Technol</source>
          <year>2021</year>
          <month>2</month>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>193</fpage>
          <lpage>201</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://iarjset.com/wp-content/uploads/2021/03/IARJSET.2021.8228.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/incet51464.2021.9456263</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>QA</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Pima Indians diabetes mellitus classification based on machine learning (ML) algorithms</article-title>
          <source>Neural Comput Appl</source>
          <year>2022</year>
          <month>03</month>
          <day>24</day>
          <volume>35</volume>
          <issue>22</issue>
          <fpage>1</fpage>
          <lpage>17</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35345556"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s00521-022-07049-z</pub-id>
          <pub-id pub-id-type="medline">35345556</pub-id>
          <pub-id pub-id-type="pii">7049</pub-id>
          <pub-id pub-id-type="pmcid">PMC8943493</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>A-P</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>On quantitative aspects of model interpretability</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online July 15, 2020</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2007.07584"/>
          </comment>
          <pub-id pub-id-type="doi">10.1017/9781316716854.008</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tseng</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Shrikumar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kundaje</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Fourier-transform-based attribution priors improve the interpretability and stability of deep learning models for genomics</article-title>
          <source>BioRxiv</source>
          <comment>Preprint posted online June 12, 2020</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.biorxiv.org/content/10.1101/2020.06.11.147272v1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2020.06.11.147272</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sisodia</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sisodia</surname>
              <given-names>DS</given-names>
            </name>
          </person-group>
          <article-title>Prediction of diabetes using classification algorithms</article-title>
          <source>Procedia Comput Sci</source>
          <year>2018</year>
          <volume>132</volume>
          <fpage>1578</fpage>
          <lpage>85</lpage>
          <pub-id pub-id-type="doi">10.1016/j.procs.2018.05.122</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goutham</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ravi</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Soman</surname>
              <given-names>KP</given-names>
            </name>
          </person-group>
          <article-title>Diabetes detection using deep learning algorithms</article-title>
          <source>ICT Express</source>
          <year>2018</year>
          <month>12</month>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>243</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1016/j.icte.2018.10.005</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adadi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Berrada</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Peeking inside the black-box: a survey on explainable artificial intelligence (XAI)</article-title>
          <source>IEEE Access</source>
          <year>2018</year>
          <volume>6</volume>
          <fpage>52138</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2018.2870052</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tiddi</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>d’Aquin</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Motta</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Dedalo: looking for clusters explanations in a labyrinth of linked data</article-title>
          <source>Proceedings of the The Semantic Web: Trends and Challenges</source>
          <year>2014</year>
          <conf-name>The Semantic Web: Trends and Challenges</conf-name>
          <conf-date>May 25-29, 2014</conf-date>
          <conf-loc>Crete, Greece</conf-loc>
          <pub-id pub-id-type="doi">10.1007/978-3-319-07443-6_23</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caruana</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lou</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gehrke</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koch</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Sturm</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Elhadad</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Intelligible models for HealthCare: predicting pneumonia risk and hospital 30-day readmission</article-title>
          <source>Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2015</year>
          <conf-name>KDD '15</conf-name>
          <conf-date>August 10-13, 2015</conf-date>
          <conf-loc>Sydney, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2783258.2788613</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fisher</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rudin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Dominici</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>All models are wrong, but  are useful: learning a variable's importance by studying an entire class of prediction models simultaneously</article-title>
          <source>J Mach Learn Res</source>
          <year>2019</year>
          <volume>20</volume>
          <fpage>177</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34335110"/>
          </comment>
          <pub-id pub-id-type="medline">34335110</pub-id>
          <pub-id pub-id-type="pii">177</pub-id>
          <pub-id pub-id-type="pmcid">PMC8323609</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vavpetič</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Podpečan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Lavrač</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Semantic subgroup explanations</article-title>
          <source>J Intell Inf Syst</source>
          <year>2013</year>
          <month>12</month>
          <day>6</day>
          <volume>42</volume>
          <issue>2</issue>
          <fpage>233</fpage>
          <lpage>54</lpage>
          <pub-id pub-id-type="doi">10.1007/s10844-013-0292-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Che</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kale</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Bahadori</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Deep computational phenotyping</article-title>
          <source>Proceedings of the 21th ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2015</year>
          <conf-name>KDD '15</conf-name>
          <conf-date>August 10-13, 2015</conf-date>
          <conf-loc>Sydney, Australia</conf-loc>
          <pub-id pub-id-type="doi">10.1145/2783258.2783365</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Phan</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Dou</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kil</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Piniewski</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Ontology-based deep learning for human behavior prediction with explanations in health social networks</article-title>
          <source>Inf Sci (N Y)</source>
          <year>2017</year>
          <month>04</month>
          <volume>384</volume>
          <fpage>298</fpage>
          <lpage>313</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28265122"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ins.2016.08.038</pub-id>
          <pub-id pub-id-type="medline">28265122</pub-id>
          <pub-id pub-id-type="pmcid">PMC5336311</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="web">
          <article-title>Welcome to MedlinePlus</article-title>
          <source>MedlinePlus</source>
          <access-date>2023-09-16</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medlineplus.gov/">https://medlineplus.gov/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
