<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v6i7e36055</article-id>
      <article-id pub-id-type="pmid">35857363</article-id>
      <article-id pub-id-type="doi">10.2196/36055</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>An Urban Population Health Observatory for Disease Causal Pathway Analysis and Decision Support: Underlying Explainable Artificial Intelligence Model</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mukherjee</surname>
            <given-names>Sumoni</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Ye</surname>
            <given-names>Jiancheng</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Surian</surname>
            <given-names>Didi</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Brakefield</surname>
            <given-names>Whitney S</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0054-8944</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Ammar</surname>
            <given-names>Nariman</given-names>
          </name>
          <degrees>MSc, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5363-2541</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Shaban-Nejad</surname>
            <given-names>Arash</given-names>
          </name>
          <degrees>MPH, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Center for Biomedical Informatics</institution>
            <institution>Department of Pediatrics, College of Medicine</institution>
            <institution>University of Tennessee Health Science Center</institution>
            <addr-line>50 N Dunlap Street, R492</addr-line>
            <addr-line>Memphis, TN, 38103</addr-line>
            <country>United States</country>
            <phone>1 901 287 5863</phone>
            <email>ashabann@uthsc.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2047-4759</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Center for Biomedical Informatics</institution>
        <institution>Department of Pediatrics, College of Medicine</institution>
        <institution>University of Tennessee Health Science Center</institution>
        <addr-line>Memphis, TN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Bredesen Center for Data Science</institution>
        <institution>University of Tennessee</institution>
        <addr-line>Knoxville, TN</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Ochsner Xavier Institute for Health Equity and Research</institution>
        <institution>Ochsner Clinic Foundation</institution>
        <addr-line>New Orleans, LA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Arash Shaban-Nejad <email>ashabann@uthsc.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>7</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>20</day>
        <month>7</month>
        <year>2022</year>
      </pub-date>
      <volume>6</volume>
      <issue>7</issue>
      <elocation-id>e36055</elocation-id>
      <history>
        <date date-type="received">
          <day>29</day>
          <month>12</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>13</day>
          <month>4</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>3</day>
          <month>5</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>7</day>
          <month>6</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Whitney S Brakefield, Nariman Ammar, Arash Shaban-Nejad. Originally published in JMIR Formative Research (https://formative.jmir.org), 20.07.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2022/7/e36055" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Many researchers have aimed to develop chronic health surveillance systems to assist in public health decision-making. Several digital health solutions created lack the ability to explain their decisions and actions to human users.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study sought to (1) expand our existing Urban Population Health Observatory (UPHO) system by incorporating a semantics layer; (2) cohesively employ machine learning and semantic/logical inference to provide measurable evidence and detect pathways leading to undesirable health outcomes; (3) provide clinical use case scenarios and design case studies to identify socioenvironmental determinants of health associated with the prevalence of obesity, and (4) design a dashboard that demonstrates the use of UPHO in the context of obesity surveillance using the provided scenarios.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The system design includes a knowledge graph generation component that provides contextual knowledge from relevant domains of interest. This system leverages semantics using concepts, properties, and axioms from existing ontologies. In addition, we used the publicly available US Centers for Disease Control and Prevention 500 Cities data set to perform multivariate analysis. A cohesive approach that employs machine learning and semantic/logical inference reveals pathways leading to diseases.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In this study, we present 2 clinical case scenarios and a proof-of-concept prototype design of a dashboard that provides warnings, recommendations, and explanations and demonstrates the use of UPHO in the context of obesity surveillance, treatment, and prevention. While exploring the case scenarios using a support vector regression machine learning model, we found that poverty, lack of physical activity, education, and unemployment were the most important predictive variables that contribute to obesity in Memphis, TN.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>The application of UPHO could help reduce health disparities and improve urban population health. The expanded UPHO feature incorporates an additional level of interpretable knowledge to enhance physicians, researchers, and health officials' informed decision-making at both patient and community levels.</p>
        </sec>
        <sec sec-type="registered-report">
          <title>International Registered Report Identifier (IRRID)</title>
          <p>RR2-10.2196/28269 </p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>health surveillance system</kwd>
        <kwd>explainable AI</kwd>
        <kwd>decision support</kwd>
        <kwd>machine learning</kwd>
        <kwd>obesity</kwd>
        <kwd>chronic disease</kwd>
        <kwd>precision health prevention</kwd>
        <kwd>semantic inference</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Enhanced health surveillance systems for chronic disease support could mitigate factors that contribute to the incline of morbidity and mortality of diseases such as obesity. Obesity is linked to increased overall mortality and has reached pandemic proportions, being responsible for approximately 2.8 million deaths annually [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>]. Obesity represents an excessive and abnormal accumulation of body fat, which leads to adverse health effects that impose a health and financial toll on individuals and society [<xref ref-type="bibr" rid="ref2">2</xref>]. More than half of the US population has at least one chronic condition, and 27% are living with multimorbidity [<xref ref-type="bibr" rid="ref3">3</xref>]. These conditions cause more than 1.7 million deaths per year in the United States, where obesity is associated with the top leading causes of death (eg, diabetes, heart disease, stroke, and cancer) [<xref ref-type="bibr" rid="ref4">4</xref>].</p>
        <p>Neighborhood factors such as socioenvironmental determinants of health (SDoH) significantly contribute to these statistics [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Implementation of an intelligent health surveillance platform that incorporates SDoH can improve preparedness, prevention, and management of this obesity pandemic by assisting in the implementation of effective treatment and interventions.</p>
        <p>Health surveillance involves the “ongoing systematic collection, analysis, and interpretation of data essential to the planning, implementation, and evaluation of public health practice, closely integrated with the timely dissemination of these data to those who need to know” [<xref ref-type="bibr" rid="ref9">9</xref>]. Researchers have aimed to develop chronic health surveillance systems to assist in chronic health decision-making [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref16">16</xref>]. The World Health Organization (WHO) developed a conceptual framework for an Urban Public Health Observatory (UPHO) comprised of 3 domains: mission, governance, and knowledge and intelligence, the latter of which incorporates a data management component [<xref ref-type="bibr" rid="ref17">17</xref>]. This framework from WHO therefore provides a strategic model for health surveillance.</p>
        <p>Many current digital health solutions and electronic health record (EHR) systems lack the ability to incorporate machine learning algorithms into their decision-making process, and even if they do, the algorithms used do not have appropriate capabilities to explain the suggested decisions and actions to human users [<xref ref-type="bibr" rid="ref18">18</xref>]. Machine learning approaches, so-called black-box statistics, should be trustworthy, transparent, interpretable, and explainable when making decisions in the clinical or health science setting [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. A system’s explanation constitutes its interpretability [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. Explainable AI (XAI) increases the intelligence delivered to the user by providing explanations, thereby enhancing the interpretability of outcomes and findings. Researcher efforts have been shifting toward applying algorithms that can aid in explaining the results of machine learning models. For instance, the SHAP (Shapley Additive Explanations) analysis [<xref ref-type="bibr" rid="ref23">23</xref>] is an approach that assigns each model feature an importance score for making a particular prediction. Compared to traditional feature importance analyses, the novelty of SHAP lies in its ability to assess importance at the individual patient level. In this paper, we propose a novel approach to explainability that uses knowledge graphs as a semantic infrastructure explainable by design and enriches those graphs with results from machine learning algorithms as metrics and scores. The semantic causal relationships on the graph provide contextual knowledge around a population, and the metrics support those relationships, which provides 2 levels of evidence: knowledge level and statistical level.</p>
        <p>We implement a UPHO platform as a knowledge-based surveillance system that provides better insight to improve decision-making by incorporating SDoH and providing XAI and interpretability functions [<xref ref-type="bibr" rid="ref24">24</xref>]. Our UPHO consists of 3 layers: data, analytics, and application. In this work, we refine the initial design by incorporating data management, knowledge, and intelligence domains (<xref rid="figure1" ref-type="fig">Figure 1</xref>) that are in alignment with the conceptual model by WHO and a focus on the semantics layer.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Expanded Urban Population Health Observatory framework. CDC: US Centers for Control and Prevention; USDA: US Department of Agriculture; KG: knowledge graph; UPHO: Urban Population Health Observatory.</p>
          </caption>
          <graphic xlink:href="formative_v6i7e36055_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>The objectives of this article are to (1) expand UPHO by incorporating a semantics layer, (2) cohesively employ machine learning and semantic/logical inference to provide measurable evidence and detect pathways that lead to undesirable health outcomes, (3) provide clinical case scenarios and design case studies on identifying SDoH associated with obesity prevalence, and (4) provide a dashboard design that demonstrates the use of UPHO in the context of obesity, using the provided case scenario.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>UPHO Expansion</title>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> shows the expansion of the UPHO to incorporate the semantics layer. In the following section, we provide a detailed description of the UPHO platform expansion design.</p>
      </sec>
      <sec>
        <title>Data Management Domain</title>
        <p>The data management domain comprises the data layer. The UPHO collects population-level health and SDoH data and individual-level clinical and demographic data from EHRs through regional registries.</p>
      </sec>
      <sec>
        <title>Data Layer</title>
        <p>To obtain population-level health data, we used the US Centers for Control and Prevention (CDC) 500 Cities Behavior Risk Factors Surveillance System, which includes data regarding chronic diseases and their behavioral risk factors [<xref ref-type="bibr" rid="ref25">25</xref>]. These variables are model-based estimates of crude prevalence among adults aged ≥18 years in 2018. We extracted variables pertaining to obesity, lack of physical activity, lack of insurance, and diabetes mellitus at the census tract level.</p>
        <p>We extracted population-level SDoH variables that pertain to food insecurity, transportation, and socioeconomic stability at zip code, census tract, census block, and census block group levels from the US Census Bureau 2018 American Community Survey [<xref ref-type="bibr" rid="ref26">26</xref>] and the US Department of Agriculture Research Atlas [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
      </sec>
      <sec>
        <title>Knowledge and Intelligence Domain</title>
        <sec>
          <title>Analytics Layer</title>
          <p>The analytics layer pulls raw data from different sources in the data layer and analyzes it to classify it, predict new relations, conduct spatial pattern detection, and calculate new metrics. The analytics layer also performs feature engineering by deriving new metrics and using them to enrich the original data sets.</p>
        </sec>
        <sec>
          <title>Semantics Layer</title>
          <p>The stages of the UPHO semantics layer are shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. In the knowledge representation and axiomatization stages, we use semantic web technologies to develop several domain and application ontologies from relevant domains of interest to provide necessary contextual knowledge. Ontologies are systematic representations of knowledge that can be used to integrate and analyze large amounts of heterogeneous data, thereby allowing classification of knowledge [<xref ref-type="bibr" rid="ref28">28</xref>]. In those ontologies, we define concept hierarchies and rule axioms by using existing domain knowledge, such as the WHO/CDC guidelines, and federal and local sources. We develop new ontologies by reusing several existing domain ontologies. For this study, we adopted concepts, properties, and axioms from 5 different ontologies that we used in our prior work [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref32">32</xref>], specifically (1) disease ontology (DO) [<xref ref-type="bibr" rid="ref31">31</xref>] (eg, obesity, diabetes); (2) the Childhood Obesity Prevention (Knowledge) Enterprise (COPE) ontology [<xref ref-type="bibr" rid="ref29">29</xref>] that defines SDoH concepts such as socioeconomic issues (eg, food deserts, income) and behavioral issues (eg, lack of physical activity, purchasing preference); (3) geographical information system ontology (GISO) [<xref ref-type="bibr" rid="ref32">32</xref>] (eg, zip code, census tract); (4) health indicators ontology (HIO) [<xref ref-type="bibr" rid="ref32">32</xref>]; and (5) the adverse childhood experiences (ACEs) ontology (ACESO), which defines concepts related to ACEs, health outcomes (eg, mental and physical health), interventions, and SDoH, including axioms that define issues like lack of transportation (eg, limited access to a vehicle and limited access to public transit) and food and how they affect routine follow-up activities (eg, missing medical appointments) [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
          <p>We start our semantic analysis using concepts defined in our ontologies and web services to align concepts to actual data resources, allowing us to construct a population knowledge graph structure that abides by an ontology and contains both data and concepts [<xref ref-type="bibr" rid="ref33">33</xref>]. We enrich that knowledge graph using a logical reasoner that uses facts derived from existing knowledge, new knowledge extracted from the analytics layer, and the generic rule axioms defined in the domain ontologies that trigger specific actions under certain conditions.</p>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Urban Population Health Observatory semantic layer framework.</p>
            </caption>
            <graphic xlink:href="formative_v6i7e36055_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Explainable AI</title>
          <p>An effective explainable system accounts for the target user group (eg, physician, researcher). Knowledge of the end user is very important for the delivery of decisions, recommendations, and actions. Each analytics and semantics layer contains an explainability component that can be leveraged in the uppermost health applications layer. To maintain features such as data integration, XAI, and interpretability, we must achieve interoperability by using semantics and ontologies. Explanations adaptable to the user can decrease errors in interpretation by enhancing the interpretability of outcomes and findings.</p>
        </sec>
      </sec>
      <sec>
        <title>Application Domain</title>
        <p>The UPHO platform can be used as a basis to develop several applications, some of which we have already developed, including dashboards [<xref ref-type="bibr" rid="ref24">24</xref>], mobile health (mHealth) apps [<xref ref-type="bibr" rid="ref34">34</xref>], digital assistants, and recommender systems [<xref ref-type="bibr" rid="ref35">35</xref>]. In this article, we leverage the UPHO to implement a dashboard for real-time surveillance. By accessing dynamic knowledge discovered through the UPHO, the dashboard can provide real-time early warnings that are based both on content and context. The platform is accessible to policymakers, physicians, researchers, public health officials, and the public.</p>
      </sec>
      <sec>
        <title>Clinical Scenarios</title>
        <p>The following sections present 2 clinical case scenarios that focus on a physician and a researcher as users to demonstrate the methodology used in the knowledge and intelligence domain layers and the corresponding dashboard design in the application.</p>
        <p>Scenario 1: A physician seeks an effective intervention for an adult African American patient diagnosed with obesity. The physician focuses on how SDoH in the patient’s neighborhood can influence the doctor’s management plans.</p>
        <p>Scenario 2: A researcher investigating the impact of SDoH on obesity seeks an effective intervention for the adult obese populations in Memphis, TN.</p>
      </sec>
      <sec>
        <title>Analytics Layer: Machine Learning Model Development</title>
        <p>We trained a machine learning–based support vector regression (SVR) machine model [<xref ref-type="bibr" rid="ref36">36</xref>,<xref ref-type="bibr" rid="ref37">37</xref>]. We linked CDC 500 Cities population-level obesity and behavior data [<xref ref-type="bibr" rid="ref25">25</xref>] to the population-level social DoH [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>] data set at the census tract level in Memphis, TN. We analyzed 8 features and used a Spearman rank test to assess the positive or negative relationship between each feature. We used a variance inflation factor (VIF) to detect multicollinearity between features. To examine patient neighborhood-level exposure, we used SHAP analysis. <xref ref-type="table" rid="table1">Table 1</xref> shows the summary statistics for features considered for this study. We trained our support vector model on the 85% of randomly selected training data and tested the model on the 15% of remaining data to ensure the generalizability of the model, and we applied the linear kernel function. We scaled our data to have a mean of zero and standard deviation of one. We applied the grid search optimization method to seek optimal hyperparameters to improve model performance using the Caret package in R software (R Foundation for Statistical Computing) [<xref ref-type="bibr" rid="ref38">38</xref>]. In addition, to avoid overfitting 5-fold cross-validation was applied to the training data set. We used root mean square error (RMSE) and <italic>R</italic><sup>2</sup> to evaluate the performance of the model.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary statistics for obesity and related risk factors in Memphis, TN, census tract (n=178 census tracts).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="140"/>
            <col width="260"/>
            <col width="200"/>
            <col width="200"/>
            <col width="200"/>
            <thead>
              <tr valign="top">
                <td>Features</td>
                <td>Operationalization</td>
                <td>Original, mean (SD)</td>
                <td>Training, mean (SD)</td>
                <td>Test, mean (SD)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Obesity</td>
                <td>Model-based estimate for crude prevalence of obesity among adults aged ≥18 years, 2018</td>
                <td>37.50 (7.84)</td>
                <td>37.42 (7.54)</td>
                <td>37.97 (6.95)</td>
              </tr>
              <tr valign="top">
                <td>Low access to supermarket</td>
                <td>Count of low income population more than half mile from a supermarket in the census tract</td>
                <td>1382.20 (108.37)</td>
                <td>1345.68 (967.83)</td>
                <td>1616.17 (1120.23)</td>
              </tr>
              <tr valign="top">
                <td>Black</td>
                <td>Percentage of population that is Black or African American</td>
                <td>63.17 (32.70)</td>
                <td>62.22 (33.04)</td>
                <td>63.72 (31.88)</td>
              </tr>
              <tr valign="top">
                <td>Poverty</td>
                <td>Percentage of population living below the federal poverty line</td>
                <td>28.65 (16.28)</td>
                <td>28.27 (16.18)</td>
                <td>31.06 (17.06)</td>
              </tr>
              <tr valign="top">
                <td>Unemployment</td>
                <td>Percentage of unemployed population</td>
                <td>15.73 (9.31)</td>
                <td>15.97 (9.67)</td>
                <td>14.16 (6.52)</td>
              </tr>
              <tr valign="top">
                <td>High school diploma</td>
                <td>Percentage of population 25 years or older without high school diploma</td>
                <td>10.38 (6.59)</td>
                <td>10.23 (6.70)</td>
                <td>11.35 (5.89)</td>
              </tr>
              <tr valign="top">
                <td>Lack of physical activity</td>
                <td>Model-based estimate for crude prevalence of lack of physical activity among adults aged ≥18 years, 2018</td>
                <td>36.16 (9.80)</td>
                <td>35.97 (9.79)</td>
                <td>37.34 (9.99)</td>
              </tr>
              <tr valign="top">
                <td>Crime</td>
                <td>Crime rate per thousand people</td>
                <td>350.20 (126.26)</td>
                <td>160.99 (337.65)</td>
                <td>111.93 (80.40)</td>
              </tr>
              <tr valign="top">
                <td>Lack of access to insurance</td>
                <td>Model-based estimate for crude prevalence of lack of insurance among adults aged ≥18 years, 2018</td>
                <td>20.21 (6.78)</td>
                <td>20.10 (6.81)</td>
                <td>20.88 (6.67)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Semantics Layer: Knowledge Graph Generation</title>
        <p>We followed the following ordered steps to generate the semantics layer knowledge graph from concepts defined in our domain ontologies.</p>
        <list list-type="order">
          <list-item>
            <p>We use concepts, relations, and axioms from domain ontologies to construct a preliminary population knowledge graph. For our scenario, we start by adding a dummy node that represents either a patient or a population (<xref rid="figure3" ref-type="fig">Figure 3</xref>). We begin connecting that node to concepts like disease, risk factors, physical characteristics, etc. For example, obesity falls into the disease type represented by the <italic>isA</italic> relation in <xref rid="figure3" ref-type="fig">Figure 3</xref>, where <italic>isA</italic> reflects a subtype. For instance, 
            SDoH <italic>isA RiskFactr</italic>, and lackOfTransporation is an SDoH subtype. These different hierarchies are encoded in the ACESO ontology. We also add a prefix before each type to reflect the namespace where that concept is defined (eg, the term DO:Disease reflects that the concept disease is defined in the DO). Relations can also reflect the properties of a node. For example, a patient <italic>livesIn</italic> 38127, which <italic>isA</italic> zip code, and that zip code has 8 census tracts of the type <italic>CensusTract</italic>, defined in the GISO ontology.</p>
          </list-item>
          <list-item>
            <p>We populate the generated graph structure with evidence from the data layer. For instance, our data set contains a variable that shows the prevalence of obesity as a percentage metric in specific neighborhoods. We use that information to add edges to our graph that link obesity (as a disease) to prevalence (as a metric).</p>
          </list-item>
          <list-item>
            <p>We further enrich and refine the initial graph by performing knowledge engineering using the logical reasoner (<xref rid="figure2" ref-type="fig">Figure 2</xref>) and feature engineering using the results from the analytics layer. The logical reasoner uses a set of rule axioms to perform logical inference on concepts already existing in the graph. For instance, our COPE ontology encodes epidemiological causal axioms that link SDoH to negative health outcomes. <xref ref-type="boxed-text" rid="box1">Textbox 1</xref> shows how we encode the generic axioms R1-R3. When we combine those generic rule axioms with facts about a specific census tract, we can infer all the risk factors associated with living in that census tract, eg, knowing the facts F1 can tell us that the population living in that area may be exposed to risk factors that lead to obesity.</p>
          </list-item>
          <list-item>
            <p>After performing the logical inference on the initial graph structure, we incorporate new nodes and edges in the graph corresponding to new concepts (eg, the lackOfPhysicalActivity concept from the COPE ontology) or new relations (eg, <italic>isExposedTo</italic>). The knowledge graph refinement is an iterative process, so we can repeat step 2 until we reach a stable state of the graph after which we can populate the graph with more evidence from our engineered data that we pull from the analytics layer. For that purpose, we use the population-level data about SDoH risk factors collected from US Census, CDC, and USDA. For instance, to capture the lack of physical activity we use the CDC 500 Cities data set. The machine learning analysis performed by the analytics layer provides edges that pertain to prediction (eg,
            <italic>isPredictorOf</italic>, <xref rid="figure3" ref-type="fig">Figure 3</xref>). The final knowledge graph is shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>, which provides a generic view of all possible assumptions we can make about this patient or population.</p>
          </list-item>
          <list-item>
            <p>To gather the most important information from this graph, a user can trace a specific pathway based on both logical inference and machine learning results. The red arrows in <xref rid="figure3" ref-type="fig">Figure 3</xref> reflect the pathway in our scenario.</p>
          </list-item>
        </list>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Knowledge graph that links concepts defined in domain ontologies (eg, GISO: CensusTract) to data resources stored in databases (eg, percentage Black population) or those derived from the analytics layer. The upper part of the figure shows the nodes and edges produced through semantic inference during the knowledge engineering phase. The lower part of the figure shows the nodes and edges added through ML analysis during the feature engineering phase. GISO: geographical information system ontology; HIO: health indicators ontology; ACESO: adverse childhood experiences ontology; COPE: Childhood Obesity Prevention (Knowledge) Enterprise; DO: disease ontology.</p>
          </caption>
          <graphic xlink:href="formative_v6i7e36055_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <boxed-text id="box1" position="float">
          <title>Encoding axioms as general rules, initial facts, or new facts derived from feature engineering or logical reasoning.</title>
          <p>Generic rule axioms</p>
          <list list-type="bullet">
            <list-item>
              <p>COPE:lackOfPhysicialActivity <italic>leadsTo</italic> DO:Obesity (R1)</p>
            </list-item>
            <list-item>
              <p>%ObesityPrevalence:Metric <italic>isHealthIndicatorFor</italic> DO:Obesity (R2)</p>
            </list-item>
            <list-item>
              <p>Obesity:Disease <italic>isRiskFactorOf</italic> Diabetes:Disease (R3)</p>
            </list-item>
          </list>
          <p>Facts</p>
          <list list-type="bullet">
            <list-item>
              <p>individual:Patient <italic>livesIn</italic> “10300”:CensusTract (F1)</p>
            </list-item>
            <list-item>
              <p>“10300”:CensusTract <italic>has</italic> “49”:%PopWLackOfPhysicialActivity (F2)</p>
            </list-item>
            <list-item>
              <p>“10300”:CensusTract <italic>has</italic> “21”:%PopNoHighSchoolDiploma (F3)</p>
            </list-item>
            <list-item>
              <p>“10300”:CensusTract <italic>has</italic> “60”:%UnderPovertyLine (F4)</p>
            </list-item>
            <list-item>
              <p>“10300”:CensusTract <italic>has</italic> “46”:%ObesityPrevalence (F5)</p>
            </list-item>
          </list>
          <p>Feature engineered through multivariate analysis</p>
          <list list-type="bullet">
            <list-item>
              <p>%PopWLackOfPhysicialActivity:Metric <italic>isPredictorOf</italic> ObesityPrevalence:Metric [using F2-F5] (F6)</p>
            </list-item>
          </list>
          <p>Logical reasoning</p>
          <list list-type="bullet">
            <list-item>
              <p>individual:Patient <italic>isExposedTo</italic> LackPhysicalActivity:PhysicalCharacteristic [using F1 and F2] (F7)</p>
            </list-item>
            <list-item>
              <p>individual:Patient <italic>shouldBeScreenedFor</italic> Diabetes:Disease [using R1, R2, R3, F6, F7]</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Ethics Approval</title>
        <p>No ethics review board assessment was required for this study because we used publicly available data.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Machine Learning Analysis</title>
        <p>The significant Spearman rank coefficient and VIF of the 7 features included in this study are shown in <xref ref-type="table" rid="table2">Table 2</xref>. Any feature exhibiting a VIF of greater than 10 was removed. For the SVR model results, we obtained an RMSE of 0.312 for the training set and 0.203 for the test set, while the <italic>R</italic><sup>2</sup> for the training set was 0.91 and that for the testing data set was 0.95 . Since the model provides similar results for training and test data sets, the proposed model does not overfit. The SVR feature importance results range on a scale of 0 to 100, and the greater the score, the most important the feature (<xref ref-type="table" rid="table3">Table 3</xref>). We found that the percentage of the population lacking physical activity, percentage of population below poverty level, percentage of population without high school diploma, percentage of population unemployed, and percentage of Black population were the most important variables when predicting obesity prevalence in Memphis, TN.</p>
        <p><xref rid="figure4" ref-type="fig">Figure 4</xref> shows SHAP’s value plot of feature contribution at the patient neighborhood level (census tract: 10300), which indicates the most important features such as the percentage of the population that lack physical activity and the percentage of population below the poverty level, from the point of view of the prediction of obesity prevalence in the patient neighborhood. The lack of physical activity and poverty had the largest positive (increased) contributions to obesity prevalence. On the other hand, the population of low income and more than a half-mile from the supermarket showed a negative (decreased) contribution but was the least important variable when predicting the patient neighborhood obesity prevalence. The knowledge extracted from our analysis will be used to detect the obesity prevalence pathways, which are defined by the top 5 most important features.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Spearman rank coefficient and variance inflation factor for each feature.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="430"/>
            <col width="440"/>
            <col width="130"/>
            <thead>
              <tr valign="top">
                <td>Features</td>
                <td>Spearman rank coefficient</td>
                <td>VIF<sup>a</sup></td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Low access to supermarket</td>
                <td>0.37</td>
                <td>1.70</td>
              </tr>
              <tr valign="top">
                <td>Black</td>
                <td>0.77</td>
                <td>2.80</td>
              </tr>
              <tr valign="top">
                <td>Poverty</td>
                <td>0.83</td>
                <td>3.66</td>
              </tr>
              <tr valign="top">
                <td>Unemployment</td>
                <td>0.73</td>
                <td>3.02</td>
              </tr>
              <tr valign="top">
                <td>No high school diploma</td>
                <td>0.81</td>
                <td>3.55</td>
              </tr>
              <tr valign="top">
                <td>Lack of physical activity</td>
                <td>0.92</td>
                <td>8.82</td>
              </tr>
              <tr valign="top">
                <td>Crime</td>
                <td>0.37</td>
                <td>1.68</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>VIF: variance inflation factor.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Support vector regression data set–level feature importance score.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="600"/>
            <col width="400"/>
            <thead>
              <tr valign="top">
                <td>Features</td>
                <td>SVR<sup>a</sup> feature importance</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Low access to supermarket</td>
                <td>4.39</td>
              </tr>
              <tr valign="top">
                <td>Black</td>
                <td>68.20</td>
              </tr>
              <tr valign="top">
                <td>Poverty</td>
                <td>78.60</td>
              </tr>
              <tr valign="top">
                <td>Unemployment</td>
                <td>70.16</td>
              </tr>
              <tr valign="top">
                <td>No high school diploma</td>
                <td>73.41</td>
              </tr>
              <tr valign="top">
                <td>Lack of physical activity</td>
                <td>100</td>
              </tr>
              <tr valign="top">
                <td>Crime</td>
                <td>0</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>SVR: support vector regression.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>The Shapley Additive Explanations (SHAP) value plot of the feature contribution (unscaled) for the patient’s neighborhood (census tract:10300). The x-axis represents the SHAP’s value, and the y-axis represents the features. The lack of physical activity and poverty had the largest positive (increase) contributions to obesity prevalence in the patient’s neighborhood.</p>
          </caption>
          <graphic xlink:href="formative_v6i7e36055_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>UPHO: Dashboard Design</title>
        <sec>
          <title>Use Case Scenarios</title>
          <p>In this section, we describe the semantics feature provided by UPHO through a proof-of-concept prototype that will display the different features of the expanded system by implementing the clinical scenarios described in the previous section.</p>
          <p>First, the user will sign into the UPHO platform dashboard, which will determine their specific role and establish the proper access permissions. The user will make the selections from the following menu items:</p>
          <list list-type="bullet">
            <list-item>
              <p>S1. Select an outcome of interest (eg, obesity prevalence, cancer,)</p>
            </list-item>
            <list-item>
              <p>S2. Select analytics aim</p>
            </list-item>
            <list-item>
              <p>S3. Select level of analysis and enter address/location (patient’s address [patient-level], city, county, or state [population-level])</p>
            </list-item>
            <list-item>
              <p>S4. Select geographical level of granularity (eg, zip code, census tract)</p>
            </list-item>
            <list-item>
              <p>S5. Select SDoH domain-specific risk factors</p>
            </list-item>
          </list>
          <p>After making these selections, the system will present on-demand explanations of risk level calculations, based on the selected level of geographic granularity.</p>
        </sec>
        <sec>
          <title>Scenario 1</title>
          <p>The physician selects “obesity prevalence” as the outcome of interest (S1), and “causal pathway analysis” (S2) as the analytics aim, “patient-level” as the level of interest (entering patient’s address, S3), and “census tract” as the geographical level of granularity (S4). The system provides risk-level calculations and descriptive statistics based on the census tract of the patient’s address. The physician also has the option to select a particular SDoH of interest in S5, in which case the system will highlight these nodes in the graph. Finally, the user selects “Explore” to generate the results and a corresponding knowledge graph. These results are tailored to the user’s interest in patient-level analysis and provide an explanative overview of the analysis results (<xref rid="figure5" ref-type="fig">Figure 5</xref>A). The system also allows the user to hover over pathways and nodes to explore explanative knowledge (<xref rid="figure5" ref-type="fig">Figure 5</xref>B, 5C) and offers a summary of recommendations and knowledge (<xref rid="figure5" ref-type="fig">Figure 5</xref>D).</p>
          <fig id="figure5" position="float">
            <label>Figure 5</label>
            <caption>
              <p>The dashboard of the Urban Population Health Observatory displays a physician user interested in obesity prevalence in her patient’s neighborhood with an overview of analysis results (A), explanations displayed when user hovers over a particular pathway (B), knowledge displayed when user hovers over a particular node (C), and summary of recommendations and knowledge (D).  ACESO: adverse childhood experiences ontology; GISO: geographical information system ontology; DO: disease ontology; HIO: health indicators ontology.</p>
            </caption>
            <graphic xlink:href="formative_v6i7e36055_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Scenario 2</title>
          <p>Here the researcher has access to more features. The researcher explores the causal pathway analysis aim in a population-level analysis and enters Memphis, TN, as a location of interest at the census tract–level (S1-S3), as shown in <xref rid="figure6" ref-type="fig">Figure 6</xref>, and the system provides risk-level calculations for the city of Memphis, TN. The researcher also has access to regression plots (<xref rid="figure6" ref-type="fig">Figure 6</xref>, A), which reflect the selection in S5. In section B, the system reports the results from the SVR machine model and provides explanations for each feature included in the model (<xref rid="figure6" ref-type="fig">Figure 6</xref>, B). In section C, the explanation pane presents a knowledge graph showing results tailored to the user’s interest in population-level analysis (<xref rid="figure6" ref-type="fig">Figure 6</xref>, C). The researcher can also hover over pathways and nodes for knowledge (<xref rid="figure6" ref-type="fig">Figure 6</xref>, C, a, b, and c), like the physician in scenario 1. The system also offers the researcher a summary of recommendations and knowledge (<xref rid="figure6" ref-type="fig">Figure 6</xref>, C, d).</p>
          <fig id="figure6" position="float">
            <label>Figure 6</label>
            <caption>
              <p>The dashboard of the Urban Population Health Observatory displays a researcher as the user interested in obesity prevalence in Memphis, TN, with univariate regression plot (A), multivariate analysis (B), and (C) which contains an overview of analysis results (a), explanations displayed when user hovers over a particular pathway (b), knowledge displayed when user hovers over a particular node (c), and summary of recommendations and knowledge (d).  ACESO: adverse childhood experiences ontology; GISO: geographical information system ontology; DO: disease ontology; HIO: health indicators ontology.</p>
            </caption>
            <graphic xlink:href="formative_v6i7e36055_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
      </sec>
      <sec>
        <title>Explanations</title>
        <p>The graph part of the dashboard can serve as a tool for researchers and physicians to semantically explain the recommendations that we made about a specific patient or population. The current version of the graph provides 2 different visual cues, as follows.</p>
        <list list-type="bullet">
          <list-item>
            <p>Tracing pathways on the graph provides visual cues. The red arrows in <xref rid="figure3" ref-type="fig">Figure 3</xref> show the edges that are part of a causal pathway that leads from risk factors to negative health outcomes for the specific patient, zip code, or census tract. While this path is specific to the selected patient or population, it can be used as a generic metapath. For example, Individual <italic>livesIn</italic> CensusTract→<italic>representsA</italic> Neighborhood→<italic>hasPhysicalCharacteristic→RiskFactorFor</italic> Disease. Depending on the level of sophistication desired, the user can trace paths on the graph and click on certain nodes or edges to obtain more insights, including statistically derived evidence or semantically inferred knowledge. They can also track the sources of that knowledge including the ontologies used.</p>
          </list-item>
          <list-item>
            <p>Clicking on a node or edge on the graph displays analysis results or knowledge. The user can hover over a certain edge (eg, lackOfPhysicalActivity</p>
            <p>isPredictorOf</p>
            <p>ObesityPrevalence; <xref rid="figure5" ref-type="fig">Figure 5</xref>B) to obtain an explanation of the data that show lackOfPhysical activity in the patient’s census tract leads to an increase in the prevalence of obesity. Similarly, the user can hover over a metric node (eg, percentage of the population below the poverty line, <xref rid="figure5" ref-type="fig">Figure 5</xref>C) to explain that this patient lives in a neighborhood in which nearly 61% of the population lives below the poverty line, compared to the average in their city, county, or state.</p>
          </list-item>
        </list>
        <p>UPHO’s metrics can be implemented into the backend of EHR systems (eg, Epic), and the results of those metrics can be rendered on the EHR interface in the form of risk scores on dashboards with severity indicators based on thresholds. Physicians can examine these metrics at the population level or individual patient level. UPHO can alternatively be used in a standalone approach by allowing a physician to extract more details about a single patient by providing the patient’s address or a population of patients by providing their city, state, or county. The input is coded to a geographical level of granularity that can be aligned with the population-level data to gain insights into the patient’s environment.</p>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Previous studies provided evidence that socially disadvantaged communities are disproportionately affected by chronic diseases such as obesity [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>], which is a risk factor for developing diabetes, heart disease, and cancer. The significance of UPHO lies in its ability to provide a multifaceted surveillance system design that serves as an apparatus for actualizing effective interventions, addressing concerns in health disparities, providing awareness to the public, and equipping health officials with a surveillance system that will improve population health decision-making and planning [<xref ref-type="bibr" rid="ref24">24</xref>]. Using the semantics layer, the UPHO platform provides contextual knowledge by reusing several ontologies focusing on public health (eg, diseases, transportation, geography).</p>
        <p>The incorporation of semantics provides the user with an additional layer of explainability and interpretability, which could decrease errors in intervention or treatment due to misinterpretation or misunderstanding. The semantics layer can also use ontologies to overcome the challenge of scattered data sources, thereby assisting in the achievement of interoperability, which will be used to maintain features such as data integration, XAI, and interpretability. We apply logical reasoners to extract and supply knowledge despite limited data.</p>
        <p>Similar chronic disease surveillance systems [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref16">16</xref>] have offered approaches to assist in the efforts of improving chronic disease surveillance. Several published systems do not incorporate SDoH data [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. One did not provide an implementation of the systematic framework [<xref ref-type="bibr" rid="ref16">16</xref>] and several of them did not include XAI as a feature.</p>
        <p>We followed the conceptual framework for UPHOs [<xref ref-type="bibr" rid="ref17">17</xref>] and sought to improve the quality of disease surveillance by incorporating advances in AI and Bog Data, including interactive dashboard design, explainability, data integration, and interoperability, and incorporation of multimodal SDoH data. Developing a multidimensional scalable surveillance system to monitor and detect trends and deliver rapid early warnings and recommendations could assist health officials, physicians, and researchers in mitigating a health crisis such as the ongoing COVID-19 pandemic [<xref ref-type="bibr" rid="ref24">24</xref>].</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>One of the major limitations of UPHO is that it collects population data so that neighborhood or population assumptions are made for an individual in a clinical setting. For instance, individuals or patients who live in a particular population or neighborhood might not have the same characteristics as other individuals residing in the same neighborhood or population. However, our platform provides an end-to-end approach to examining the environment one resides and incorporates information that is important for the implementation of effective interventions for a given disease.</p>
        <p>The future work will be focusing on the further development of the UPHO platform, so it can enable timely, insight-driven decisions and inform immediate or long-term health policy responses [<xref ref-type="bibr" rid="ref15">15</xref>] to current and future public health crises.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>This study leveraged semantic technology and presented a proof-of-concept prototype design for our knowledge-based surveillance system, UPHO, which aims to reduce health disparities and improve population health. The expanded feature incorporates another level of interpretable knowledge needed to inform physicians, researchers, and health officials’ decision-making process at the community level. Incorporating XAI helps with the explainability and interpretability of the relevant data, information, and knowledge. Users who are not equipped with domain knowledge could extract common sense knowledge from a system that incorporates XAI [<xref ref-type="bibr" rid="ref35">35</xref>]. We as humans need a clear visualization and understanding of relationships between parameters in a system to make informed decisions. The lack of understandability and explainability in the health care and public health domains often leads to poor transparency, lack of accountability, and ultimately lower quality of care and biased health policies [<xref ref-type="bibr" rid="ref39">39</xref>]. Thus, the incorporation of semantics and XAI can improve fairness, accountability, transparency, and trust in health care and public health.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ACE</term>
          <def>
            <p>adverse childhood experience</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ACESO</term>
          <def>
            <p>adverse childhood experiences ontology</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">CDC</term>
          <def>
            <p>US Centers for Control and Prevention</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">COPE</term>
          <def>
            <p>Childhood Obesity Prevention (Knowledge) Enterprise</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">DO</term>
          <def>
            <p>disease ontology</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">GISO</term>
          <def>
            <p>geographical information system ontology</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">HIO</term>
          <def>
            <p>health indicators ontology</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">mHealth</term>
          <def>
            <p>mobile health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">RMSE</term>
          <def>
            <p>root mean square error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">SDoH</term>
          <def>
            <p>socioenvironmental determinants of health</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">SHAP</term>
          <def>
            <p>Shapley Additive Explanations</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">SVR</term>
          <def>
            <p>support vector regression</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">UPHO</term>
          <def>
            <p>Urban Population Health Observatory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">VIF</term>
          <def>
            <p>variance inflation factor</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">WHO</term>
          <def>
            <p>World Health Organization</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">XAI</term>
          <def>
            <p>explainable artificial intelligence</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The funding for this study is provided by the University of Tennessee Health Science Center.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <source>Obesity 2021</source>
          <access-date>2021-09-09</access-date>
          <publisher-loc>Geneva</publisher-loc>
          <publisher-name>World Health Organization</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/facts-in-pictures/detail/6-facts-on-obesity">https://www.who.int/news-room/facts-in-pictures/detail/6-facts-on -obesity</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abdelaal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>le Roux</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Docherty</surname>
              <given-names>NG</given-names>
            </name>
          </person-group>
          <article-title>Morbidity and mortality associated with obesity</article-title>
          <source>Ann Transl Med</source>
          <year>2017</year>
          <month>04</month>
          <volume>5</volume>
          <issue>7</issue>
          <fpage>161</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.21037/atm.2017.03.107"/>
          </comment>
          <pub-id pub-id-type="doi">10.21037/atm.2017.03.107</pub-id>
          <pub-id pub-id-type="medline">28480197</pub-id>
          <pub-id pub-id-type="pii">atm-05-07-161</pub-id>
          <pub-id pub-id-type="pmcid">PMC5401682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <source>Health and economic costs of chronic diseases</source>
          <year>2021</year>
          <month>06</month>
          <day>23</day>
          <access-date>2021-09-09</access-date>
          <publisher-loc>Atlanta</publisher-loc>
          <publisher-name>Centers for Disease Control and Prevention</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/chronicdisease/about/costs/index.htm">https://www.cdc.gov/chronicdisease/about/costs/index.htm</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boersma</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Black</surname>
              <given-names>LI</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>BW</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of multiple chronic conditions among US adults, 2018</article-title>
          <source>Prev Chronic Dis</source>
          <year>2020</year>
          <month>09</month>
          <day>17</day>
          <volume>17</volume>
          <fpage>E106</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/pcd/issues/2020/20_0130.htm"/>
          </comment>
          <pub-id pub-id-type="doi">10.5888/pcd17.200130</pub-id>
          <pub-id pub-id-type="medline">32945769</pub-id>
          <pub-id pub-id-type="pii">E106</pub-id>
          <pub-id pub-id-type="pmcid">PMC7553211</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cardel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Donahoo</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Feingold</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Anawalt</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Boyce</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Social and environmental factors influencing obesity</article-title>
          <source>Endotext</source>
          <year>2000</year>
          <publisher-loc>South Dartmouth</publisher-loc>
          <publisher-name>MDText.com, Inc</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Suglia</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Shelton</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Hsiao</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>YC</given-names>
            </name>
            <name name-style="western">
              <surname>Rundle</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Link</surname>
              <given-names>BG</given-names>
            </name>
          </person-group>
          <article-title>Why the neighborhood social environment is critical in obesity prevention</article-title>
          <source>J Urban Health</source>
          <year>2016</year>
          <month>02</month>
          <day>15</day>
          <volume>93</volume>
          <issue>1</issue>
          <fpage>206</fpage>
          <lpage>212</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26780582"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11524-015-0017-6</pub-id>
          <pub-id pub-id-type="medline">26780582</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11524-015-0017-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC4794461</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reidpath</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Burns</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Garrard</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mahoney</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Townsend</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>An ecological study of the relationship between social and environmental determinants of obesity</article-title>
          <source>Health Place</source>
          <year>2002</year>
          <month>6</month>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>141</fpage>
          <lpage>145</lpage>
          <pub-id pub-id-type="doi">10.1016/s1353-8292(01)00028-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yusuf</surname>
              <given-names>ZI</given-names>
            </name>
            <name name-style="western">
              <surname>Dongarwar</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Yusuf</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Salihu</surname>
              <given-names>HM</given-names>
            </name>
          </person-group>
          <article-title>Social determinants of overweight and obesity among children in the United States</article-title>
          <source>Int J MCH AIDS</source>
          <year>2020</year>
          <month>12</month>
          <day>28</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <lpage>33</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32123625"/>
          </comment>
          <pub-id pub-id-type="doi">10.21106/ijma.337</pub-id>
          <pub-id pub-id-type="medline">32123625</pub-id>
          <pub-id pub-id-type="pii">IJMA-9-22</pub-id>
          <pub-id pub-id-type="pmcid">PMC7031877</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thacker</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Berkelman</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Public health surveillance in the United States</article-title>
          <source>Epidemiol Rev</source>
          <year>1988</year>
          <volume>10</volume>
          <fpage>164</fpage>
          <lpage>190</lpage>
          <pub-id pub-id-type="doi">10.1093/oxfordjournals.epirev.a036021</pub-id>
          <pub-id pub-id-type="medline">3066626</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rotmensch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tlimat</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Horng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Learning a health knowledge graph from electronic medical records</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>07</month>
          <day>20</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>5994</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://dx.doi.org/10.1038/s41598-017-05778-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-017-05778-z</pub-id>
          <pub-id pub-id-type="medline">28729710</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-017-05778-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC5519723</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sheth</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Anantharam</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Thirunarayan</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>kHealth: proactive personalized actionable information for better healthcare</article-title>
          <year>2014</year>
          <conf-name>40th Int’l Conf Very Large Databases Workshop Personal Data Analytics in the Internet of Things (PDA@IOT)</conf-name>
          <conf-date>2014</conf-date>
          <conf-loc>online</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Qi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Agu</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Seneviratne</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>McCusker</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Making study populations visible through knowledge graphs</article-title>
          <source>Lecture Notes Comput Sci</source>
          <year>2019</year>
          <fpage>53</fpage>
          <lpage>68</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-30796-7_4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seneviratne</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Rashid</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chari</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Knowledge integration for disease characterization: a breast cancer example</article-title>
          <source>Int Semantic Web Conf</source>
          <year>2018</year>
          <fpage>223</fpage>
          <lpage>238</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-00668-6_14</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gyrard</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Manas</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Saeedeh</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnaprasad</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Amit</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Personalized health knowledge graph</article-title>
          <source>ISWC 2018 Contextualized Knowledge Graph Workshop</source>
          <year>2018</year>
          <fpage>1</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://scholarcommons.sc.edu/cgi/viewcontent.cgi?article=1005&#38;context=aii_fac_pub"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Lavigne</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Okhmatovskaia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Buckeridge</surname>
              <given-names>DL</given-names>
            </name>
          </person-group>
          <article-title>PopHR: a knowledge-based platform to support integration, analysis, and visualization of population health data</article-title>
          <source>Ann N Y Acad Sci</source>
          <year>2017</year>
          <month>01</month>
          <day>17</day>
          <volume>1387</volume>
          <issue>1</issue>
          <fpage>44</fpage>
          <lpage>53</lpage>
          <pub-id pub-id-type="doi">10.1111/nyas.13271</pub-id>
          <pub-id pub-id-type="medline">27750378</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Castillo-Salgado</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Developing an academia-based public health observatory: the new global public health observatory with emphasis on urban health at Johns Hopkins Bloomberg School of Public Health</article-title>
          <source>Cad. Saúde Pública</source>
          <year>2015</year>
          <month>11</month>
          <volume>31</volume>
          <issue>suppl 1</issue>
          <fpage>286</fpage>
          <lpage>293</lpage>
          <pub-id pub-id-type="doi">10.1590/0102-311x00132914</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caiaffa</surname>
              <given-names>WT</given-names>
            </name>
            <name name-style="western">
              <surname>Friche</surname>
              <given-names>AAL</given-names>
            </name>
            <name name-style="western">
              <surname>Dias</surname>
              <given-names>MAS</given-names>
            </name>
            <name name-style="western">
              <surname>Meireles</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Ignacio</surname>
              <given-names>CF</given-names>
            </name>
            <name name-style="western">
              <surname>Prasad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kano</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Developing a conceptual framework of urban health observatories toward integrating research and evidence into urban policy for health and health equity</article-title>
          <source>J Urban Health</source>
          <year>2014</year>
          <month>02</month>
          <day>22</day>
          <volume>91</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>16</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23974945"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11524-013-9812-0</pub-id>
          <pub-id pub-id-type="medline">23974945</pub-id>
          <pub-id pub-id-type="pmcid">PMC3907625</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doshi-Velez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Towards a rigorous science of interpretable machine learning</article-title>
          <source>Mach Learn</source>
          <year>2017</year>
          <fpage>2</fpage>
          <pub-id pub-id-type="doi">10.1201/9780367816377-16</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Battaglia</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Hamrick</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Relational inductive biases, deep learning, and graph networks</source>
          <year>2018</year>
          <access-date>2022-06-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1806.01261">https://arxiv.org/abs/1806.01261</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Angelov</surname>
              <given-names>PP</given-names>
            </name>
            <name name-style="western">
              <surname>Soares</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>NI</given-names>
            </name>
            <name name-style="western">
              <surname>Atkinson</surname>
              <given-names>PM</given-names>
            </name>
          </person-group>
          <article-title>Explainable artificial intelligence: an analytical review</article-title>
          <source>WIREs Data Mining Knowl Discov</source>
          <year>2021</year>
          <month>07</month>
          <day>12</day>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <pub-id pub-id-type="doi">10.1002/widm.1424</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenfeld</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Richardson</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Explainability in human–agent systems</article-title>
          <source>Auton Agent Multi-Agent Syst</source>
          <year>2019</year>
          <month>5</month>
          <day>13</day>
          <volume>33</volume>
          <issue>6</issue>
          <fpage>673</fpage>
          <lpage>705</lpage>
          <pub-id pub-id-type="doi">10.1007/s10458-019-09408-y</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Biemann</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>What do we need to build explainable AI systems for the medical domain?</source>
          <year>2017</year>
          <access-date>2022-06-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1712.09923">https://arxiv.org/abs/1712.09923</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lundberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A unified approach to interpreting model predictions</article-title>
          <source>Proc Adv Neural Inf Proc Syst</source>
          <year>2017</year>
          <fpage>4768</fpage>
          <lpage>4777</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://proceedings.neurips.cc/paper/2017/hash/8a20a8621978632d76c43dfd28b67767-Abstract.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brakefield</surname>
              <given-names>WS</given-names>
            </name>
            <name name-style="western">
              <surname>Ammar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Olusanya</surname>
              <given-names>OA</given-names>
            </name>
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>An Urban Population Health Observatory system to support COVID-19 pandemic preparedness, response, and management: design and development study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>06</month>
          <day>16</day>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>e28269</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/6/e28269/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/28269</pub-id>
          <pub-id pub-id-type="medline">34081605</pub-id>
          <pub-id pub-id-type="pii">v7i6e28269</pub-id>
          <pub-id pub-id-type="pmcid">PMC8211099</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="web">
          <source>500 cities project: 2016 to 2019</source>
          <year>2020</year>
          <month>12</month>
          <day>08</day>
          <access-date>2021-09-20</access-date>
          <publisher-loc>Atlanta</publisher-loc>
          <publisher-name>Centers for Disease Control and Prevention</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/places/about/500-cities-2016-2019/index.html">https://www.cdc.gov/places/about/500-cities-2016-2019/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="web">
          <article-title>About the ACS</article-title>
          <source>U. S. Census Bureau</source>
          <year>2021</year>
          <month>01</month>
          <day>04</day>
          <access-date>2021-09-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/programs-surveys/acs/about.html">https://www.census.gov/programs-surveys/acs/about.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <article-title>Economic Research Service: data sources</article-title>
          <source>U.S. Department of Agriculture</source>
          <access-date>2021-09-20</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ers.usda.gov/topics/farm-economy/farm-sector-income-finances/data-sources/">https://www.ers.usda.gov/topics/farm- economy/farm-sector-income-finances/data-sources/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Haendel</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Chute</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Robinson</surname>
              <given-names>PN</given-names>
            </name>
          </person-group>
          <article-title>Classification, ontology, and precision medicine</article-title>
          <source>N Engl J Med</source>
          <year>2018</year>
          <month>10</month>
          <day>11</day>
          <volume>379</volume>
          <issue>15</issue>
          <fpage>1452</fpage>
          <lpage>1462</lpage>
          <pub-id pub-id-type="doi">10.1056/nejmra1615014</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Buckeridge</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Dubé</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>COPE: Childhood obesity prevention [knowledge] enterprise</article-title>
          <source>Artific Intell Med</source>
          <year>2011</year>
          <fpage>225</fpage>
          <lpage>229</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-642-22218-4_28</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brenas</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>EK</given-names>
            </name>
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Adverse childhood experiences ontology for mental health surveillance, research, and evaluation: advanced knowledge representation and semantic web techniques</article-title>
          <source>JMIR Ment Health</source>
          <year>2019</year>
          <month>05</month>
          <day>21</day>
          <volume>6</volume>
          <issue>5</issue>
          <fpage>e13498</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2019/5/e13498/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13498</pub-id>
          <pub-id pub-id-type="medline">31115344</pub-id>
          <pub-id pub-id-type="pii">v6i5e13498</pub-id>
          <pub-id pub-id-type="pmcid">PMC6707574</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schriml</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Arze</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Nadendla</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>YW</given-names>
            </name>
            <name name-style="western">
              <surname>Mazaitis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Felix</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kibbe</surname>
              <given-names>WA</given-names>
            </name>
          </person-group>
          <article-title>Disease Ontology: a backbone for disease semantic integration</article-title>
          <source>Nucleic Acids Res</source>
          <year>2012</year>
          <month>01</month>
          <day>12</day>
          <volume>40</volume>
          <issue>D1</issue>
          <fpage>D940</fpage>
          <lpage>D946</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/22080554"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/nar/gkr972</pub-id>
          <pub-id pub-id-type="medline">22080554</pub-id>
          <pub-id pub-id-type="pii">gkr972</pub-id>
          <pub-id pub-id-type="pmcid">PMC3245088</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Okhmatovskaia</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Izadi</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Naderi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mondor</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jauvin</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Buckeridge</surname>
              <given-names>DL</given-names>
            </name>
          </person-group>
          <article-title>PHIO: a knowledge base for interpretation and calculation of public health indicators</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2013</year>
          <volume>192</volume>
          <fpage>1207</fpage>
          <pub-id pub-id-type="medline">23920981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ehrlinger</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <source>Towards a definition of knowledge graphs</source>
          <year>2016</year>
          <access-date>2022-06-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ceur-ws.org/Vol-1695/paper4.pdf">http://ceur-ws.org/Vol-1695/paper4.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ammar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bailey</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Using a personal health library-enabled mHealth recommender system for self-management of diabetes among underserved populations: use case for knowledge graphs and linked data</article-title>
          <source>JMIR Form Res</source>
          <year>2021</year>
          <month>03</month>
          <day>16</day>
          <volume>5</volume>
          <issue>3</issue>
          <fpage>e24738</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://formative.jmir.org/2021/3/e24738/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24738</pub-id>
          <pub-id pub-id-type="medline">33724197</pub-id>
          <pub-id pub-id-type="pii">v5i3e24738</pub-id>
          <pub-id pub-id-type="pmcid">PMC8075073</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ammar</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Explainable artificial intelligence recommendation system by leveraging the semantics of adverse childhood experiences: proof-of-concept prototype development</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <month>11</month>
          <day>04</day>
          <volume>8</volume>
          <issue>11</issue>
          <fpage>e18752</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/11/e18752/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18752</pub-id>
          <pub-id pub-id-type="medline">33146623</pub-id>
          <pub-id pub-id-type="pii">v8i10e18752</pub-id>
          <pub-id pub-id-type="pmcid">PMC7673979</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Awad</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Khanna</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Support vector regression</article-title>
          <source>Efficient Learning Machines: Theories, Concepts, and Applications for Engineers and System Designers</source>
          <year>2015</year>
          <publisher-loc>online</publisher-loc>
          <publisher-name>apress</publisher-name>
          <fpage>67</fpage>
          <lpage>80</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Drucker</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Burges</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kaufman</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Smola</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vapnik</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <source>Support vector regression machines</source>
          <year>1997</year>
          <access-date>2022-06-27</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://papers.neurips.cc/paper/1238-support-vector-regression-machines.pdf">http://papers.neu rips.cc/paper/1238-support-vector-regression-machines.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kuhn</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Building predictive models in R using the caret package</article-title>
          <source>J Stat Soft</source>
          <year>2008</year>
          <volume>28</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.18637/jss.v028.i05</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shaban-Nejad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michalowski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Buckeridge</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Guest editorial explainable AI: towards fairness, accountability, transparency and trust in healthcare</article-title>
          <source>IEEE J Biomed Health Inform</source>
          <year>2021</year>
          <month>7</month>
          <volume>25</volume>
          <issue>7</issue>
          <fpage>2374</fpage>
          <lpage>2375</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2021.3088832</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
