<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e38399</article-id>
      <article-id pub-id-type="pmid">36656633</article-id>
      <article-id pub-id-type="doi">10.2196/38399</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Predicting Openness of Communication in Families With Hereditary Breast and Ovarian Cancer Syndrome: Natural Language Processing Analysis</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Pozzar</surname>
            <given-names>Rachel</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Khalilian</surname>
            <given-names>Engineer Reza</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zhao</surname>
            <given-names>Runchen</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Baroutsou</surname>
            <given-names>Vasiliki</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3475-4831</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Cerqueira Gonzalez Pena</surname>
            <given-names>Rodrigo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9010-2830</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Schweighoffer</surname>
            <given-names>Reka</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4358-2517</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Caiata-Zufferey</surname>
            <given-names>Maria</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-4197-8913</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>Sue</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3785-2445</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Hesse-Biber</surname>
            <given-names>Sharlene</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff5" ref-type="aff">5</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2169-1993</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Ciorba</surname>
            <given-names>Florina M</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff6" ref-type="aff">6</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2773-4499</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Lauer</surname>
            <given-names>Gerhard</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0230-2574</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Katapodi</surname>
            <given-names>Maria</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Clinical Research</institution>
            <institution>University of Basel</institution>
            <addr-line>Missionstrasse 64</addr-line>
            <addr-line>Basel, 4055</addr-line>
            <country>Switzerland</country>
            <phone>41 612070430</phone>
            <email>maria.katapodi@unibas.ch</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-3903-3750</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author">
          <collab>CASCADE Consortium</collab>
          <xref rid="aff8" ref-type="aff">8</xref>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Clinical Research</institution>
        <institution>University of Basel</institution>
        <addr-line>Basel</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Center for Data Analytics</institution>
        <institution>University of Basel</institution>
        <addr-line>Basel</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Competence Centre for Healthcare Practices and Policies</institution>
        <institution>Department of Business Economics, Health and Social Care</institution>
        <institution>University of Applied Sciences and Arts of Southern Switzerland</institution>
        <addr-line>Manno</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>College of Nursing</institution>
        <institution>Yonsei University</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>Department of Sociology</institution>
        <institution>Boston College</institution>
        <addr-line>Chestnut Hill, MA</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Department of Mathematics and Computer Science</institution>
        <institution>University of Basel</institution>
        <addr-line>Basel</addr-line>
        <country>Switzerland</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Gutenberg-Institut für Weltliteratur und schriftorientierte Medien</institution>
        <institution>Abteilung Buchwissenschaft Johannes Gutenberg</institution>
        <institution>Universität Mainz Philosophicum</institution>
        <addr-line>Mainz</addr-line>
        <country>Germany</country>
      </aff>
      <aff id="aff8">
        <label>8</label>
        <institution>See Acknowledgments</institution>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Maria Katapodi <email>maria.katapodi@unibas.ch</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>19</day>
        <month>1</month>
        <year>2023</year>
      </pub-date>
      <volume>7</volume>
      <elocation-id>e38399</elocation-id>
      <history>
        <date date-type="received">
          <day>31</day>
          <month>3</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>23</day>
          <month>6</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>11</day>
          <month>7</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>24</day>
          <month>11</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Vasiliki Baroutsou, Rodrigo Cerqueira Gonzalez Pena, Reka Schweighoffer, Maria Caiata-Zufferey, Sue Kim, Sharlene Hesse-Biber, Florina M Ciorba, Gerhard Lauer, Maria Katapodi,  CASCADE Consortium. Originally published in JMIR Formative Research (https://formative.jmir.org), 19.01.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2023/1/e38399" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>In health care research, patient-reported opinions are a critical element of personalized medicine and contribute to optimal health care delivery. The importance of integrating natural language processing (NLP) methods to extract patient-reported opinions has been gradually acknowledged over the past years. One form of NLP is sentiment analysis, which extracts and analyses information by detecting feelings (thoughts, emotions, attitudes, etc) behind words. Sentiment analysis has become particularly popular following the rise of digital interactions. However, NLP and sentiment analysis in the context of intrafamilial communication for genetic cancer risk is still unexplored. Due to privacy laws, intrafamilial communication is the main avenue to inform at-risk relatives about the pathogenic variant and the possibility of increased cancer risk.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The study examined the role of sentiment in predicting openness of intrafamilial communication about genetic cancer risk associated with hereditary breast and ovarian cancer (HBOC) syndrome.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We used narratives derived from 53 in-depth interviews with individuals from families that harbor pathogenic variants associated with HBOC: first, to quantify openness of communication about cancer risk, and second, to examine the role of sentiment in predicting openness of communication. The interviews were conducted between 2019 and 2021 in Switzerland and South Korea using the same interview guide. We used NLP to extract and quantify textual features to construct a handcrafted lexicon about interpersonal communication of genetic testing results and cancer risk associated with HBOC. Moreover, we examined the role of sentiment in predicting openness of communication using a stepwise linear regression model. To test model accuracy, we used a split-validation set. We measured the performance of the training and testing model using area under the curve, sensitivity, specificity, and root mean square error.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Higher “openness of communication” scores were associated with higher overall net sentiment score of the narrative, higher fear, being single, having nonacademic education, and higher informational support within the family. Our results demonstrate that NLP was highly effective in analyzing unstructured texts from individuals of different cultural and linguistic backgrounds and could also reliably predict a measure of “openness of communication” (area under the curve=0.72) in the context of genetic cancer risk associated with HBOC.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study showed that NLP can facilitate assessment of openness of communication in individuals carrying a pathogenic variant associated with HBOC. Findings provided promising evidence that various features from narratives such as sentiment and fear are important predictors of interpersonal communication and self-disclosure in this context. Our approach is promising and can be expanded in the field of personalized medicine and technology-mediated communication.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>cascade testing</kwd>
        <kwd>dictionary-based approach</kwd>
        <kwd>family communication</kwd>
        <kwd>hereditary breast and ovarian cancer</kwd>
        <kwd>HBOC</kwd>
        <kwd>sentiment analysis</kwd>
        <kwd>text mining</kwd>
        <kwd>natural language processing</kwd>
        <kwd>cancer</kwd>
        <kwd>hereditary</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>Natural language processing (NLP) is a computer-assisted analytical approach for automatically evaluating and interpreting human language by extracting meaningful insights from textual data sets [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref3">3</xref>]. NLP has been broadly used in various fields in the recent past, for example, in financial and business marketing, education, and health care [<xref ref-type="bibr" rid="ref4">4</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. The typical applications of NLP include information extraction, sentiment and semantic analysis, text classification, and text summarization. Among the different NLP applications, sentiment analysis has become particularly popular in recent years following the rise of digital communication and social media [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. Sentiment analysis aims to assess whether people’s opinions, emotions, and attitudes toward a certain event or experience are positive, negative, or neutral [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>] and generates valuable insights that lead to the improvement of a new service or product.</p>
      <p>In health care–related studies, patient-reported insights are an essential component of personalized medicine and contribute to optimal health care delivery. Researchers have applied NLP to extract and analyze patient-reported insights from social media and for different topics, for example, social exchange patterns in web-based health platforms [<xref ref-type="bibr" rid="ref12">12</xref>], needs of patients and caregivers in different disease entities [<xref ref-type="bibr" rid="ref13">13</xref>], online support groups for patients with breast cancer [<xref ref-type="bibr" rid="ref14">14</xref>], or awareness for Lynch syndrome (LS) [<xref ref-type="bibr" rid="ref15">15</xref>]. A major limitation of this approach is that population characteristics (age, socioeconomic status, etc) are often unavailable, which limits the clinical applicability of findings and may create disparities either due to increased representation or lack thereof of certain population subgroups. Others have applied NLP to clinical notes originating from electronic medical records to describe patients’ experiences with symptoms [<xref ref-type="bibr" rid="ref16">16</xref>] or free-text data from patient surveys evaluating the quality of hospital services [<xref ref-type="bibr" rid="ref17">17</xref>]. One limitation of this approach is the lack of depth in these data sources, either because they lack the patient’s perspective or because the texts are limited in scope and volume. We identified only a few studies that applied NLP to unstructured narratives collected from in-depth interviews aiming to describe experiences with cancer ambulatory services [<xref ref-type="bibr" rid="ref18">18</xref>] or to predict changes in substance use [<xref ref-type="bibr" rid="ref19">19</xref>] and perceived loneliness among older adults [<xref ref-type="bibr" rid="ref20">20</xref>].</p>
      <p>NLP and sentiment analysis in the context of intrafamilial communication for genetic cancer risk is unexplored. Due to privacy laws, individuals carrying pathogenic variants in cancer-causing genes have a key role in disseminating information to relatives and in advocating for genetic testing [<xref ref-type="bibr" rid="ref21">21</xref>]. This self-disclosure process is currently the main avenue to alert relatives to their own risk of carrying the pathogenic variant. Self-disclosure is a process of interpersonal communication by which one person reveals information about themselves to another person, or a small intimate group, for example, their family. The information exchange can be based on verbal and nonverbal cues and can be face to face or technology mediated. Most importantly, in addition to information exchange, self-disclosure can include thoughts, emotional experiences and feelings, aspirations, goals, fears, likes, and dislikes [<xref ref-type="bibr" rid="ref22">22</xref>]. During self-disclosure, humans adjust and adapt their verbal and nonverbal communication, and messages are produced, interpreted, understood, or misunderstood [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. Intrafamilial communication for genetic cancer risk may involve significant levels of uncertainty and potential conflicts since the meaning of self-disclosure about the cancer-causing variant can be shaped by opposing arguments and negative responses from others. Indeed, information exchange about genetic cancer risk may be easier with some family members or may present a particularly difficult moment with others [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>].</p>
      <p>Predicting openness of communication and examining the role of sentiment in intrafamilial communication of genetic cancer risk may be used to enrich message tailoring in technology-assisted interventions. In this study, we examined the role of sentiment in predicting openness of communication about genetic cancer risk associated with hereditary breast and ovarian cancer (HBOC) syndrome. HBOC is a hereditary cancer syndrome that affects both men and women and accounts for a significant number of different cancers, such as breast, ovarian, pancreatic, and prostate [<xref ref-type="bibr" rid="ref27">27</xref>]. Sharing information about HBOC-causing pathogenic variants is a complex process of intrafamilial communication and a key element of public health interventions aiming to promote cascade testing of relatives and cancer prevention and control [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. In this study, we used narrative data collected with in-depth interviews: first, to quantify openness of communication about HBOC cancer risk, and second, to examine the role of sentiment in predicting openness of communication.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Design, Population, Settings, and Procedures</title>
        <p>This analysis is part of a larger ongoing study, the Swiss CASCADE cohort, which follows adult (aged ≥18 years) men and women from families that harbor pathogenic variants associated with HBOC or LS. The cohort includes individuals who had genetic testing, confirming either the presence or the absence of the familial pathogenic variant, and their untested relatives with unknown mutation status. Eligible participants may have had a cancer diagnosis, or they could be cancer-free at the time of enrolment in the study. Recruitment takes place at 8 different oncology and genetic testing centers in the German-, French-, and Italian-speaking regions of Switzerland. The study collects survey data designed to elicit factors that enhance cascade genetic testing and cancer surveillance for HBOC and LS. A subsample of participants has consented to provide narrative data regarding family communication of test results. For the purposes of this paper, we focused only on individuals who have had genetic testing for HBOC-associated pathogenic variants and accepted to provide narrative data.</p>
      </sec>
      <sec>
        <title>Ethics Approval</title>
        <p>The study protocol has been approved by the Ethics Committee of Northwest Switzerland (BASEC 2016-02052) and is publicly available (ClinicalTrials.gov NCT03124212) [<xref ref-type="bibr" rid="ref30">30</xref>]. We also used available data from participants in the K-CASCADE study (ClinicalTrials.gov NCT04214210) in South Korea, which focuses on HBOC. K-CASCADE and the collaboration of the 2 studies has been approved by local ethics committees (Severance Hospital Institutional Review Board: 4-2020-0520). K-CASCADE is identical to the Swiss CASCADE in respect to scope, research design, participant eligibility criteria (except for age ≥19 years), and data collection methodology. Participants to K-CASCADE are recruited from 5 hospitals in South Korea [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
      </sec>
      <sec>
        <title>Narrative Data</title>
        <p>Narrative data included in this paper were collected from 44 individuals living in Switzerland and 9 in South Korea. The in-depth interviews were conducted between April 2019 and June 2021 either face to face or online (after April 2020 due to the COVID-19 pandemic) by trained research staff in German, French, Italian, English, and Korean using the same interview guide. Interview questions were designed to explore general communication patterns within family networks and specific experiences and barriers of family communication regarding genetic risk including discussions with health care providers. Examples of questions included in the interview guide are “What are some issues (barriers) that people might experience, related to sharing genetic risk information with family members?” and “Think of your own experience of (not) sharing genetic risk information with family members. What did you do and how did you decide about it?” Interviews were recorded, and all narrative data were transcribed verbatim in the original language in Microsoft Word and translated into English for this paper.</p>
      </sec>
      <sec>
        <title>Survey Data</title>
        <p>Survey data were collected on an ongoing basis, starting in fall 2017 and occurring approximately 18-24 months apart. Self-administered surveys assessed demographic and clinical characteristics [<xref ref-type="bibr" rid="ref30">30</xref>]. The surveys also included investigator-developed items that have been associated with family communication and intention to inform relatives about genetic cancer risk. These items assess informational support among family members, preference for patient-mediated communication of genetic testing results, and perceived utility of genetic testing for relatives (<xref ref-type="boxed-text" rid="box1">Textbox 1</xref>). These items are scored on 7-point Likert-type scales ranging from 1 “Strongly Disagree” to 7 “Strongly Agree.” Respondents also completed the Informing Relatives Inventory (IRI), a 37-item scale assessing knowledge, motivation, and self-efficacy to disclose genetic cancer risk to relatives [<xref ref-type="bibr" rid="ref32">32</xref>]. IRI items are also scored on a 7-point Likert-type scale, with higher overall score indicating greater intention to inform relatives about genetic cancer risk.</p>
        <boxed-text id="box1" position="float">
          <title>Items from the CASCADE baseline survey used for this study.</title>
          <p>Demographic characteristics</p>
          <list list-type="bullet">
            <list-item>
              <p>Age</p>
            </list-item>
            <list-item>
              <p>Sex (female/male)</p>
            </list-item>
            <list-item>
              <p>Education level (elementary-, high school–, or technical school–graduate or academic degree)</p>
            </list-item>
            <list-item>
              <p>Marital status (married or living as married, single, divorced or separated, or widowed)</p>
            </list-item>
            <list-item>
              <p>Employment status (working full time, nonworking, or retired)</p>
            </list-item>
          </list>
          <p>Clinical characteristics</p>
          <list list-type="bullet">
            <list-item>
              <p>Cancer status (affected or never diagnosed with cancer)</p>
            </list-item>
            <list-item>
              <p>Genetic testing result (positive or negative for the familial pathogenic variant)</p>
            </list-item>
          </list>
          <p>Family communication</p>
          <list list-type="bullet">
            <list-item>
              <p>“In our family when I have a health problem there is great willingness to share information with each other”</p>
            </list-item>
            <list-item>
              <p>“I would prefer not to discuss about genetic testing results with anyone in my family”</p>
            </list-item>
            <list-item>
              <p>“If you have blood relatives, would it be useful for them to have genetic testing?”</p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Data Analysis Overview</title>
        <p>First, we examined narratives to assess “openness of communicating” genetic test results and cancer risk with relatives and with health care providers. Second, we categorized the text of each narrative as describing either a positive or negative sentiment toward experiences with genetic testing and health care services. Third, we examined whether demographic and clinical characteristics and sentiment, as expressed in the narrative, can predict “openness of communicating” genetic risk from tested individuals to relatives.</p>
      </sec>
      <sec>
        <title>NLP Model Development</title>
        <p>The ability of NLP to identify and predict different levels of “openness of communication” was evaluated following a multistep framework (<xref rid="figure1" ref-type="fig">Figure 1</xref>), which was divided into three phases: (1) preprocessing, (2) training, and (3) performance evaluation. All computations were performed in R software (version 3.6.3; R Foundation for Statistical Computing) [<xref ref-type="bibr" rid="ref33">33</xref>]. We have made our analysis publicly available through the Zenodo open data repository [<xref ref-type="bibr" rid="ref34">34</xref>].</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Phases of developing the natural language processing (NLP) algorithm: (1) preprocessing, (2) training, and (3) performance evaluation. LDA: latent Dirichlet analysis; POS: part of speech; TF-IDF: term frequency–inverse document frequency.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e38399_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Preprocessing Phase</title>
        <p>To start data processing, we broke down each text into individual tokens. We then applied functions to remove stop words and special characters. All texts were converted to lower case. We also applied part-of-speech tagging to extract phrases from the text corpus, used a latent Dirichlet allocation model to generate the most appropriate topics, and computed the term frequency–inverse document frequency to indicate the significance of a word in the text corpus [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>].</p>
        <sec>
          <title>Creation of a Lexicon and a Score for “Openness of Communication”</title>
          <p>To develop an “openness of communication” score, we built a lexicon containing words and phrases linked to communication (for example, <italic>“</italic>difficulties in communication” and <italic>“</italic>excellent communication<italic>”</italic>) and classified them as positive or negative. After completing the preprocessing phase, we extracted N-grams from the text corpus. N-grams refer to single words (unigrams) or a combination of 2 or 3 words (bigrams or trigrams) associated with the outcome of interest, ie, “openness of communication.” To further enrich the lexicon, we applied the same process in a US-based sample of 123 narratives related to experiences with HBOC genetic cancer risk. This database includes narrative data collected between January 2013 to September 2016 from women and men who are carriers of HBOC-associated variants [<xref ref-type="bibr" rid="ref26">26</xref>]. The semistructured interviews inquired about experiences with genetic counseling, genetic testing, and family communication patterns. We enriched the lexicon with supplementary words related to communication identified in an online thesaurus [<xref ref-type="bibr" rid="ref37">37</xref>]. The final lexicon we created contained 532 items (132 unigrams, 215 bigrams, and 185 trigrams). Two members of the research team independently created the scoring of N-grams in the lexicon as positive or negative without considering the context of the phrases in the interviews. Specifically, they evaluated each item on a 7-point scale on how favorable the items measure “openness of communication.” Scoring values ranged from –3 (extremely strong negative word related to communication) to +3 (extremely strong positive word related to communication). In cases of disagreement, the final value was calculated by averaging the 2 values given by the 2 raters rounding to the greater nearest integer. The final “openness of communication” score assigned to the transcript of each narrative was developed by matching N-grams to the lexicon and summing up the corresponding scores. To ensure the robustness of the above scoring process, we calculated the Pearson correlation coefficient between the “openness of communication” scores we created with the IRI overall score. This correlation was examined only on Swiss data because Korean IRI scores were not available at the time of this analysis.</p>
        </sec>
        <sec>
          <title>Sentiment Analysis and Attitude Toward Family Communication of Genetic Risk</title>
          <p>To categorize the text of each narrative as describing either a positive or negative attitude toward genetic testing and health care services and to capture the overall emotional valence of the narrative, we used 3 common lexicons for text sentiment analysis: AFINN, Bing Liu, and the National Research Council Canada (NRC) Emotion Lexicon. The AFINN lexicon contains words with a score between –5 and +5, with negative and positive scores indicating negative and positive sentiments, respectively [<xref ref-type="bibr" rid="ref38">38</xref>]. The Bing Liu lexicon classifies words into conveying a positive or a negative sentiment [<xref ref-type="bibr" rid="ref1">1</xref>]. The NRC Emotion Lexicon estimates a sentiment score (positive and negative sentiment) based on 8 emotions. Positive emotions include anticipation, joy, surprise, and trust, whereas negative emotions include anger, disgust, fear, and sadness [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. We also calculated an overall net sentiment expressed in each narrative, based on the difference between overall positive sentiment minus overall negative sentiment. An overall positive score meant that the individual expressed more positive sentiment in the narrative than negative, and vice versa.</p>
        </sec>
      </sec>
      <sec>
        <title>Training Phase</title>
        <p>For developing the model, the overall data set was split randomly, with 70% of data used in the training phase by using the “openness of communication” score as the dependent variable. To examine whether the demographic and clinical characteristics and sentiment features of each narrative predicted “openness of communication” scores, we used a linear regression model based on the following steps. Initially we performed a univariate analysis to identify those independent variables exhibiting more than 60% absolute correlation with one another. These variables were excluded to avoid multicollinearity. Then, we continued with a multivariate analysis using a stepwise linear regression to identify possible predictors of the dependent variable and remove nonsignificant independent variables. As an alternative model, we attempted to use an artificial neural network. We built a fully connected network with 1 hidden layer, 1 input and 1 output layer, and 5 neurons. Optimization was done through the Broyden-Fletcher-Goldfarb-Shanno method. Early stopping was utilized to avoid overfitting. However, we ended up discarding the artificial neural network from the analysis because it showed no improvement compared to the linear regression. Finally, the performance of the models was evaluated using the area under the curve (AUC), sensitivity, specificity, and root mean square error (RMSE).</p>
      </sec>
      <sec>
        <title>Testing Phase</title>
        <p>In this phase, we tested the model using the remaining 30% of the database (validation cohort). The performance of the models was evaluated using the same metrics as in the training phase, ie, AUC, sensitivity, specificity, and RMSE.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Description of the Sample</title>
        <p>Narrative and survey data from 53 individuals are included in this paper. Participants were aged 32-76 years. Most were female (47/53, 89%), married (41/53, 77%), and carriers of the familial pathogenic variant (51/53, 96%). Approximately 2 in 3 (32/53, 60%) had a prior diagnosis of cancer (<xref ref-type="table" rid="table1">Table 1</xref>). The Swiss and the Korean samples were not statistically different in respect to age (<italic>P</italic>=.71), prior cancer diagnosis (<italic>P</italic>=.38), educational level (<italic>P</italic>=.17), and employment status (<italic>P</italic>=.14).</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Sociodemographic and clinical data of participants (N=53).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="670"/>
            <col width="0"/>
            <col width="300"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Characteristic</td>
                <td>Value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Age (years), mean (SD)</td>
                <td>53.3 (12.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Sex, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">47 (89)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Education, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Attended elementary/high school</td>
                <td colspan="2">5 (9)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>High school graduate</td>
                <td colspan="2">14 (26)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Technical school graduate</td>
                <td colspan="2">13 (24)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>University degree/postgraduate degree</td>
                <td colspan="2">21 (40)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Marital status, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Married/living as married</td>
                <td colspan="2">41 (77)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Single</td>
                <td colspan="2">4 (8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td> Divorced/separated/widowed</td>
                <td colspan="2">8 (15)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">Employed full or part time (yes), n (%)</td>
                <td>34 (64)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Cancer status, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Previous cancer, one or more diagnoses</td>
                <td colspan="2">32 (60)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Never been diagnosed with cancer</td>
                <td colspan="2">21 (40)</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Genetic test result, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Positive for the familial pathogenic variant</td>
                <td colspan="2">51 (96)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Negative for the familial pathogenic variant</td>
                <td colspan="2">2 (4)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Description of the “Openness of Communication” Score and the Narrative Data</title>
        <p>The average “openness of communication” score was 29.8 (SD 19.5; range –9 to 76), indicating an overall trend toward open communication. Narratives from these 53 individuals included 5837 unique unigrams, 4183 bigrams, and 654 trigrams. The most frequently appearing nontrivial words are shown in <xref rid="figure2" ref-type="fig">Figure 2</xref>. Based on the NRC Emotion Lexicon, the 10 most common positive words were “time,” “true,” “children,” “talk,” “finally,” “information,” “positive,” “doctor,” “understand,” and “daughter”. The 10 most common negative words were “cancer,” “sick,” “feel,” “risk,” “negative,” “died,” “difficult,” “fear,” “disease,” and “bad.”</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>The most frequent words identified in narratives.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e38399_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Validating the Relationship of “Openness of Communication” scores with IRI</title>
        <p>The correlation coefficient between the “openness of communication” score and IRI in the Swiss data was <italic>r</italic>=0.46, indicating a moderate positive correlation.</p>
      </sec>
      <sec>
        <title>Attitude Toward Genetic Testing and Health Care Services</title>
        <p>Attitude toward genetic testing and health care services varied among participants, but it was overall positive. “Trust” appeared as the strongest positive emotion, whereas “fear” and “sadness” appeared as the strongest negative emotions in the text corpus based on the NRC Emotion Lexicon. The least perceived emotions were “surprise” and “anger.” <xref rid="figure3" ref-type="fig">Figure 3</xref> describes the frequencies of words identified in the corpus for each emotion.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Frequencies of words identified for each emotion (anger, anticipation, disgust, fear, joy, sadness, surprise, and trust) based on the National Research Council Canada Emotion Lexicon.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e38399_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Prediction of “Openness of Communication” Score</title>
        <p>The <italic>R</italic>² for the overall model was 0.87 (adjusted <italic>R</italic>²=0.85; <italic>P</italic>&#60;.001). A stepwise linear regression identified 5 significant predictors of “openness of communication” score, ie, the overall net sentiment of the narrative and fear, which were obtained based on the NRC Emotion Lexicon; informational support among family members; educational level; and being single (<xref ref-type="table" rid="table2">Table 2</xref>). Specifically, findings showed that both the higher overall net sentiment score of the narrative (<italic>P</italic>=.007) and also greater fear (<italic>P=</italic>1.97 × 10<sup>–5</sup>) were strongly associated with higher “openness of communication” scores. There was a positive correlation between “openness of communication” score and the statement “In our family when I have a health problem there is great willingness to share information with each other” (<italic>P</italic>=.005). Participants with nonacademic education were also more likely to communicate genetic risk with their relatives (<italic>P</italic>=.02). Lastly, there was a positive correlation between being single and “openness of communication” scores (<italic>P</italic>=.047).</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Results of the linear regression analysis predicting “openness of communication.”</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="130"/>
            <col width="100"/>
            <col width="160"/>
            <col width="110"/>
            <thead>
              <tr valign="bottom">
                <td>Variables</td>
                <td>Estimate</td>
                <td>SE</td>
                <td><italic>t</italic> test<sup>a</sup> (<italic>df</italic>)</td>
                <td><italic>P</italic> value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Being single</td>
                <td>19.782</td>
                <td>9.574</td>
                <td>2.066 (1)</td>
                <td>.047<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Academic education</td>
                <td>–10.387</td>
                <td>4.256</td>
                <td>–2.44 (1)</td>
                <td>.02<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>Fear</td>
                <td>0.204</td>
                <td>0.041</td>
                <td>4.954 (1)</td>
                <td>1.97 × 10<sup>–5c</sup></td>
              </tr>
              <tr valign="top">
                <td>Informational support</td>
                <td>11.392</td>
                <td>3.790</td>
                <td>3.006 (1)</td>
                <td>.005<sup>d</sup></td>
              </tr>
              <tr valign="top">
                <td>Net sentiment score of the narrative</td>
                <td>0.260</td>
                <td>0.091</td>
                <td>2.861 (1)</td>
                <td>.007<sup>d</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>2-tailed <italic>t</italic> test.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Significance level: <italic>P</italic>&#60;.05.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>Significance level: <italic>P</italic>&#60;.001.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>Significance level: <italic>P</italic>&#60;.01.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Model Performance</title>
        <p>The predictive accuracy of the model using a stepwise linear regression for the training and testing data sets reached 0.85 (AUC=0.92, specificity=0.86, and sensitivity=0.82) and 0.72 (AUC=0.69, specificity=0.62, and sensitivity=0.83), respectively. <xref rid="figure4" ref-type="fig">Figure 4</xref> presents the receiver operating characteristic curves that visualize the accuracy improvement between the training and testing data sets applying linear regression.</p>
        <p>The predicted values are plotted against the target values and are shown on a scatter plot for the linear regression model (<xref rid="figure5" ref-type="fig">Figure 5</xref>). The linear regression model achieved RMSEs of 11.76 (training data set) and 16.04 (testing data set). In this case, our model performs more accurately when it yields lower values of RSME.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Receiver operating characteristic (ROC) curves of the training (A) and testing (B) model predicting “openness of communication” applying linear regression. AUC: area under the curve.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e38399_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Scatter plot of predicted values against target values with 95% confidence and prediction intervals for the training (A) and testing (B) data sets applying linear regression.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e38399_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We analyzed 53 narratives regarding intrafamilial communication of genetic cancer risk associated with HBOC. NLP enabled the analysis of unstructured narratives from different languages and identified the most frequently used words or combination of words describing openness in family communication of genetic cancer risk. This was the first study in which we applied NLP and sentiment analysis to better understand factors driving open intrafamilial communication regarding genetic cancer risk. Our findings showed that sentiment plays a crucial role and that emotions are a pervasive feature that predict intrafamilial communication in this particular population. Sentiment analysis performed on all interviews provided scores demonstrating positive or negative emotional valence, which were highly predictive of the direction of intrafamilial communication in this context. The higher overall net sentiment scores predicted greater openness in intrafamilial communication, whereas the lower overall net sentiment scores predicted closed or absent communication. This finding provides insights consistent with social penetration theory related to self-disclosure of carrying a cancer-causing genetic variant [<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. The depth of self-disclosure, ie, the degree to which the individual reveals personal and private information involving unusual traits and painful memories, reflects the degree of intimacy of a relationship. In the context of HBOC intrafamilial communication, self-disclosure of personal genetic information may be opposed by the desire to retain privacy and to avoid creating uncertainty and unpredictability in interpersonal relationships. Anticipating future negative emotions, such as regret or conflict, categorizes genetic risk information as a considerable emotional threat [<xref ref-type="bibr" rid="ref43">43</xref>]. This finding was captured in our analysis as the overall net sentiment of each narrative, and its predictive value was confirmed based on the performance of our models. Taken together, findings indicate that sentiment can be used to frame genetic cancer risk as an opportunity for proactive risk reduction and for enhancing technology-mediated HBOC intrafamilial communication.</p>
        <p>Our linear regression model explained more than 80% of the variance in openness of communication and achieved good performance in both the training and the testing samples. Our findings show that NLP was highly accurate in analyzing unstructured narratives from individuals of different cultural and linguistic backgrounds (Swiss German, French, Italian, English, and Korean) and in quantifying openness of communication in intrafamilial discussions about genetic cancer risk. The “openness of communication” scores were also validated against IRI. IRI was developed on the premise that increased genetic knowledge, positive motivation, and increased self-efficacy are prerequisites of increased intention to inform relatives about genetic risk. Although “intention to inform relatives” is closely related to “openness of communicating genetic risk,” the 2 concepts are not identical, which was also confirmed in our data with a moderate positive correlation between the 2 scores. An individual may have high intention to inform relatives about their genetic risk despite difficulties in communication within their family.</p>
        <p>Creating a new lexicon for openness in communication enriched with terms from different sources contributes to the innovation of our approach and the generalizability and applicability of our findings. Our lexicon can be further used and expanded in future projects, providing a solid foundation for the use of NLP in the growing field of research in interpersonal communication, focusing on family communication and health care and technology-mediated communication [<xref ref-type="bibr" rid="ref44">44</xref>]. Sentiment analysis can be further utilized in the era of precision medicine and precision public health for message tailoring and message framing. Extracting sentiment polarities can be highly informative in improving consumer experiences when using digital health platforms in promoting precision public health campaigns. For example, trust in the health care system has been associated with use of cancer surveillance, whereas conflicting messages from providers create a sense of disorientation and mistrust [<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref48">48</xref>].</p>
        <p>Our findings also indicated a greater likelihood of open intrafamilial communication in those who were single, had a nonacademic education, and higher informational support within their family network. These findings should be interpreted with caution and should be replicated with analyses of narratives from larger, and possibly more diverse, samples.</p>
      </sec>
      <sec>
        <title>Strengths and Limitations</title>
        <p>Studies in different domains have also considered sentiment for analyzing textual communication in social media such as Twitter or Facebook [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. However, one significant strength of our approach was that narrative data were combined with the demographic and clinical characteristics of participants, which can increase the applicability of findings. Another important strength was the use of several sentiment lexicons to select the most suitable for this context. Sentiment scores originating from the NRC Emotion Lexicon were the most appropriate to predict “openness of communication,” whereas the other 2 sentiment lexicons (AFINN and Bing Liu) were highly correlated, resulting in a predictive algorithm of lesser importance. Studies have shown that the selection of inappropriate lexicons may impact prediction performance [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>]. Finally, NLP can automate parts of text analysis and can be used as an assisting tool to help researchers navigate through large volumes of text data.</p>
        <p>One limitation of our study was the small sample size and the size of the available corpus, which did not allow us to include possible significant covariates and to fully explore the potential of the NLP methodology, including sentence structure and length of words. Despite this limitation, the results of our study can be used as indicators of various narrative features, such as overall sentiment and fear, which can be important predictors of interpersonal communication and self-disclosure in this specific population. Important features of NLP analysis, such as sentence structure and length of words, can be investigated with a larger number of narratives and larger number of corpora. The analytical approach we describe in this paper can be further improved by using larger samples. Further development of a robust model will advance a more precise assessment and reach higher accuracy.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We demonstrate how various features from narratives can be used to predict “openness of communication” in individuals carrying a pathogenic variant connected to HBOC. Although our methodology requires further exploration and our findings require replication with larger samples, this is an important first step to understand how individuals and the public may react in discourses involving communication of genetic cancer risk. Overall, this experimental analysis provides evidence that our approach is promising and can be further used in the field of technology-mediated communication and precision public health.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC</term>
          <def>
            <p>area under the curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">HBOC</term>
          <def>
            <p>hereditary breast and ovarian cancer</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">IRI</term>
          <def>
            <p>Informing Relatives Inventory</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LS</term>
          <def>
            <p>Lynch syndrome</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">NRC</term>
          <def>
            <p>National Research Council Canada</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">RMSE</term>
          <def>
            <p>root mean square error</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We would like to thank Monica Aceti, PhD; Andrea Kaiser-Grolimund, PhD; and Carla Pedrazzani, MSc; and the recruitment team of K-CASCADE and the CASCADE Consortia for their valuable help regarding data collection and ongoing recruitment. This research was supported by the Swiss Cancer League (KLS-4294-08-2017); Swiss Cancer Research Foundation (KFS-5293-02-2021); DIALOGUE (IZKSZ3_188408/1); and the University of Basel, Office of the Vice Rector of Research (2016) to MCK.</p>
      <p>The members of the CASCADE Consortium are Monica Aceti, Souria Aissaoui, Nicole Bürki, Pierre O Chappuis, Muriel Fluri, Rossella Graffeo-Galbiati, Karl Heinimann, Viola Heinzelmann-Schwarz, Helen Koechlin, Christian Kurzeder, Ashley Machen, Christian Monnerat, Carla Pedrazzani, Nicole Probst-Hensch, Manuela Rabaglio, Simon Wieser and Ursina Zürrer-Härdi.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>VB, RCGP, GL, and MCK contributed to conceptualization. VB, RCGP, RS, and MCK contributed to methodology. VB contributed to formal analysis and visualization. VB and MCK contributed to writing—original draft preparation. VB, RCGP, SK, RS, SHB, MCZ, GL, FC, and MCK contributed to writing—review and editing. MCK contributed to supervision. All authors have read and agreed to the published version of the manuscript.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Mining and summarizing customer reviews</article-title>
          <year>2004</year>
          <month>08</month>
          <day>22</day>
          <conf-name>KDD '04: tenth ACM SIGKDD international conference on Knowledge discovery and data mining</conf-name>
          <conf-date>August 22-25, 2004</conf-date>
          <conf-loc>Seattle, WA</conf-loc>
          <fpage>168</fpage>
          <lpage>177</lpage>
          <pub-id pub-id-type="doi">10.1145/1014052.1014073</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pang</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Opinion mining and sentiment analysis</article-title>
          <source>Foundations and Trends in Information Retrieval</source>
          <year>2008</year>
          <month>07</month>
          <day>07</day>
          <volume>2</volume>
          <issue>1–2</issue>
          <fpage>1</fpage>
          <lpage>135</lpage>
          <pub-id pub-id-type="doi">10.1561/1500000011</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Solangi</surname>
              <given-names>YA</given-names>
            </name>
            <name name-style="western">
              <surname>Solangi</surname>
              <given-names>ZA</given-names>
            </name>
            <name name-style="western">
              <surname>Aarain</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Abro</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mallah</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Review on natural language processing (NLP) and its toolkits for opinion mining and sentiment analysis</article-title>
          <year>2018</year>
          <conf-name>2018 IEEE 5th International Conference on Engineering Technologies and Applied Sciences (ICETAS)</conf-name>
          <conf-date>November 22-23, 2018</conf-date>
          <conf-loc>Bangkok, Thailand</conf-loc>
          <fpage>1</fpage>
          <lpage>4</lpage>
          <pub-id pub-id-type="doi">10.1109/icetas.2018.8629198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kastrati</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Dalipi</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Imran</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Pireva Nuci</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wani</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Sentiment analysis of students’ feedback with NLP and deep learning: a systematic mapping study</article-title>
          <source>Appl Sci</source>
          <year>2021</year>
          <month>04</month>
          <day>28</day>
          <volume>11</volume>
          <issue>9</issue>
          <fpage>3986</fpage>
          <pub-id pub-id-type="doi">10.3390/app11093986</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaur</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ahsaan</surname>
              <given-names>SU</given-names>
            </name>
            <name name-style="western">
              <surname>Alankar</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>A proposed sentiment analysis deep learning algorithm for analyzing COVID-19 tweets</article-title>
          <source>Inf Syst Front</source>
          <year>2021</year>
          <month>04</month>
          <day>20</day>
          <volume>23</volume>
          <issue>6</issue>
          <fpage>1417</fpage>
          <lpage>1429</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33897274"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10796-021-10135-7</pub-id>
          <pub-id pub-id-type="medline">33897274</pub-id>
          <pub-id pub-id-type="pii">10135</pub-id>
          <pub-id pub-id-type="pmcid">PMC8057010</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Manguri</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Ramadhan</surname>
              <given-names>RN</given-names>
            </name>
            <name name-style="western">
              <surname>Mohammed Amin</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Twitter sentiment analysis on worldwide COVID-19 outbreaks</article-title>
          <source>Kurdistan Journal of Applied Research</source>
          <year>2020</year>
          <month>05</month>
          <day>19</day>
          <volume>5</volume>
          <issue>3</issue>
          <fpage>54</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.24017/covid.8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mishev</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Gjorgjevikj</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Stojanov</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mishkovski</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Vodenska</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Chitkushev</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Performance evaluation of word and sentence embeddings for finance headlines sentiment analysis</article-title>
          <year>2019</year>
          <month>10</month>
          <day>14</day>
          <conf-name>Performance evaluation of word and sentence embeddings for finance headlines sentiment analysis. International Conference on ICT Innovations; : Springer</conf-name>
          <conf-date>October 17-19, 2019</conf-date>
          <conf-loc>Ohrid, North Macedonia</conf-loc>
          <fpage>161</fpage>
          <lpage>172</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-030-33110-8_14</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Petropoulos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Siakoulis</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Can central bank speeches predict financial market turbulence? evidence from an adaptive NLP sentiment index analysis using XGBoost machine learning technique</article-title>
          <source>Central Bank Review</source>
          <year>2021</year>
          <month>12</month>
          <volume>21</volume>
          <issue>4</issue>
          <fpage>141</fpage>
          <lpage>153</lpage>
          <pub-id pub-id-type="doi">10.1016/j.cbrev.2021.12.002</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paltoglou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Thelwall</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Twitter, MySpace, Digg: unsupervised sentiment analysis in social media</article-title>
          <source>ACM Trans Intell Syst Technol</source>
          <year>2012</year>
          <month>09</month>
          <volume>3</volume>
          <issue>4</issue>
          <fpage>1</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1145/2337542.2337551</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bhaskar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Sruthi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nedungadi</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Enhanced sentiment analysis of informal textual communication in social media by considering objective words and intensifiers</article-title>
          <year>2014</year>
          <conf-name>nternational Conference on Recent Advances and Innovations in Engineering (ICRAIE-2014)</conf-name>
          <conf-date>May 9-11, 2014</conf-date>
          <conf-loc>Jaipur, India</conf-loc>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1109/icraie.2014.6909220</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sailunaz</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Alhajj</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Emotion and sentiment analysis from Twitter text</article-title>
          <source>J Comput Sci</source>
          <year>2019</year>
          <month>09</month>
          <volume>36</volume>
          <fpage>101003</fpage>
          <pub-id pub-id-type="doi">10.1016/j.jocs.2019.05.009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chi</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Examining patterns of information exchange and social support in a web-based health community: exponential random graph models</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>09</month>
          <day>29</day>
          <volume>22</volume>
          <issue>9</issue>
          <fpage>e18062</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/9/e18062/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18062</pub-id>
          <pub-id pub-id-type="medline">32990628</pub-id>
          <pub-id pub-id-type="pii">v22i9e18062</pub-id>
          <pub-id pub-id-type="pmcid">PMC7556372</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Understanding health care social media use from different stakeholder perspectives: a content analysis of an online health community</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>04</month>
          <day>07</day>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>e109</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/4/e109/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7087</pub-id>
          <pub-id pub-id-type="medline">28389418</pub-id>
          <pub-id pub-id-type="pii">v19i4e109</pub-id>
          <pub-id pub-id-type="pmcid">PMC5400888</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cabling</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Hurtado-de-Mendoza</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Drago</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Sheppard</surname>
              <given-names>VB</given-names>
            </name>
          </person-group>
          <article-title>Sentiment analysis of an online breast cancer support group: communicating about Tamoxifen</article-title>
          <source>Health Commun</source>
          <year>2018</year>
          <month>09</month>
          <volume>33</volume>
          <issue>9</issue>
          <fpage>1158</fpage>
          <lpage>1165</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28678549"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10410236.2017.1339370</pub-id>
          <pub-id pub-id-type="medline">28678549</pub-id>
          <pub-id pub-id-type="pmcid">PMC6077266</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Salloum</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prosperi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Du</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez-Diaz</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Using social media data to understand the impact of promotional information on laypeople's discussions: a case study of Lynch syndrome</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>12</month>
          <day>13</day>
          <volume>19</volume>
          <issue>12</issue>
          <fpage>e414</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/12/e414/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.9266</pub-id>
          <pub-id pub-id-type="medline">29237586</pub-id>
          <pub-id pub-id-type="pii">v19i12e414</pub-id>
          <pub-id pub-id-type="pmcid">PMC5745354</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hyun</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>SB</given-names>
            </name>
            <name name-style="western">
              <surname>Bakken</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Exploring the ability of natural language processing to extract data from nursing narratives</article-title>
          <source>Comput Inform Nurs</source>
          <year>2009</year>
          <volume>27</volume>
          <issue>4</issue>
          <fpage>215</fpage>
          <lpage>23; quiz 224</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/19574746"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/NCN.0b013e3181a91b58</pub-id>
          <pub-id pub-id-type="medline">19574746</pub-id>
          <pub-id pub-id-type="pii">00024665-200907000-00005</pub-id>
          <pub-id pub-id-type="pmcid">PMC4415266</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cammel</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>de Vos</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>van Soest</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hettne</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Boer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Steyerberg</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Boosman</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>How to automatically turn patient experience free-text responses into actionable insights: a natural language programming (NLP) approach</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2020</year>
          <month>05</month>
          <day>27</day>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>97</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-020-1104-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-020-1104-5</pub-id>
          <pub-id pub-id-type="medline">32460734</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-020-1104-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7251822</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vehviläinen-Julkunen</surname>
              <given-names>Katri</given-names>
            </name>
            <name name-style="western">
              <surname>Turpeinen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kvist</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ryden-Kortelainen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nelimarkka</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Enshaeifar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Faithfull</surname>
              <given-names>S</given-names>
            </name>
            <collab>INEXCA Consortium</collab>
          </person-group>
          <article-title>Experience of ambulatory cancer care: understanding patients' perspectives of quality using sentiment analysis</article-title>
          <source>Cancer Nurs</source>
          <year>2021</year>
          <volume>44</volume>
          <issue>6</issue>
          <fpage>E331</fpage>
          <lpage>E338</lpage>
          <pub-id pub-id-type="doi">10.1097/NCC.0000000000000845</pub-id>
          <pub-id pub-id-type="medline">32618620</pub-id>
          <pub-id pub-id-type="pii">00002820-202111000-00013</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cox</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Romeu</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>MW</given-names>
            </name>
          </person-group>
          <article-title>Predicting changes in substance use following psychedelic experiences: natural language processing of psychedelic session narratives</article-title>
          <source>Am J Drug Alcohol Abuse</source>
          <year>2021</year>
          <month>07</month>
          <day>04</day>
          <volume>47</volume>
          <issue>4</issue>
          <fpage>444</fpage>
          <lpage>454</lpage>
          <pub-id pub-id-type="doi">10.1080/00952990.2021.1910830</pub-id>
          <pub-id pub-id-type="medline">34096403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Badal</surname>
              <given-names>VD</given-names>
            </name>
            <name name-style="western">
              <surname>Graham</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Depp</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Shinkawa</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yamada</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Palinkas</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Jeste</surname>
              <given-names>DV</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>EE</given-names>
            </name>
          </person-group>
          <article-title>Prediction of loneliness in older adults using natural language processing: exploring sex differences in speech</article-title>
          <source>Am J Geriatr Psychiatry</source>
          <year>2021</year>
          <month>08</month>
          <volume>29</volume>
          <issue>8</issue>
          <fpage>853</fpage>
          <lpage>866</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33039266"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jagp.2020.09.009</pub-id>
          <pub-id pub-id-type="medline">33039266</pub-id>
          <pub-id pub-id-type="pii">S1064-7481(20)30479-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7486862</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schwiter</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rahm</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Sturm</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>How can we reach at-risk relatives? efforts to enhance communication and cascade testing uptake: a mini-review</article-title>
          <source>Curr Genet Med Rep</source>
          <year>2018</year>
          <month>4</month>
          <day>19</day>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>21</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1007/s40142-018-0134-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ignatius</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kokkonen</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Factors contributing to verbal self-disclosure</article-title>
          <source>Nord Psychol</source>
          <year>2012</year>
          <month>07</month>
          <day>11</day>
          <volume>59</volume>
          <issue>4</issue>
          <fpage>362</fpage>
          <lpage>391</lpage>
          <pub-id pub-id-type="doi">10.1027/1901-2276.59.4.362</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baxter</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Braithwaite</surname>
              <given-names>DO</given-names>
            </name>
          </person-group>
          <article-title>Relational dialectics theory: crafting meaning from competing discourses</article-title>
          <source>Engaging Theories in Interpersonal Communication: Multiple Perspectives</source>
          <year>2008</year>
          <publisher-loc>Thousand Oaks, CA</publisher-loc>
          <publisher-name>SAGE Publications</publisher-name>
          <fpage>01</fpage>
          <lpage>61</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Braithwaite</surname>
              <given-names>DO</given-names>
            </name>
          </person-group>
          <source>Engaging Theories in Interpersonal Communication: Multiple Perspectives</source>
          <year>2005</year>
          <publisher-loc>Thousand Oaks, CA</publisher-loc>
          <publisher-name>SAGE Publications</publisher-name>
          <fpage>349</fpage>
          <lpage>362</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tezak</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pierce</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Weidner</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Clouse</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pal</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cragun</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Sharing genetic test results with family members of BRCA, PALB2, CHEK2, and ATM carriers</article-title>
          <source>Patient Educ Couns</source>
          <year>2021</year>
          <month>04</month>
          <volume>104</volume>
          <issue>4</issue>
          <fpage>720</fpage>
          <lpage>725</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33455826"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.pec.2020.12.019</pub-id>
          <pub-id pub-id-type="medline">33455826</pub-id>
          <pub-id pub-id-type="pii">S0738-3991(20)30683-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8005459</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dwyer</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Hesse-Biber</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Flynn</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Remick</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Parent of origin effects on family communication of risk in BRCA+ women: a qualitative investigation of human factors in cascade screening</article-title>
          <source>Cancers (Basel)</source>
          <year>2020</year>
          <month>08</month>
          <day>17</day>
          <volume>12</volume>
          <issue>8</issue>
          <fpage>2316</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=cancers12082316"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/cancers12082316</pub-id>
          <pub-id pub-id-type="medline">32824510</pub-id>
          <pub-id pub-id-type="pii">cancers12082316</pub-id>
          <pub-id pub-id-type="pmcid">PMC7464326</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahdavi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nassiri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kooshyar</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Vakili-Azghandi</surname>
              <given-names>Masoume</given-names>
            </name>
            <name name-style="western">
              <surname>Avan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sandry</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pillai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Gopalan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Hereditary breast cancer; genetic penetrance and current status with BRCA</article-title>
          <source>J Cell Physiol</source>
          <year>2019</year>
          <month>05</month>
          <day>14</day>
          <volume>234</volume>
          <issue>5</issue>
          <fpage>5741</fpage>
          <lpage>5750</lpage>
          <pub-id pub-id-type="doi">10.1002/jcp.27464</pub-id>
          <pub-id pub-id-type="medline">30552672</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chivers Seymour</surname>
              <given-names>Kim</given-names>
            </name>
            <name name-style="western">
              <surname>Addington-Hall</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lucassen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Foster</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>What facilitates or impedes family communication following genetic testing for cancer risk? A systematic review and meta-synthesis of primary qualitative research</article-title>
          <source>J Genet Couns</source>
          <year>2010</year>
          <month>08</month>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>330</fpage>
          <lpage>42</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1007/s10897-010-9296-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s10897-010-9296-y</pub-id>
          <pub-id pub-id-type="medline">20379768</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Srinivasan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Won</surname>
              <given-names>NY</given-names>
            </name>
            <name name-style="western">
              <surname>Dotson</surname>
              <given-names>WD</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>MC</given-names>
            </name>
          </person-group>
          <article-title>Barriers and facilitators for cascade testing in genetic conditions: a systematic review</article-title>
          <source>Eur J Hum Genet</source>
          <year>2020</year>
          <month>12</month>
          <volume>28</volume>
          <issue>12</issue>
          <fpage>1631</fpage>
          <lpage>1644</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32948847"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41431-020-00725-5</pub-id>
          <pub-id pub-id-type="medline">32948847</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41431-020-00725-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC7784694</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Katapodi</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Viassolo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Caiata-Zufferey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nikolaidis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bührer-Landolt</surname>
              <given-names>Rosmarie</given-names>
            </name>
            <name name-style="western">
              <surname>Buerki</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Graffeo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Horváth</surname>
              <given-names>Henrik Csaba</given-names>
            </name>
            <name name-style="western">
              <surname>Kurzeder</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rabaglio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Scharfe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Urech</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Erlanger</surname>
              <given-names>TE</given-names>
            </name>
            <name name-style="western">
              <surname>Probst-Hensch</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Heinimann</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Heinzelmann-Schwarz</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Pagani</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Chappuis</surname>
              <given-names>PO</given-names>
            </name>
          </person-group>
          <article-title>Cancer predisposition cascade screening for hereditary breast/ovarian cancer and Lynch syndromes in Switzerland: study protocol</article-title>
          <source>JMIR Res Protoc</source>
          <year>2017</year>
          <month>09</month>
          <day>20</day>
          <volume>6</volume>
          <issue>9</issue>
          <fpage>e184</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://boris.unibe.ch/id/eprint/111491"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/resprot.8138</pub-id>
          <pub-id pub-id-type="medline">28931501</pub-id>
          <pub-id pub-id-type="pii">v6i9e184</pub-id>
          <pub-id pub-id-type="pmcid">PMC5628286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aceti</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baroutsou</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bürki</surname>
              <given-names>Nicole</given-names>
            </name>
            <name name-style="western">
              <surname>Caiata-Zufferey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cattaneo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chappuis</surname>
              <given-names>PO</given-names>
            </name>
            <name name-style="western">
              <surname>Ciorba</surname>
              <given-names>FM</given-names>
            </name>
            <name name-style="western">
              <surname>Graffeo-Galbiati</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Heinzelmann-Schwarz</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Jeong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jung</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Ming</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Monnerat</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Pedrazzani</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Rabaglio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Saccilotto</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wieser</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zürrer-Härdi</surname>
              <given-names>Ursina</given-names>
            </name>
            <name name-style="western">
              <surname>Katapodi</surname>
              <given-names>MC</given-names>
            </name>
          </person-group>
          <article-title>Using a tailored digital health intervention for family communication and cascade genetic testing in Swiss and Korean families with hereditary breast and ovarian cancer: protocol for the DIALOGUE study</article-title>
          <source>JMIR Res Protoc</source>
          <year>2021</year>
          <month>06</month>
          <day>11</day>
          <volume>10</volume>
          <issue>6</issue>
          <fpage>e26264</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://boris.unibe.ch/id/eprint/159245"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26264</pub-id>
          <pub-id pub-id-type="medline">34114954</pub-id>
          <pub-id pub-id-type="pii">v10i6e26264</pub-id>
          <pub-id pub-id-type="pmcid">PMC8235289</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>de Geus</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Aalfs</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Menko</surname>
              <given-names>FH</given-names>
            </name>
            <name name-style="western">
              <surname>Sijmons</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Verdam</surname>
              <given-names>MGE</given-names>
            </name>
            <name name-style="western">
              <surname>de Haes</surname>
              <given-names>HCJM</given-names>
            </name>
            <name name-style="western">
              <surname>Smets</surname>
              <given-names>EMA</given-names>
            </name>
          </person-group>
          <article-title>Development of the Informing Relatives Inventory (IRI): assessing index patients' knowledge, motivation and self-efficacy regarding the disclosure of hereditary cancer risk information to relatives</article-title>
          <source>Int J Behav Med</source>
          <year>2015</year>
          <month>08</month>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>551</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1007/s12529-014-9455-x</pub-id>
          <pub-id pub-id-type="medline">25515913</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>R Core Team</collab>
          </person-group>
          <article-title>R: a language and environment for statistical computing</article-title>
          <source>The R Project for Statistical Computing</source>
          <access-date>2022-12-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.r-project.org/">https://www.r-project.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Baroutsou</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Analysis code for the paper "predicting openness of communication in families with hereditary breast and ovarian cancer syndrome: natural language processing analysis"</article-title>
          <source>Zenodo</source>
          <year>2022</year>
          <month>05</month>
          <day>04</day>
          <access-date>2022-12-22</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.5281/zenodo.6517726">https://doi.org/10.5281/zenodo.6517726</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <month>03</month>
          <day>01</day>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmlr.org/papers/volume3/blei03a/blei03a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aizawa</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>An information-theoretic perspective of tf–idf measures</article-title>
          <source>Information Processing &#38; Management</source>
          <year>2003</year>
          <month>1</month>
          <volume>39</volume>
          <issue>1</issue>
          <fpage>45</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1016/S0306-4573(02)00021-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="web">
          <source>Power Thesaurus</source>
          <access-date>2021-12-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.powerthesaurus.org/">https://www.powerthesaurus.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nielsen</surname>
              <given-names>FÅ</given-names>
            </name>
          </person-group>
          <article-title>A new ANEW: evaluation of a word list for sentiment analysis in microblogs</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on March 15, 2011</comment>
          <pub-id pub-id-type="doi">10.48550/arXiv.1103.2903</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohammad</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Turney</surname>
              <given-names>PD</given-names>
            </name>
          </person-group>
          <article-title>Crowdsourcing a word-emotion association lexicon</article-title>
          <source>Comput Intell</source>
          <year>2013</year>
          <month>08</month>
          <volume>29</volume>
          <issue>3</issue>
          <fpage>436</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1467-8640.2012.00460.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mohammad</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Turney</surname>
              <given-names>PD</given-names>
            </name>
          </person-group>
          <article-title>Emotions evoked by common words and phrases: using mechanical turk to create an emotion lexicon</article-title>
          <year>2010</year>
          <month>06</month>
          <conf-name>NAACL HLT 2010 Workshop on Computational Approaches to Analysis and Generation of Emotion in Text</conf-name>
          <conf-date>June 5, 2010</conf-date>
          <conf-loc>Los Angeles, CA</conf-loc>
          <fpage>26</fpage>
          <lpage>34</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carpenter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Greene</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Social penetration theory</article-title>
          <source>The International Encyclopedia of Interpersonal Communication</source>
          <year>2015</year>
          <month>12</month>
          <day>01</day>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>John Wiley &#38; Sons</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Masaviru</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Self-disclosure: theories and model review</article-title>
          <source>Journal of Culture, Society and Development</source>
          <year>2016</year>
          <volume>18</volume>
          <fpage>43</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://core.ac.uk/download/pdf/234691127.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wöhlke</surname>
              <given-names>Sabine</given-names>
            </name>
            <name name-style="western">
              <surname>Schaper</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Schicktanz</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>How uncertainty influences lay people's attitudes and risk perceptions concerning predictive genetic testing and risk communication</article-title>
          <source>Front Genet</source>
          <year>2019</year>
          <month>04</month>
          <day>26</day>
          <volume>10</volume>
          <fpage>380</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31080458"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fgene.2019.00380</pub-id>
          <pub-id pub-id-type="medline">31080458</pub-id>
          <pub-id pub-id-type="pmcid">PMC6497735</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caughlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Koerner</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Schrodt</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzpatrick</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Knapp</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Daly</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Interpersonal communication in family relationships</article-title>
          <source>The Sage Handbook of Interpersonal Communication. 4th ed</source>
          <year>2011</year>
          <publisher-loc>Thousand Oaks, CA</publisher-loc>
          <publisher-name>SAGE Publications</publisher-name>
          <fpage>679</fpage>
          <lpage>714</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caiata-Zufferey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pagani</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Cina</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Membrez</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Taborelli</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Monnerat</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Chappuis</surname>
              <given-names>PO</given-names>
            </name>
          </person-group>
          <article-title>Challenges in managing genetic cancer risk: a long-term qualitative study of unaffected women carrying BRCA1/BRCA2 mutations</article-title>
          <source>Genet Med</source>
          <year>2015</year>
          <month>09</month>
          <volume>17</volume>
          <issue>9</issue>
          <fpage>726</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1098-3600(21)03211-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/gim.2014.183</pub-id>
          <pub-id pub-id-type="medline">25503500</pub-id>
          <pub-id pub-id-type="pii">S1098-3600(21)03211-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Rauscher</surname>
              <given-names>GH</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Strenski</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Ferrans</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Warnecke</surname>
              <given-names>RB</given-names>
            </name>
          </person-group>
          <article-title>The import of trust in regular providers to trust in cancer physicians among White, African American, and Hispanic breast cancer patients</article-title>
          <source>J Gen Intern Med</source>
          <year>2011</year>
          <month>01</month>
          <volume>26</volume>
          <issue>1</issue>
          <fpage>51</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20811783"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11606-010-1489-4</pub-id>
          <pub-id pub-id-type="medline">20811783</pub-id>
          <pub-id pub-id-type="pmcid">PMC3024096</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Katapodi</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Pierce</surname>
              <given-names>PF</given-names>
            </name>
            <name name-style="western">
              <surname>Facione</surname>
              <given-names>NC</given-names>
            </name>
          </person-group>
          <article-title>Distrust, predisposition to use health services and breast cancer screening: results from a multicultural community-based survey</article-title>
          <source>Int J Nurs Stud</source>
          <year>2010</year>
          <month>08</month>
          <volume>47</volume>
          <issue>8</issue>
          <fpage>975</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="doi">10.1016/j.ijnurstu.2009.12.014</pub-id>
          <pub-id pub-id-type="medline">20089252</pub-id>
          <pub-id pub-id-type="pii">S0020-7489(09)00406-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kenen</surname>
              <given-names>RH</given-names>
            </name>
            <name name-style="western">
              <surname>Shapiro</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Friedman</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Coyne</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Peer-support in coping with medical uncertainty: discussion of oophorectomy and hormone replacement therapy on a web-based message board</article-title>
          <source>Psychooncology</source>
          <year>2007</year>
          <month>08</month>
          <volume>16</volume>
          <issue>8</issue>
          <fpage>763</fpage>
          <lpage>71</lpage>
          <pub-id pub-id-type="doi">10.1002/pon.1152</pub-id>
          <pub-id pub-id-type="medline">17230435</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
