<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e48534</article-id>
      <article-id pub-id-type="pmid">37707946</article-id>
      <article-id pub-id-type="doi">10.2196/48534</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Estimating Patient Satisfaction Through a Language Processing Model: Model Development and Evaluation</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Huang</surname>
            <given-names>Zonghai</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Burns</surname>
            <given-names>Michael</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Matsuda</surname>
            <given-names>Shinichi</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Drug Safety Division</institution>
            <institution>Chugai Pharmaceutical Co Ltd</institution>
            <addr-line>2-1-1 Nihonbashi-Muromachi, Chuo-ku</addr-line>
            <addr-line>Tokyo, 103-8324</addr-line>
            <country>Japan</country>
            <phone>81 8080105061</phone>
            <email>matsudasni@chugai-pharm.co.jp</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1822-1090</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Ohtomo</surname>
            <given-names>Takumi</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6438-6315</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Okuyama</surname>
            <given-names>Masaru</given-names>
          </name>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0000-5226-1243</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Miyake</surname>
            <given-names>Hiraku</given-names>
          </name>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0001-4582-5749</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Aoki</surname>
            <given-names>Kotonari</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1923-7003</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Drug Safety Division</institution>
        <institution>Chugai Pharmaceutical Co Ltd</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Initiative Inc</institution>
        <addr-line>Tokyo</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Shinichi Matsuda <email>matsudasni@chugai-pharm.co.jp</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>14</day>
        <month>9</month>
        <year>2023</year>
      </pub-date>
      <volume>7</volume>
      <elocation-id>e48534</elocation-id>
      <history>
        <date date-type="received">
          <day>1</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="rev-request">
          <day>16</day>
          <month>5</month>
          <year>2023</year>
        </date>
        <date date-type="rev-recd">
          <day>28</day>
          <month>7</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>9</day>
          <month>8</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Shinichi Matsuda, Takumi Ohtomo, Masaru Okuyama, Hiraku Miyake, Kotonari Aoki. Originally published in JMIR Formative Research (https://formative.jmir.org), 14.09.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2023/1/e48534" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Measuring patient satisfaction is a crucial aspect of medical care. Advanced natural language processing (NLP) techniques enable the extraction and analysis of high-level insights from textual data; nonetheless, data obtained from patients are often limited.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to create a model that quantifies patient satisfaction based on diverse patient-written textual data.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We constructed a neural network–based NLP model for this cross-sectional study using the textual content from disease blogs written in Japanese on the Internet between 1994 and 2020. We extracted approximately 20 million sentences from 56,357 patient-authored disease blogs and constructed a model to predict the patient satisfaction index (PSI) using a regression approach. After evaluating the model’s effectiveness, PSI was predicted before and after cancer notification to examine the emotional impact of cancer diagnoses on 48 patients with breast cancer.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We assessed the correlation between the predicted and actual PSI values, labeled by humans, using the test set of 169 sentences. The model successfully quantified patient satisfaction by detecting nuances in sentences with excellent effectiveness (Spearman correlation coefficient [ρ]=0.832; root-mean-squared error [RMSE]=0.166; <italic>P</italic>&#60;.001). Furthermore, the PSI was significantly lower in the cancer notification period than in the preceding control period (−0.057 and −0.012, respectively; 2-tailed t<sub>47</sub>=5.392, <italic>P</italic>&#60;.001), indicating that the model quantifies the psychological and emotional changes associated with the cancer diagnosis notification.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our model demonstrates the ability to quantify patient dissatisfaction and identify significant emotional changes during the disease course. This approach may also help detect issues in routine medical practice.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>breast cancer</kwd>
        <kwd>internet</kwd>
        <kwd>machine learning</kwd>
        <kwd>natural language processing</kwd>
        <kwd>natural language-processing model</kwd>
        <kwd>neural network</kwd>
        <kwd>NLP</kwd>
        <kwd>patient satisfaction</kwd>
        <kwd>textual data</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>In any service industry, the goal is to identify and respond to customer needs [<xref ref-type="bibr" rid="ref1">1</xref>]. In health care, customers are patients, and services must be provided based on whether patients are satisfied with the diagnoses, treatment, and care that they receive. Additionally, in the medical field, patient satisfaction can be considered in the context of pharmacovigilance (PV). PV is related to monitoring and minimizing the risks of unfavorable events associated with medications, such as adverse drug reactions, and optimizing the benefit-risk profile throughout the drug life cycle [<xref ref-type="bibr" rid="ref2">2</xref>]. Recently, in the wake of technological data innovations, some traditional PV activities have faced challenges in improving efficiency and quality [<xref ref-type="bibr" rid="ref3">3</xref>]. To improve PV, it is essential to consider recruiting patients who have first-hand experience of treatments, but this remains insufficient [<xref ref-type="bibr" rid="ref4">4</xref>]. Traditional measures, such as spontaneous reporting and electronic health care databases, do not contain information related to patients’ emotions; previous research in this area has used questionnaires regarding quality of life (QOL) or patient-reported outcomes [<xref ref-type="bibr" rid="ref5">5</xref>]. Furthermore, obtaining sufficient and generalizable knowledge is often challenging owing to small sample sizes and limited patient diversity [<xref ref-type="bibr" rid="ref6">6</xref>].</p>
      <p>Insights from patient-derived resources can help improve PV guidelines to better meet patient needs. However, encouraging patient involvement is associated with challenges in obtaining feedback from different patients. Recent PV studies considered data from social networking services (SNSs) [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>], but research has shown that the benefits of using Twitter and Facebook as patient-derived resources for PV are few [<xref ref-type="bibr" rid="ref10">10</xref>]. This may be because SNSs contain a significant amount of information unrelated to treatment, making it difficult to extract the necessary data, as the primary scope of these SNSs is not related to the provision of medical care.</p>
      <p>Data resources that are primarily focused on collecting patient experiences are rare. An example of a successful method of collecting such information is the web-based patient community operating in the United States, PatientsLikeMe, which has conducted both prospective data collection and evaluation of treatments from the perspective of patients [<xref ref-type="bibr" rid="ref11">11</xref>]. One conventional method of collecting data regarding patient feedback is through surveys that include questions on QOL. Surveys conducted by PatientsLikeMe use multiple-choice questionnaires to ask patients about their disease complaints [<xref ref-type="bibr" rid="ref12">12</xref>]. However, as most QOL questions are developed from the perspective of the health care professional, they tend to focus only on the intentions of those asking the questions. A recent study showed that patients with COVID-19 tended to describe broad aspects of care that mattered to them in the comment field, regardless of the focus of the survey question [<xref ref-type="bibr" rid="ref13">13</xref>]. This highlights the importance of patient-written narratives, as essential opinions of patients may be overlooked if only prespecified questionnaires are used. Another key challenge is obtaining data that reflect the opinions of a wide range of patients receiving various treatments.</p>
      <p>Regarding such data, some patients in Japan who had adopted the custom of writing <italic>tōbyōki</italic>, which are diaries about their longitudinal experience with diseases [<xref ref-type="bibr" rid="ref14">14</xref>], began posting their <italic>tōbyōki</italic> as blogs in the mid-1990s. These <italic>tōbyōki</italic> blogs, in combination with natural language processing (NLP) [<xref ref-type="bibr" rid="ref15">15</xref>], facilitate a qualitative understanding of treatment experiences and feelings [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. Nonetheless, a qualitative description alone is not sufficient to make decisions that could improve patient care, and effective methods for visualizing patient anxieties and frustrations are needed.</p>
      <p>Based on recent research trends, we believe the following 3 research issues should be addressed:</p>
      <list list-type="order">
        <list-item>
          <p>Critical information is missed when only computers are used to classify results based on a preset group of options. Thus, the contents need to be reviewed manually. This takes considerable time before starting a discussion for action.</p>
        </list-item>
        <list-item>
          <p>Analyzing qualitative data quantitatively to investigate the significance of differences is challenging. For example, sentiment analysis programs can identify a particular sentiment category as “negative” for a specific group of texts based on machine learning; however, this classification alone does not indicate the intensity of that negativity. Although some studies have quantitatively shown the degree of sentiment, the validity of such estimations in the health care domain has been limited [<xref ref-type="bibr" rid="ref18">18</xref>]. Hence, manual review by humans is required to prioritize issues for action. Thus, a system that can quantitatively assess the impact of qualitative content in a timely fashion is needed.</p>
        </list-item>
        <list-item>
          <p>When using supervised machine learning to classify groups according to patients’ comments, researchers must specify the classification groups beforehand. If a patient has a complaint that does not fit into the prespecified classification groups, it is challenging to capture the complaint using previous classification methods. Thus, we believe that these types of classification approaches have led to the loss of a significant percentage of social media data, which is unfortunate because patients’ comments on social media can yield novel, unanticipated complaints given that they do not have the same restrictions that they would have with structured questionnaires [<xref ref-type="bibr" rid="ref19">19</xref>].</p>
        </list-item>
      </list>
      <p>We believe that the quantitative assessment of patient satisfaction using data from the narratives of diverse patient populations is of significant value; however, no such efforts have been reported. If an efficient tool to obtain patient feedback from written texts could be developed, it could be widely applied to improve health care services. In this study, we aimed to create an NLP model that quantifies patient satisfaction based on diverse patient-written textual data.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Description and Processing of Data</title>
        <p>We have collected anonymous, publicly available data from <italic>tōbyōki</italic> blogs written in Japanese from the internet [<xref ref-type="bibr" rid="ref20">20</xref>]. Individual <italic>tōbyōki</italic> blogs were manually tagged by disease based on the blog title or introduction page. Between 1994 and 2020, the most frequently reported disease on <italic>tōbyōki</italic> blogs was breast cancer (n=6669 blog entries), followed by depression (n=3295), cervical cancer (n=1231), and rheumatoid arthritis (n=1144). We focused on breast cancer because it has the largest number of entries and is the most common cancer in women worldwide [<xref ref-type="bibr" rid="ref21">21</xref>]. Additionally, as the recurrence of breast cancer exerts a severe psychological distress on patients [<xref ref-type="bibr" rid="ref22">22</xref>], there is a substantial need to evaluate patient satisfaction during treatment.</p>
      </sec>
      <sec>
        <title>Overall Flow of Model Construction and Evaluation</title>
        <p>A systematic review revealed no unified definition of patient satisfaction [<xref ref-type="bibr" rid="ref23">23</xref>]. It is assumed that patient satisfaction is the result of a combination of treatment efficacy, quality of care, and QOL. Here, the patient satisfaction index (PSI) was defined as a numerical value ranging from −1.0 to 1.0, representing the most dissatisfied and satisfied states, respectively. We applied NLP and machine learning (ML) to develop a quantitative method for evaluating PSIs using textual information. Currently, most approaches to text analysis are based on sentiment analysis, which uses a simple sum of each word’s emotional score [<xref ref-type="bibr" rid="ref24">24</xref>]. However, this approach limits the ability to capture emotional subtleties. Another critical issue when dealing with words is how to consider the context of each sentence. A previous study reported that the performance of ML models for textual data is inadequate in the absence of contextual considerations [<xref ref-type="bibr" rid="ref25">25</xref>]. To address these issues, we applied a neural network-based model known as bidirectional encoder representation from transformers (BERT) [<xref ref-type="bibr" rid="ref26">26</xref>]. It uses word embedding, which helps capture sentence nuance more naturally than sentiment analysis [<xref ref-type="bibr" rid="ref24">24</xref>]. In addition, BERT provides improved performance because it incorporates the context before and after the words to capture nuances better than other models.</p>
        <p>We attempted to predict PSIs using a regression approach. The overall flow of the model construction is shown in <xref rid="figure1" ref-type="fig">Figure 1</xref>, and the data flowchart is shown in Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. For the training process, we collected 20 million <italic>tōbyōki</italic> blog sentences extracted from disease blogs written by 56,357 patients concerning 1402 distinct diseases, and then the preprocessing was performed to remove the extraneous information (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) [<xref ref-type="bibr" rid="ref27">27</xref>]. In general, pretraining requires a vast amount of data and tends to be highly computational and time-consuming. To complete this process efficiently, we implemented transfer learning using the publicly available Japanese version of BERT [<xref ref-type="bibr" rid="ref28">28</xref>]. We then prepared the training data for fine-tuning, which enabled BERT to predict PSIs. Specifically, we prepared 961 sentences extracted randomly from <italic>tōbyōki</italic> blog entries written by 181 patients with breast cancer. Next, 3 reviewers (SM, TO, and HM) independently reviewed each sentence and provided a numerical value for the PSI as the actual label (PSI labeling guidelines are presented in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>; statistics for annotation results are presented in Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>); the mean value of the reviewers’ PSI labels was treated as the actual PSI for each sentence to ensure the model’s robustness by avoiding possible effects of differences between the 3 labels. Subsequently, we randomly divided these sentence data into a training data set (792 sentences) and an unseen test data set (169 sentences) to build the model and evaluate its effectiveness (the characteristics of the data for fine-tuning are presented in Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flow diagram of model construction. The overall flow of model construction consists of a pretraining phase, fine-tuning phase, and model evaluation phase. During pretraining, the bidirectional encoder representation from transformers (BERT) model obtains the spread of words, a mechanism also known as word embedding, from a large data set (in this case, tōbyōki blogs). Next, fine-tuning, a supervised learning process, replaces the output layer of the model for a specific task (in this case, predicting patient satisfaction index [PSI] from the texts).</p>
          </caption>
          <graphic xlink:href="formative_v7i1e48534_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Using the test data set, we conducted a sentiment analysis based on the Japanese sentiment polarity dictionary [<xref ref-type="bibr" rid="ref29">29</xref>]. Researchers at Tohoku University, a national university in Japan, created this dictionary by collecting nouns and declinable words in Japanese and manually adding polarity information ranging from −1.00 (negative) to 1.00 (positive) [<xref ref-type="bibr" rid="ref30">30</xref>]. Next, using the same test set, we evaluated the BERT model’s performance based on the correlation between the predicted and actual PSI.</p>
      </sec>
      <sec>
        <title>Change in PSI After Cancer Notification</title>
        <p>To confirm the reliability of the prepared BERT model in evaluating the PSI for actual cases, we conducted an evaluation by predicting the PSI before and after cancer notification. The “cancer notification period” was defined as the time when any blog entry containing the word “cancer notification (in Japanese)” was posted; each of these entries was manually confirmed by a reviewer. In contrast, the “control period” was defined as the time covered by 10 entries posted before the 120 days preceding the cancer notification period (Figure S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). We selected 48 blogs with both a blog entry for the cancer notification period and the preceding control period and computed the PSI in each period; the detailed procedure is presented in Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Statistical Analyses</title>
        <p>To evaluate the model’s capacity, the Spearman correlation coefficient (ρ) and the root-mean-squared error (RMSE) were used. A paired, 2-tailed <italic>t</italic> test was conducted to compare the PSIs between the cancer notification and control periods. To compare BERT models with and without pretraining, we used a statistical comparison test for 2 correlations [<xref ref-type="bibr" rid="ref31">31</xref>]. All statistical analyses were performed using R (version 3.6.2; The R Foundation for Statistical Computing), with <italic>P</italic>&#60;.05 being considered statistically significant.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>We collected anonymous, publicly available data from web-based sources. Per the copyright law issued by the Japanese Agency for Cultural Affairs (Article 47-7), we adhered to regulations allowing the reproduction and adaptation of copyrighted works onto recording media for information analysis within specified limits [<xref ref-type="bibr" rid="ref32">32</xref>]. To ensure the privacy of individuals, the breast cancer blog data used in this study were meticulously reviewed. They were visually confirmed to be free of personally identifiable information such as the blog authors’ names, handle names, and dates of birth. This study did not necessitate institutional review board approval, aligning with the Ethical Guidelines for Life Sciences and Medical Research Involving Human Subjects [<xref ref-type="bibr" rid="ref33">33</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Evaluation of the BERT Model</title>
        <p>As part of the dictionary-based approach, we conducted sentiment analysis. The correlation between the actual PSI labeled by humans and the predicted sentiment score was very low (ρ=0.127; RMSE=0.563; <italic>P</italic>=.10; Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). This result shows that sentiment analysis based on the widely used Japanese sentiment polarity dictionary is not appropriate for predicting the PSI.</p>
        <p>Using the same test set, we evaluated the correlation between the predicted and actual PSI. The BERT model achieved excellent effectiveness as an NLP model for predicting PSIs (ρ=0.832; RMSE=0.166; <italic>P</italic>&#60;.001; <xref rid="figure2" ref-type="fig">Figure 2</xref>). PSI prediction using the BERT model without pretraining was less reliable than that using the model with pretraining (ρ=0.554; RMSE=0.250; <italic>P</italic>&#60;.001; Figure S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Furthermore, a statistical comparison test for 2 correlations demonstrated that they were significantly different (<italic>P</italic>&#60;.001). This reaffirms that the model’s performance is the highest in the BERT model with pretraining.</p>
        <p>We reviewed the sentences with the highest and lowest PSIs (<xref ref-type="table" rid="table1">Table 1</xref>) and found that our model was able to evaluate the nuances of each sentence. For example, a sentence expressing appreciation for help from a patient’s family members and friends yielded a high predicted PSI of 0.45. In contrast, a situation where patients believed that their condition was improving despite experiencing adverse drug reactions yielded a modest predicted PSI of 0.18. Similarly, a sentence describing considerable hardships from radiotherapy yielded the lowest PSI, which was −0.58.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Correlation between the predicted and actual patient satisfaction index (PSI). Predicted versus actual PSI using the test set.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e48534_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Predicted patient satisfaction index (PSI) corresponding to sentences in tōbyōki blogs.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="50"/>
            <col width="890"/>
            <col width="60"/>
            <thead>
              <tr valign="bottom">
                <td>Rank</td>
                <td>PSI sentence examples<sup>a</sup></td>
                <td>PSI</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Blindsided by the notification of my illness, I found immense joy and amazement in being able to accomplish so many things in just 6 months, with all of my friends waiting for me, bolstering my happiness.</td>
                <td>0.45</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Perhaps the new anti-nausea medication is working better than expected.</td>
                <td>0.41</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>The results of the echocardiogram showed no abnormalities at all.</td>
                <td>0.23</td>
              </tr>
              <tr valign="top">
                <td>25</td>
                <td>The only reason I can manage to tolerate the side effects is that I believe my condition is becoming better.</td>
                <td>0.18</td>
              </tr>
              <tr valign="top">
                <td>105</td>
                <td>I told the doctor I wanted a chest scan, but he said he would not do it until I had more symptoms.</td>
                <td>−0.11</td>
              </tr>
              <tr valign="top">
                <td>149</td>
                <td>I really do not like tests, and no matter how many times I have them, I never get used to them.</td>
                <td>−0.33</td>
              </tr>
              <tr valign="top">
                <td>171</td>
                <td>I have had a number of severe depressive episodes, and I have also suffered from menopausal symptoms caused by hormone therapy.</td>
                <td>−0.52</td>
              </tr>
              <tr valign="top">
                <td>172</td>
                <td>The radiation treatment was quite painful.</td>
                <td>−0.58</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>These are translations of original sentences written in Japanese. Some minor changes have been made to protect patient privacy. Ranks represent the results ordered from the highest to the lowest predicted PSI for the test set.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Changes in PSI After Cancer Notification</title>
        <p>To confirm the applicability of this study’s BERT model in assessing the PSI for actual cases, we compared the PSI distribution between the time of cancer notification and the time before cancer notification using 48 <italic>tōbyōki</italic> blogs written by patients with breast cancer. Many sentences tended to have neutral PSIs (the proportions of PSIs between −0.2 and 0.2 were 1725/2097, 82.3% in the cancer notification period and 7330/8983, 81.6% in the control period; <xref rid="figure3" ref-type="fig">Figure 3</xref>). The proportion of sentences showing a negative PSI was higher in the cancer notification period (1342/2097, 64%) than in the control period (4497/8983, 50.1%). In addition, the negative PSI distribution in each sentence was slightly higher in the cancer notification period (mode –0.05) than in the control period (mode 0.05). These results indicate that many sentences in <italic>tōbyōki</italic> blogs had a neutral tone, even when they were written about cancer notification. Overall, the PSI was lower in the cancer notification period than in the control period.</p>
        <p>To examine the aforementioned differences in detail, we compared the mean PSI values at each period. Although the SD of the PSI distribution was similar in the cancer notification (SD 0.042) and control (SD 0.045) periods, the mean PSI was significantly lower in the cancer notification period than in the control period (−0.057 and −0.012, respectively; <italic>t</italic><sub>47</sub>==5.392; <italic>P</italic>&#60;.001; <xref rid="figure4" ref-type="fig">Figure 4</xref>A). This result suggests that cancer notification adversely affects the PSI, as expected. However, the average negative effect associated with cancer notification may have been partly diminished owing to the many neutral sentences in the cancer notification and control periods, as shown in <xref rid="figure3" ref-type="fig">Figure 3</xref>. This suggests that some sentences expressing shock concerning the notification may be overlooked when relying on the overall mean PSI alone. Hence, we focused on the sentences with the lowest PSI values, which were expected to highlight the most negative effects associated with cancer notification. The mean difference in the PSI between the cancer notification and control periods became apparent when the bottom 5 sentences were compared (−0.298 and −0.144, respectively; <italic>t</italic><sub>47</sub>=7.214; <italic>P</italic>&#60;.001; <xref rid="figure4" ref-type="fig">Figure 4</xref>B). Furthermore, the SD of the PSI distribution was larger during the cancer notification period (SD 0.128) than during the control period (SD 0.090). These results suggest that focusing on the lower end of the PSI successfully highlights the negative effects of cancer notification.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Distribution of the predicted patient satisfaction index (PSI) before and after cancer notification. Distribution of the predicted PSI at the time of and before cancer notification (defined as the control period). The figure shows the predicted PSI for each sentence in each period.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e48534_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Patient satisfaction index (PSI) comparison before and after cancer notification. (A) Comparison of the mean PSI in the cancer notification and control periods without limiting. (B) Comparison of the mean PSI in the cancer notification and control periods limited to the 5 sentences with the lowest PSI values.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e48534_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study showed the successful development of a model that quantifies patient satisfaction based on patient-written textual data. The most recent studies on patient satisfaction have used relatively small samples [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. However, our approach, which involved the use of an ML model with a vast amount of patient-written text from the internet, presented a realistic method for estimating patient satisfaction that can help improve health care services.</p>
        <p>When we applied the neural network-based BERT model, the predicted PSI was strongly correlated with that judged by human interpretation (ρ=0.832; <xref rid="figure2" ref-type="fig">Figure 2</xref>), and the model became more reliable with pretraining (ρ=0.554; Figure S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). This indicates the importance of pretraining specific to patients’ experiences in PSI prediction; therefore, pretraining using a large amount of data is essential to achieve high accuracy. Although a recent systematic review showed that there are many studies on NLP and ML using patient-written free texts [<xref ref-type="bibr" rid="ref36">36</xref>], few studies have attempted text-based quantification, and no previous studies are available that could provide a benchmark for comparison with our model. Nevertheless, in 1 study on hospital care that evaluated the correlation between scores obtained from a patient questionnaire and those derived from sentiment analysis of free text comments, Spearman correlation coefficient did not exceed 0.50 [<xref ref-type="bibr" rid="ref37">37</xref>], indicating the difficulty in achieving high accuracy. These findings also support our model’s excellent effectiveness in such a situation. Moreover, when we reviewed the sentences paired with PSIs (<xref ref-type="table" rid="table1">Table 1</xref>), we found that the model’s predictions considered the degree of meaning (the nuances of the language expressions) in the sentences, which is difficult to predict using conventional sentiment analysis. Collectively, these findings suggest that this model, which was trained on an immensely high volume of data from <italic>tōbyōki</italic> blogs, can be practically applied to determine accurate PSIs.</p>
        <p>We validated the model’s applicability in assessing emotional responses to cancer notification, which usually occurs in the early phase of patients’ cancer journey. As expected, PSI was significantly lower during the cancer notification period than during the preceding control period (<xref rid="figure4" ref-type="fig">Figure 4</xref>), indicating that the model can quantify the psychological and emotional changes associated with the notification. When limited to the 5 lowest-ranking sentences, the difference in PSIs between the cancer notification and control periods increased, suggesting that the amplitude of negative emotions is high for some people, as reflected by the larger SD in the cancer notification period (SD 0.128) than in the control period (SD 0.090). Understanding patient satisfaction at each stage of treatment during routine clinical practice is essential for improving the medical care system in a patient-centered fashion because there may be discrepancies in the disease burden recognized by patients and clinicians [<xref ref-type="bibr" rid="ref38">38</xref>]. Moreover, this result is consistent with Elisabeth Kübler-Ross’s 5-stage model of death and dying (<xref rid="figure5" ref-type="fig">Figure 5</xref>) [<xref ref-type="bibr" rid="ref39">39</xref>]. In the Kübler-Ross model, a cancer notification induces a “shock,” represented as the steepest negative impact (shown as a thick red line). Although several factors, including both personal (eg, age, sex, and religion) and country (eg, country’s health policies and medical environment) levels, affect patient satisfaction, it is reasonable to assume that cancer notification is universally considered to be a negative event that causes a decline in patient satisfaction regardless of the differences in these factors. To our knowledge, our model succeeded in numerically expressing this phenomenon for the first time.</p>
        <p>Our method of quantitatively identifying cancer-related anxieties can greatly contribute to future NLP research by highlighting patients’ medical needs efficiently. Although research using qualitative approaches, such as content analysis, is helpful in analyzing feedback from patients, qualitative review tends to be time-consuming and is associated with many challenges in analyzing information. Our approach, which is based on supervised ML using BERT, can significantly reduce the cost of human review. While many studies have reported achieving good results by applying BERT to both classification [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>] and regression tasks [<xref ref-type="bibr" rid="ref42">42</xref>], this study brings a unique perspective by demonstrating the potential usefulness of BERT in predicting patient satisfaction using a regression approach on patient-written textual data.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>The 5-stage model of death and dying by Elisabeth Kübler-Ross. The thick red line denotes the “shock” induced by cancer notification. The dotted line indicates a fork in the path between acceptance and depression.</p>
          </caption>
          <graphic xlink:href="formative_v7i1e48534_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The current findings suggest that our model can be applied as a quantitative index of patient satisfaction not only in the field of PV but also in the field of health care services, where it can be used to determine the effectiveness of communication with health service providers and other related factors [<xref ref-type="bibr" rid="ref43">43</xref>]. Considering that many hospitals in the United States continue to estimate patient satisfaction with treatment using questionnaires or Twitter [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>], our approach represents a major breakthrough. Patients may be dissatisfied and anxious about services, including treatments, in their disease-fighting experience. In addition, this model can be applied to diverse areas of research subjects in social psychology, where quantitative consideration of population-level patient emotions may play an essential role in advancing knowledge in the field.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>This study has several limitations. First, when applying our method cross-culturally, it is necessary to consider that the writers’ thoughts, culture, beliefs, and customs affect their content. Second, in our model, we exclusively used breast cancer data; therefore, the model may not be generalizable to other diseases, especially those that affect male patients. Therefore, as a scope for future work, data relating to both male and female patients should be analyzed using blogs on other diseases. Third, patient satisfaction inherently contains some level of subjectivity. It encompasses multiple facets, such as treatment outcomes, communication experience with health care providers, patients’ understanding of their disease, and the overall patient experience. Although this study focuses on an overall assessment of their disease condition and treatment reflected through their blog entries, our approach does not necessarily capture all aspects of patient satisfaction. Fourth, the subjectivity inherent in manual labeling procedures and the limitation of having a relatively small number of manual labels represent another constraint. Although we took careful measures to reduce potential bias and inconsistency, this aspect is subject to individual interpretation and understanding. Finally, we recognize the limitation in our definition of the “cancer notification period.” In our approach, 1 of our researchers manually read and verified the relevance of the content of the selected blogs to cancer notification. While this manual review ensured that the selected blogs were indeed about cancer notification, there may exist instances of cancer notification that use different terminology. Consequently, there may be missed cases where cancer notification is described using alternative expressions.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>We have proposed a distinctive approach for estimating patient satisfaction using patient-written textual data. Visualizing the patient’s journey and determining the causes of varying patient satisfaction will identify problems in routine medical practice and provide services to resolve these problems.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>eTables and eFigures.</p>
        <media xlink:href="formative_v7i1e48534_app1.docx" xlink:title="DOCX File , 447 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">BERT</term>
          <def>
            <p>bidirectional encoder representation from transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">PSI</term>
          <def>
            <p>patient satisfaction index</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">PV</term>
          <def>
            <p>pharmacovigilance</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">QOL</term>
          <def>
            <p>quality of life</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">RMSE</term>
          <def>
            <p>root-mean-squared error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">SNS</term>
          <def>
            <p>social networking service</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors would like to thank Matthew McKeehan for his assistance with drafting the manuscript. We would like to thank Editage for editing and reviewing this manuscript in English. This study received no funding.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>SM, TO, and KA work with Chugai Pharmaceutical Co, Ltd. MO and HM work with Initiative Inc. All other authors declare that they have no competing interests.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lovelock</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Wirtz</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <source>Services Marketing: An Asia-Pacific and Australian Perspective, 6th ed</source>
          <year>2015</year>
          <publisher-loc>Melbourne</publisher-loc>
          <publisher-name>Pearson Australia</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fornasier</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Francescon</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Leone</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Baldo</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>An historical overview over pharmacovigilance</article-title>
          <source>Int J Clin Pharm</source>
          <year>2018</year>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>744</fpage>
          <lpage>747</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29948743"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11096-018-0657-1</pub-id>
          <pub-id pub-id-type="medline">29948743</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11096-018-0657-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC6132952</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>IR</given-names>
            </name>
          </person-group>
          <article-title>The future of pharmacovigilance: a personal view</article-title>
          <source>Eur J Clin Pharmacol</source>
          <year>2008</year>
          <volume>64</volume>
          <issue>2</issue>
          <fpage>173</fpage>
          <lpage>181</lpage>
          <pub-id pub-id-type="doi">10.1007/s00228-007-0435-9</pub-id>
          <pub-id pub-id-type="medline">18172624</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Basch</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The missing voice of patients in drug-safety reporting</article-title>
          <source>N Engl J Med</source>
          <year>2010</year>
          <volume>362</volume>
          <issue>10</issue>
          <fpage>865</fpage>
          <lpage>869</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20220181"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMp0911494</pub-id>
          <pub-id pub-id-type="medline">20220181</pub-id>
          <pub-id pub-id-type="pii">362/10/865</pub-id>
          <pub-id pub-id-type="pmcid">PMC3031980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jefford</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Lisy</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lacey</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Emery</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Glaser</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Cross</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnasamy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McLachlan</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Bishop</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Patient-reported outcomes in cancer survivors: a population-wide cross-sectional study</article-title>
          <source>Support Care Cancer</source>
          <year>2017</year>
          <volume>25</volume>
          <issue>10</issue>
          <fpage>3171</fpage>
          <lpage>3179</lpage>
          <pub-id pub-id-type="doi">10.1007/s00520-017-3725-5</pub-id>
          <pub-id pub-id-type="medline">28434095</pub-id>
          <pub-id pub-id-type="pii">10.1007/s00520-017-3725-5</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Poole</surname>
              <given-names>KG</given-names>
            </name>
          </person-group>
          <article-title>Patient-experience data and bias: what ratings don't tell us</article-title>
          <source>N Engl J Med</source>
          <year>2019</year>
          <volume>380</volume>
          <issue>9</issue>
          <fpage>801</fpage>
          <lpage>803</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nejm.org/doi/10.1056/NEJMp1813418"/>
          </comment>
          <pub-id pub-id-type="doi">10.1056/NEJMp1813418</pub-id>
          <pub-id pub-id-type="medline">30811905</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pierce</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Bouri</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Pamer</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Proestel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rodriguez</surname>
              <given-names>HW</given-names>
            </name>
            <name name-style="western">
              <surname>Van Le</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Freifeld</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Walderhaug</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Edwards</surname>
              <given-names>IR</given-names>
            </name>
            <name name-style="western">
              <surname>Dasgupta</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Evaluation of Facebook and Twitter monitoring to detect safety signals for medical products: an analysis of recent FDA safety alerts</article-title>
          <source>Drug Saf</source>
          <year>2017</year>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>317</fpage>
          <lpage>331</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28044249"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40264-016-0491-0</pub-id>
          <pub-id pub-id-type="medline">28044249</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-016-0491-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC5362648</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Convertino</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ferraro</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Blandizzi</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tuccori</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The usefulness of listening social media for pharmacovigilance purposes: a systematic review</article-title>
          <source>Expert Opin Drug Saf</source>
          <year>2018</year>
          <volume>17</volume>
          <issue>11</issue>
          <fpage>1081</fpage>
          <lpage>1093</lpage>
          <pub-id pub-id-type="doi">10.1080/14740338.2018.1531847</pub-id>
          <pub-id pub-id-type="medline">30285501</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tricco</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Zarin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Lillie</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Jeblee</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Warren</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Khan</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Robson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pham</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hirst</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Straus</surname>
              <given-names>SE</given-names>
            </name>
          </person-group>
          <article-title>Utility of social media and crowd-intelligence data for pharmacovigilance: a scoping review</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2018</year>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>38</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-018-0621-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-018-0621-y</pub-id>
          <pub-id pub-id-type="medline">29898743</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-018-0621-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC6001022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Caster</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Dietrich</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kürzinger</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Lerch</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Maskell</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Norén</surname>
              <given-names>GN</given-names>
            </name>
            <name name-style="western">
              <surname>Tcherny-Lessenot</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Vroman</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Wisniewski</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>van Stekelenborg</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Assessment of the utility of social media for broad-ranging statistical signal detection in pharmacovigilance: results from the WEB-RADR project</article-title>
          <source>Drug Saf</source>
          <year>2018</year>
          <volume>41</volume>
          <issue>12</issue>
          <fpage>1355</fpage>
          <lpage>1369</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30043385"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40264-018-0699-2</pub-id>
          <pub-id pub-id-type="medline">30043385</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40264-018-0699-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC6223695</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Wicks</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Heywood</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>The power of social networking in medicine</article-title>
          <source>Nat Biotechnol</source>
          <year>2009</year>
          <volume>27</volume>
          <issue>10</issue>
          <fpage>888</fpage>
          <lpage>890</lpage>
          <pub-id pub-id-type="doi">10.1038/nbt1009-888</pub-id>
          <pub-id pub-id-type="medline">19816437</pub-id>
          <pub-id pub-id-type="pii">nbt1009-888</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wicks</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Vaughan</surname>
              <given-names>TE</given-names>
            </name>
            <name name-style="western">
              <surname>Massagli</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Heywood</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Accelerated clinical discovery using self-reported patient data collected online and a patient-matching algorithm</article-title>
          <source>Nat Biotechnol</source>
          <year>2011</year>
          <volume>29</volume>
          <issue>5</issue>
          <fpage>411</fpage>
          <lpage>414</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nature.com/articles/nbt.1837"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/nbt.1837</pub-id>
          <pub-id pub-id-type="medline">21516084</pub-id>
          <pub-id pub-id-type="pii">nbt.1837</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guney</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Daniels</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Childers</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Using AI to understand the patient voice during the Covid-19 pandemic</article-title>
          <source>NEJM Catal Innov Care Deliv</source>
          <year>2020</year>
          <volume>1</volume>
          <issue>2</issue>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://catalyst.nejm.org/doi/full/10.1056/CAT.20.0103"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kadobayashi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <source>As a Source of Power to Live: Sociology of Tōbyōki for Cancer [in Japanese]</source>
          <year>2011</year>
          <publisher-loc>Tokyo</publisher-loc>
          <publisher-name>Seikaisha Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirschberg</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>CD</given-names>
            </name>
          </person-group>
          <article-title>Advances in natural language processing</article-title>
          <source>Science</source>
          <year>2015</year>
          <volume>349</volume>
          <issue>6245</issue>
          <fpage>261</fpage>
          <lpage>266</lpage>
          <pub-id pub-id-type="doi">10.1126/science.aaa8685</pub-id>
          <pub-id pub-id-type="medline">26185244</pub-id>
          <pub-id pub-id-type="pii">349/6245/261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Matsuda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Aoki</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tomizawa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sone</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tanaka</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kuriki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Takahashi</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Analysis of patient narratives in disease blogs on the internet: an exploratory study of social pharmacovigilance</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2017</year>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>e10</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2017/1/e10/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/publichealth.6872</pub-id>
          <pub-id pub-id-type="medline">28235749</pub-id>
          <pub-id pub-id-type="pii">v3i1e10</pub-id>
          <pub-id pub-id-type="pmcid">PMC5346166</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Matsuda</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ohtomo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Tomizawa</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Miyano</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mogi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kuriki</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nakayama</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Watanabe</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Incorporating unstructured patient narratives and health insurance claims data in pharmacovigilance: natural language processing analysis of patient-generated texts about systemic lupus erythematosus</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <volume>7</volume>
          <issue>6</issue>
          <fpage>e29238</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/6/e29238/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/29238</pub-id>
          <pub-id pub-id-type="medline">34255719</pub-id>
          <pub-id pub-id-type="pii">v7i6e29238</pub-id>
          <pub-id pub-id-type="pmcid">PMC8278300</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hanauer</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Developing a standardized protocol for computational sentiment analysis research using health-related social media data</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>6</issue>
          <fpage>1125</fpage>
          <lpage>1134</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33355353"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocaa298</pub-id>
          <pub-id pub-id-type="medline">33355353</pub-id>
          <pub-id pub-id-type="pii">6045013</pub-id>
          <pub-id pub-id-type="pmcid">PMC8200276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rozenblum</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Greaves</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Bates</surname>
              <given-names>DW</given-names>
            </name>
          </person-group>
          <article-title>The role of social media around patient experience and engagement</article-title>
          <source>BMJ Qual Saf</source>
          <year>2017</year>
          <volume>26</volume>
          <issue>10</issue>
          <fpage>845</fpage>
          <lpage>848</lpage>
          <pub-id pub-id-type="doi">10.1136/bmjqs-2017-006457</pub-id>
          <pub-id pub-id-type="medline">28428244</pub-id>
          <pub-id pub-id-type="pii">bmjqs-2017-006457</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="web">
          <article-title>Tōbyōki blog collection [in Japanese]</article-title>
          <source>TOBYO</source>
          <access-date>2023-04-11</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.tobyo.jp/">https://www.tobyo.jp/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bray</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ferlay</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Soerjomataram</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Torre</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Jemal</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Global cancer statistics 2018: GLOBOCAN estimates of incidence and mortality worldwide for 36 cancers in 185 countries</article-title>
          <source>CA Cancer J Clin</source>
          <year>2018</year>
          <volume>68</volume>
          <issue>6</issue>
          <fpage>394</fpage>
          <lpage>424</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.3322/caac.21492"/>
          </comment>
          <pub-id pub-id-type="doi">10.3322/caac.21492</pub-id>
          <pub-id pub-id-type="medline">30207593</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Skandarajah</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Lisy</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ward</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bishop</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lacey</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Jefford</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Patient-reported outcomes in survivors of breast cancer one, three, and five years post-diagnosis: a cancer registry-based feasibility study</article-title>
          <source>Qual Life Res</source>
          <year>2021</year>
          <volume>30</volume>
          <issue>2</issue>
          <fpage>385</fpage>
          <lpage>394</lpage>
          <pub-id pub-id-type="doi">10.1007/s11136-020-02652-w</pub-id>
          <pub-id pub-id-type="medline">32997334</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11136-020-02652-w</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Batbaatar</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dorjdagva</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Luvsannyam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Amenta</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Conceptualisation of patient satisfaction: a systematic narrative literature review</article-title>
          <source>Perspect Public Health</source>
          <year>2015</year>
          <volume>135</volume>
          <issue>5</issue>
          <fpage>243</fpage>
          <lpage>250</lpage>
          <pub-id pub-id-type="doi">10.1177/1757913915594196</pub-id>
          <pub-id pub-id-type="medline">26187638</pub-id>
          <pub-id pub-id-type="pii">1757913915594196</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Denecke</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Sentiment analysis in medical settings: new opportunities and challenges</article-title>
          <source>Artif Intell Med</source>
          <year>2015</year>
          <volume>64</volume>
          <issue>1</issue>
          <fpage>17</fpage>
          <lpage>27</lpage>
          <pub-id pub-id-type="doi">10.1016/j.artmed.2015.03.006</pub-id>
          <pub-id pub-id-type="medline">25982909</pub-id>
          <pub-id pub-id-type="pii">S0933-3657(15)00029-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greaves</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez-Cano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Millett</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Donaldson</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Use of sentiment analysis for capturing patient experience from free-text comments posted online</article-title>
          <source>J Med Internet Res</source>
          <year>2013</year>
          <volume>15</volume>
          <issue>11</issue>
          <fpage>e239</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2013/11/e239/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.2721</pub-id>
          <pub-id pub-id-type="medline">24184993</pub-id>
          <pub-id pub-id-type="pii">v15i11e239</pub-id>
          <pub-id pub-id-type="pmcid">PMC3841376</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>ArXiv. Preprint posted online on May 24 2019</source>
          <year>2019</year>
          <pub-id pub-id-type="doi">10.48550/arXiv.1810.04805</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Morita</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Kawahara</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kurohashi</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Morphological analysis for unsegmented languages using recurrent neural network language model</article-title>
          <year>2015</year>
          <conf-name>Proceedings of the 2015 Conference on Empirical Methods in Natural Language Processing</conf-name>
          <conf-date>17-21 September 2015</conf-date>
          <conf-loc>Lisbon, Portugal</conf-loc>
          <fpage>2292</fpage>
          <lpage>2297</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/D15-1276</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shibata</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kawahara</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kurohashi</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Improving accuracy of Japanese parsing with BERT [in Japanese]</article-title>
          <year>2019</year>
          <conf-name>Proceedings of the 25th Annual Conference of the Association for Natural Language Processing</conf-name>
          <conf-date>March 12-15, 2019</conf-date>
          <conf-loc>Nagoya, Japan</conf-loc>
          <fpage>205</fpage>
          <lpage>208</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kobayashi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Inui</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Matsumoto</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tateishi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fukushima</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Collecting evaluative expressions for opinion extraction</article-title>
          <year>2004</year>
          <conf-name>Natural Language Processing – IJCNLP 2004</conf-name>
          <conf-date>22-24 March, 2004</conf-date>
          <conf-loc>Hainan Island, China</conf-loc>
          <fpage>596</fpage>
          <lpage>605</lpage>
          <pub-id pub-id-type="doi">10.1007/978-3-540-30211-7_63</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Higashiyama</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Inui</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Matsumoto</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Learning sentiment of nouns from selectional preferences of verbs and adjectives [in Japanese]</article-title>
          <year>2008</year>
          <conf-name>Proceedings of the 14th Annual Meeting of the Association for Natural Language Processing</conf-name>
          <conf-date>17-21 March, 2008</conf-date>
          <conf-loc>Tokyo, Japan</conf-loc>
          <fpage>584</fpage>
          <lpage>587</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Diedenhofen</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Musch</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>cocor: a comprehensive solution for the statistical comparison of correlations</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>e0121945</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0121945"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0121945</pub-id>
          <pub-id pub-id-type="medline">25835001</pub-id>
          <pub-id pub-id-type="pii">PONE-D-14-48849</pub-id>
          <pub-id pub-id-type="pmcid">PMC4383486</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <article-title>Copyright law for information analysis issued by the Japanese Agency for Cultural Affairs [in Japanese]</article-title>
          <source>Agency for Cultural Affairs, Government of Japan</source>
          <access-date>2023-08-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.bunka.go.jp/seisaku/chosakuken/seidokaisetsu/gaiyo/chosakubutsu_jiyu.html">https://www.bunka.go.jp/seisaku/chosakuken/seidokaisetsu/gaiyo/chosakubutsu_jiyu.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="web">
          <article-title>Ethical guidelines for life sciences and medical research involving human subjects [in Japanese]</article-title>
          <source>Ministry of Education; Ministry of Health, Labour and Welfare; and Ministry of Economy, Trade and Industry</source>
          <access-date>2023-08-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mhlw.go.jp/content/001077424.pdf">https://www.mhlw.go.jp/content/001077424.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schlesinger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Grob</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Shaller</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Using patient-reported information to improve clinical practice</article-title>
          <source>Health Serv Res</source>
          <year>2015</year>
          <volume>50</volume>
          <issue>Suppl 2</issue>
          <fpage>2116</fpage>
          <lpage>2154</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26573890"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/1475-6773.12420</pub-id>
          <pub-id pub-id-type="medline">26573890</pub-id>
          <pub-id pub-id-type="pmcid">PMC5115180</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blödt</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Müller-Nordhorn</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Seifert</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Holmberg</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Trust, medical expertise and humaneness: a qualitative study on people with cancer' satisfaction with medical care</article-title>
          <source>Health Expect</source>
          <year>2021</year>
          <volume>24</volume>
          <issue>2</issue>
          <fpage>317</fpage>
          <lpage>326</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33528878"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/hex.13171</pub-id>
          <pub-id pub-id-type="medline">33528878</pub-id>
          <pub-id pub-id-type="pmcid">PMC8077133</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Khanbhai</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Anyadi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Symons</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Flott</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mayer</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Applying natural language processing and machine learning techniques to patient experience feedback: a systematic review</article-title>
          <source>BMJ Health Care Inform</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>1</issue>
          <fpage>e100262</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://informatics.bmj.com/lookup/pmidlookup?view=long&#38;pmid=33653690"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjhci-2020-100262</pub-id>
          <pub-id pub-id-type="medline">33653690</pub-id>
          <pub-id pub-id-type="pii">bmjhci-2020-100262</pub-id>
          <pub-id pub-id-type="pmcid">PMC7929894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Greaves</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ramirez-Cano</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Millett</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Darzi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Donaldson</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Machine learning and sentiment analysis of unstructured free-text information about patient experience online</article-title>
          <source>The Lancet</source>
          <year>2012</year>
          <volume>380</volume>
          <issue>1</issue>
          <fpage>S10</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://informatics.bmj.com/lookup/pmidlookup?view=long&#38;pmid=33653690"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(13)60366-9</pub-id>
          <pub-id pub-id-type="pii">bmjhci-2020-100262</pub-id>
          <pub-id pub-id-type="pmcid">PMC7929894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salgado</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Reed</surname>
              <given-names>HL</given-names>
            </name>
            <name name-style="western">
              <surname>Quinn</surname>
              <given-names>CS</given-names>
            </name>
            <name name-style="western">
              <surname>Syverson</surname>
              <given-names>JG</given-names>
            </name>
            <name name-style="western">
              <surname>Le-Rademacher</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Beutler</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Loprinzi</surname>
              <given-names>CL</given-names>
            </name>
            <name name-style="western">
              <surname>Vangipuram</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>EML</given-names>
            </name>
            <name name-style="western">
              <surname>Henry</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Farris</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Hertz</surname>
              <given-names>DL</given-names>
            </name>
          </person-group>
          <article-title>Patient factors associated with discrepancies between patient-reported and clinician-documented peripheral neuropathy in women with breast cancer receiving paclitaxel: a pilot study</article-title>
          <source>Breast</source>
          <year>2020</year>
          <volume>51</volume>
          <fpage>21</fpage>
          <lpage>28</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.thebreastonline.com/article/S0960-9776(20)30068-0/fulltext"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.breast.2020.02.011</pub-id>
          <pub-id pub-id-type="medline">32193049</pub-id>
          <pub-id pub-id-type="pii">S0960-9776(20)30068-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC7198332</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kübler-Ross</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wessler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Avioli</surname>
              <given-names>LV</given-names>
            </name>
          </person-group>
          <article-title>On death and dying</article-title>
          <source>JAMA</source>
          <year>1972</year>
          <volume>221</volume>
          <issue>2</issue>
          <fpage>174</fpage>
          <lpage>179</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.psy.lmu.de/allg2/download/audriemmo/ws1011/kubler-ross.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jama.1972.03200150040010</pub-id>
          <pub-id pub-id-type="medline">5067627</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ambalavanan</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Devarakonda</surname>
              <given-names>MV</given-names>
            </name>
          </person-group>
          <article-title>Using the contextual language model BERT for multi-criteria classification of scientific articles</article-title>
          <source>J Biomed Inform</source>
          <year>2020</year>
          <volume>112</volume>
          <fpage>103578</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(20)30206-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2020.103578</pub-id>
          <pub-id pub-id-type="medline">33059047</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(20)30206-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>When BERT meets Bilbo: a learning curve analysis of pretrained language model on disease classification</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2022</year>
          <volume>21</volume>
          <issue>Suppl 9</issue>
          <fpage>377</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-022-01829-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-022-01829-2</pub-id>
          <pub-id pub-id-type="medline">35382811</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-022-01829-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC8981604</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Altosaar</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ranganath</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>ClinicalBERT: modeling clinical notes and predicting hospital readmission</article-title>
          <source>ArXiv. Preprint posted online on November 29 2020</source>
          <year>2020</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.48550/arXiv.1904.05342"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jenkinson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Coulter</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bruster</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Richards</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Chandola</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Patients' experiences and satisfaction with health care: results of a questionnaire study of specific aspects of care</article-title>
          <source>Qual Saf Health Care</source>
          <year>2002</year>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>335</fpage>
          <lpage>339</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://qualitysafety.bmj.com/lookup/pmidlookup?view=long&#38;pmid=12468693"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/qhc.11.4.335</pub-id>
          <pub-id pub-id-type="medline">12468693</pub-id>
          <pub-id pub-id-type="pmcid">PMC1757991</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elliott</surname>
              <given-names>MN</given-names>
            </name>
            <name name-style="western">
              <surname>Cohea</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Lehrman</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>EH</given-names>
            </name>
            <name name-style="western">
              <surname>Cleary</surname>
              <given-names>PD</given-names>
            </name>
            <name name-style="western">
              <surname>Giordano</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Beckett</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Zaslavsky</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Accelerating improvement and narrowing gaps: trends in patients' experiences with hospital care reflected in HCAHPS public reporting</article-title>
          <source>Health Serv Res</source>
          <year>2015</year>
          <volume>50</volume>
          <issue>6</issue>
          <fpage>1850</fpage>
          <lpage>1867</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/25854292"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/1475-6773.12305</pub-id>
          <pub-id pub-id-type="medline">25854292</pub-id>
          <pub-id pub-id-type="pmcid">PMC4693845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hawkins</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Brownstein</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Tuli</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Runels</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Broecker</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nsoesie</surname>
              <given-names>EO</given-names>
            </name>
            <name name-style="western">
              <surname>McIver</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Rozenblum</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bourgeois</surname>
              <given-names>FT</given-names>
            </name>
            <name name-style="western">
              <surname>Greaves</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Measuring patient-perceived quality of care in US hospitals using Twitter</article-title>
          <source>BMJ Qual Saf</source>
          <year>2016</year>
          <volume>25</volume>
          <issue>6</issue>
          <fpage>404</fpage>
          <lpage>413</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://qualitysafety.bmj.com/lookup/pmidlookup?view=long&#38;pmid=26464518"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjqs-2015-004309</pub-id>
          <pub-id pub-id-type="medline">26464518</pub-id>
          <pub-id pub-id-type="pii">bmjqs-2015-004309</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878682</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
