<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v10i1e81368</article-id><article-id pub-id-type="doi">10.2196/81368</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Remote Assessment of Parkinson Disease Using Deep Learning on Structured Mouse-Trace Data From Suspected Cases: Machine-Learning Pilot Feasibility Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Shahriar Zawad</surname><given-names>Md Rahat</given-names></name><degrees>BSc, MS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tumpa</surname><given-names>Zerin Nasrin</given-names></name><degrees>BSc, MSc</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sollis</surname><given-names>Lydia</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Parab</surname><given-names>Shubham</given-names></name><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Washington</surname><given-names>Peter</given-names></name><degrees>BA, MS, PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Electrical and Computer Engineering, Rice University</institution><addr-line>Houston</addr-line><addr-line>TX</addr-line><country>United States</country></aff><aff id="aff2"><institution>Department of Information and Computer Sciences, University of Hawaiʻi at M&#x0101;noa</institution><addr-line>Honolulu</addr-line><addr-line>HI</addr-line><country>United States</country></aff><aff id="aff3"><institution>Department of Computer Science, New York University</institution><addr-line>New York</addr-line><addr-line>NY</addr-line><country>United States</country></aff><aff id="aff4"><institution>Department of Medicine, Division of Clinical Informatics and Digital Transformation, University of California, San Francisco</institution><addr-line>10 Koret Way</addr-line><addr-line>San Francisco</addr-line><addr-line>CA</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Law</surname><given-names>Stephanie</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Lin</surname><given-names>Kuan-Hsun</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Khan</surname><given-names>Yelman</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Peter Washington, BA, MS, PhD, Department of Medicine, Division of Clinical Informatics and Digital Transformation, University of California, San Francisco, 10 Koret Way, San Francisco, CA, 94143, United States, 1 4153532067; <email>Peter.Washington@ucsf.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>26</day><month>6</month><year>2026</year></pub-date><volume>10</volume><elocation-id>e81368</elocation-id><history><date date-type="received"><day>31</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>06</day><month>05</month><year>2026</year></date><date date-type="accepted"><day>08</day><month>05</month><year>2026</year></date></history><copyright-statement>&#x00A9; Md Rahat Shahriar Zawad, Zerin Nasrin Tumpa, Lydia Sollis, Shubham Parab, Peter Washington. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 26.6.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2026/1/e81368"/><abstract><sec><title>Background</title><p>Parkinson disease (PD) is a pervasive neurodegenerative disorder globally, largely characterized by motor symptoms. Most existing artificial intelligence models for PD detection are trained on participants in well-resourced settings with confirmed clinical diagnoses. However, specialist-confirmed labels are often infeasible in low-resource settings.</p></sec><sec><title>Objective</title><p>We developed a web platform for structured mouse data collection through pattern tracing tests. We sought to assess the feasibility of leveraging data from a community-recruited sample of participants with suspected but undiagnosed PD to train artificial intelligence models that achieve respectable performance in predicting diagnosed PD. We tested whether using weaker diagnostic labels that may be more feasible to collect in community or global health settings, where access to professional neurologists is sparse or nonexistent, can lead to models that learn predictive signals that are diagnostically useful.</p></sec><sec sec-type="methods"><title>Methods</title><p>261 participants (73 self-reported PD, 155 non-PD, and 33 suspected PD) were recruited from community organizations in Hawaii and completed 3 pattern tracing tasks on our custom web assessment: straight line, sine wave, and spiral wave. During each task, cursor positions, screen dimensions, and an in-target boolean flag were recorded. From these data, we engineered features and generated mouse trace images. We built 3 categories of classifiers: (1) a feed-forward neural network using engineered features, (2) fine-tuned computer vision deep learning models, and (3) multimodal models concatenating a feed-forward neural network with computer vision models. Performance was evaluated using 1 primary experiment and 2 secondary analyses. The primary experiment involved training on suspected PD versus non-PD and testing on self-reported PD versus non-PD. A secondary analysis evaluated the reverse direction by training on participants with self-reported PD and without PD and then testing on participants with suspected PD versus participants without PD. Additionally, a cross-validation analysis was conducted using participants with self-reported PD versus those without PD with 5-fold cross-validation to establish baseline performance under well-defined diagnostic labels.</p></sec><sec sec-type="results"><title>Results</title><p>The best-performing models included a multimodal Vision Transformer in the primary experiment (<italic>F</italic><sub>1</sub>: mean 0.7619, SD 0.0535), a multimodal ResNet-50 in the secondary analysis (<italic>F</italic><sub>1</sub>: mean 0.9353, SD 0.0334), and an image-based DenseNet-201 in the cross-validation analysis (<italic>F</italic><sub>1</sub>: mean 0.9027, SD 0.0332). Training on patients with suspected PD yielded meaningful performance in predicting self-reported PD, supporting the feasibility of using lower-specificity labels for model development.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This pilot feasibility study suggests that remotely collected mouse-tracing data can support PD screening models under data labeling conditions of low diagnostic specificity: models trained on suspected PD from a community sample may learn signals that can transfer to predicting actual PD. Future work may consider pretraining using weaker labels and then fine-tuning on stronger clinical labels.</p></sec></abstract><kwd-group><kwd>Parkinson disease</kwd><kwd>feasibility study</kwd><kwd>remote screening</kwd><kwd>mouse-trace data</kwd><kwd>digital diagnostics</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Parkinson disease (PD) is a neurodegenerative disorder that significantly impacts the central nervous system. Major symptoms include tremors, bradykinesia, muscle rigidity, and postural instability [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref2">2</xref>], which progressively worsen over time, leading to difficulties in performing routine tasks such as typing and using a mouse. The progression of these symptoms significantly affects quality of life, making early and accurate diagnosis crucial to enable early intervention [<xref ref-type="bibr" rid="ref3">3</xref>]. PD is the second most common neurodegenerative disease after Alzheimer disease, affecting approximately 10 million people globally. In the United States, around 1 million individuals are diagnosed with PD, with an annual increase of about 90,000 new cases. This number is projected to rise to 1.2 million by 2030 [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>]. Currently, there is no definitive biomarker for PD, and diagnosis is primarily based on clinical symptoms and neuropsychological tests such as the Mini-Mental State Examination and the Unified Parkinson Disease Rating Scale [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref7">7</xref>]. These tests involve questionnaires and subjective evaluations by clinicians, which can lead to significant biases and potential misdiagnoses [<xref ref-type="bibr" rid="ref6">6</xref>]. This is particularly problematic, as PD symptoms often overlap with those of other age-related conditions and drug-induced Parkinsonism [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. Additionally, PD is characterized by the degeneration of dopamine-producing neurons in the brain, and by the time motor symptoms become apparent, approximately 30% to 50% of these neurons have already deteriorated [<xref ref-type="bibr" rid="ref11">11</xref>]. Therefore, improving approaches for more accessible classification of PD remains an important goal for effective management and treatment.</p><p>Previous digital health research on PD classification has included the analysis of hand and finger movements, keystroke dynamics, speech, handwriting, drawing tests, gait analysis, and sensor data from accelerometers and gyroscopes [<xref ref-type="bibr" rid="ref12">12</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. The use of sensors placed on lower limbs, wearable sensors supported by video recordings, and sensing coils or paper-based pads has proven effective in classifying PD and detecting tremors [<xref ref-type="bibr" rid="ref16">16</xref>-<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref30">30</xref>]. However, these methods often require controlled laboratory settings and specialized devices, limiting their broader applicability. Self-administered methods, such as keyboard interactions, keystroke dynamics, and smartphone screen interactions, have also been explored [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref21">21</xref>], but they may introduce biases, particularly against individuals with slower typing speeds. Mobile apps for data collection, symptom monitoring, and treatment management have demonstrated utility in tracking activities such as finger-tapping speed, gait, and motor performance [<xref ref-type="bibr" rid="ref31">31</xref>-<xref ref-type="bibr" rid="ref33">33</xref>], though they may pose challenges for older adults unfamiliar with smartphone technology. Moreover, video-based evaluations of finger tapping, facial expression, hand movement, and gait analysis have shown strong performance in PD classification [<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref37">37</xref>]. Multimodal approaches combining different data types, such as speech, gait, and upper limb movement data, have also demonstrated potential in classifying patients with PD [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>].</p><p>Despite the prior success of digital PD biomarkers, these tools have traditionally been trained using data collected from well-resourced settings. Transferring such models for use in lower-resourced settings often requires training or fine-tuning the models on data from those settings. However, it is often only feasible to obtain lower-specificity, community-collected data labels in these settings. We sought to understand how well labels of suspected PD transfer to predicting diagnosed PD.</p><p>To support this objective, we structured our evaluation around 1 primary experiment and 2 secondary analyses, each reflecting different levels of diagnostic certainty and real-world deployment scenarios. The primary experiment involved training models on participants with suspected PD and without PD and evaluating them on patients with self-reported PD and without PD. This experiment directly addresses our central research question by assessing whether models trained using weaker, low-specificity, community-recruited labels can be diagnostically useful. We also conducted a secondary analysis examining the reverse direction, in which models were trained on participants with self-reported PD and without PD and tested on individuals with suspected PD and without PD. This analysis was included to assess whether the learned signal is bidirectional. Additionally, we conducted a cross-validation analysis using only participants with self-reported PD and without PD to establish baseline performance under well-defined diagnostic labels. Importantly, the suspected PD group in this study is based solely on the self-report and does not represent clinically confirmed PD. Instead, it reflects a heterogeneous population with uncertain diagnostic status, which we use to model real-world diagnostic ambiguity rather than validated prodromal diseases. Accordingly, this study is positioned as a feasibility investigation to determine whether meaningful PD-related signals can be learned under conditions of diagnostic uncertainty.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Overview</title><p>We created a website to collect structured mouse movement data by having participants complete a series of mouse-tracing tests remotely. We trained a series of deep-learning models using various features derived from the mouse traces. <xref ref-type="fig" rid="figure1">Figure 1</xref> outlines the workflow from data collection to model evaluation and interpretability analysis.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>The study workflow from data collection to model evaluation and interpretability analysis. (A) Participants completed the data collection process remotely on the website. (B) Engineered features and mouse-trace images were fed into 3 classes of models. The results were analyzed and visualized to identify the best performing models. (C) The best multimodal models (multimodal ResNet-50 and multimodal ViT) were analyzed for interpretability using GradSHAP (Gradient Shapley Additive Explanations) feature importance. DenseNet-201: Densely Connected Convolutional Network-201; MobileNet V2: Mobile Network v2; PD: Parkinson disease; ResNet-50: Residual Network-50; ViT: Vision Transformer.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig01.png"/></fig></sec><sec id="s2-2"><title>Participant Recruitment and Data Collection</title><p>We recruited participants for this study through both online methods (email and social media posts) and offline methods (community meetings and conventions in Hawaii). We collaborated with the Hawaii Parkinson&#x2019;s Association and Beyond Rehab to post flyers and advertise the study to various PD emailing lists. Additionally, we established a recruitment booth at the 2024 Hawaii Parkinson&#x2019;s Association Symposium and the 2024 Hawaii Annual Parkinson&#x2019;s Run, where we provided potential participants with flyers describing how to complete the study.</p><p>We collected data via a web application that we developed [<xref ref-type="bibr" rid="ref40">40</xref>], illustrated in <xref ref-type="fig" rid="figure2">Figure 2</xref>. Participants provided demographic and disease-related information, including age and dominant hand. Due to the infeasibility of obtaining official diagnostic documents for all participants under the constraints of the pilot grant that funded this project, we asked participants to self-report their PD status.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Pages of the data collection website: (A) Introduction page of the website to inform participants about the study; (B) Participants were asked to provide information about themselves; (C) Participants were asked to confirm their information to prevent mistakes; (D) Participants were asked to trace a straight line; (E) Participants were asked to trace a sine wave; (F) Participants were asked to trace a spiral wave.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig02.png"/></fig><p>Notably, we provided an option to select &#x201C;suspected PD&#x201D; for participants who think that they might have PD but are yet to receive a formal diagnosis, as nonmotor symptoms and subtle, nonspecific motor signs may appear before a formal PD diagnosis, which is often referred to as the prodromal phase of PD [<xref ref-type="bibr" rid="ref41">41</xref>]. For example, in the Rotterdam Study, it was found that among individuals who developed PD after a mean follow-up of 5.8 years, 71.8% had reported at least one early subjective motor symptom [<xref ref-type="bibr" rid="ref42">42</xref>]. For patients below 50 years, it typically takes over 2 years to receive an official PD diagnosis [<xref ref-type="bibr" rid="ref43">43</xref>]. Moreover, disparities in the health care system make it harder for people to access a diagnosis, and non-White Americans in the United States are half as likely to be diagnosed with PD [<xref ref-type="bibr" rid="ref44">44</xref>]. Additionally, in low-income and middle-income countries (ie, Kenya), a diagnosis of PD is often followed by a period of uncertainty where, sometimes, a diagnostic decision is reversed [<xref ref-type="bibr" rid="ref45">45</xref>].</p><p>However, participants who selected &#x201C;suspected PD&#x201D; did so based on their personal concerns or perceived symptoms and were not required to report or demonstrate clinically observable motor symptoms or provide official diagnosis documents during participation. Therefore, the &#x201C;suspected PD&#x201D; category may include individuals in the prodromal phase of PD, individuals with other motor or neurological conditions, or even individuals without any actual motor conditions.</p><p>Participants used a physical mouse on their desktop or laptop to trace a straight line, sine wave, and spiral wave on the website. We visualized their progress and alignment with the lines through highlighted portions and start or end markings. We developed the website using HTML and Bootstrap for the interface and visuals, and JavaScript to track cursor position every 500 ms. The data included mouse positions (x and y axes) and whether the mouse was inside the line (true or false). The web application also captured screen dimensions and operating system details for contextual information. Upon completing the test, all data were securely transmitted and stored in a Google Firebase collection.</p></sec><sec id="s2-3"><title>Feature Engineering and Mouse-Trace Image Generation</title><p>Based on the raw data collected, we engineered several features to quantify tracing performance across the 3 tracing tasks (straight line, sine wave, and spiral). These features include the following:</p><list list-type="bullet"><list-item><p><italic>Mean deviation from centerline (straight line only)</italic>: the average absolute vertical deviation of the traced points from the expected centerline, normalized by the screen height. The centerline is determined based on the screen height and adjusted to align with the web interface.</p></list-item><list-item><p><italic>Time taken (ms)</italic>: the total tracing time is approximated by multiplying the number of recorded points by the 500-ms sampling interval.</p></list-item><list-item><p><italic>Time taken with respect to window width (ms/pixel)</italic>: the total time, normalized by the screen width, is calculated as the total time divided by the window width. This metric accounts for variations in screen size among participants.</p></list-item><list-item><p><italic>Percentage of points traced inside the target</italic>: the proportion (from 0 to 1) of recorded points that fall inside the expected trace area.</p></list-item><list-item><p><italic>Raw count of points traced inside the target</italic>: simply the number of points recorded inside the expected trace area.</p></list-item></list><p>Using the features shown in <xref ref-type="table" rid="table1">Table 1</xref>, we quantified the consistency and accuracy of a participant&#x2019;s trace on each test pattern.</p><p>To generate mouse-trace images, we created canvases corresponding to each participant&#x2019;s screen dimensions. The recorded x and y coordinates were then used to render the trace, where segments starting with points inside the target region are colored green and those that fall outside are colored red. <xref ref-type="fig" rid="figure3">Figure 3</xref> illustrates the samples of these plots.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Engineered features extracted from mouse-trace data.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Feature name</td><td align="left" valign="bottom">Description</td><td align="left" valign="bottom">Applicable trace</td></tr></thead><tbody><tr><td align="left" valign="top">Mean deviation from centerline (fraction of screen height)</td><td align="left" valign="top">Average absolute vertical deviation from the expected centerline, normalized by the screen height</td><td align="left" valign="top">Straight line</td></tr><tr><td align="left" valign="top">Time taken (ms)</td><td align="left" valign="top">Total time estimated by multiplying the number of recorded points by 500 ms</td><td align="left" valign="top">All</td></tr><tr><td align="left" valign="top">Time taken with respect to window width (ms/pixel)</td><td align="left" valign="top">Total time divided by the window width. This normalizes the tracing duration to account for differences in screen dimensions</td><td align="left" valign="top">All</td></tr><tr><td align="left" valign="top">Percentage of points traced inside (as a fraction, 0-1)</td><td align="left" valign="top">Percentage of the number of points inside the expected trace region to the total number of points</td><td align="left" valign="top">All</td></tr><tr><td align="left" valign="top">Number of points traced inside</td><td align="left" valign="top">Count of points that are within the expected trace region, irrespective of timing</td><td align="left" valign="top">All</td></tr></tbody></table></table-wrap><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Samples of mouse-trace images produced: (A) Straight line; (B) Sine wave; (C) Spiral wave.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig03.png"/></fig></sec><sec id="s2-4"><title>Model Selection and Model Development</title><p>We developed three categories of deep-learning models, as shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>, each utilizing different input modalities, to better understand the individual and combined contributions of image and tabular mouse-trace data for PD classification. The first category of models focused on engineered tabular features, processed through a feed-forward neural network. We used this category to determine whether using purely engineered features can reliably classify patients diagnosed with PD. A feed-forward neural network was selected for consistency with the tabular data branch used later in the multimodal models. The second category of models comprised image-based models, where input images were passed through pretrained convolutional neural network (CNN)&#x2013;based architectures: Densely Connected Convolutional Network-201 (DenseNet-201), Residual Network-50 (ResNet-50), and Mobile Network v2 (MobileNet V2), and two transformer-based architectures: Vision Transformer (ViT) and Shifted Window Transformer (SwinT). CNN-based architectures (ie, DenseNet-201, ResNet-50, and MobileNet V2) excel at capturing edges and textures, which can help detect tremor-related discrepancies in the image trace. On the other hand, transformer-based architectures such as ViT use global self-attention, which can help capture the overall geometry of the traces. Additionally, SwinT uses hierarchical shifting-window attention, which can help capture both fine-grained patterns and the overall trace shape. Specifically, we used ViT-Base-Patch16-224 and swin_base_patch4_window7_224. Each of these models was selected based on their prior performance on different image-based tasks, as both CNN and transformer-based architectures have demonstrated tolerance to variations in scale, resolution, and local noise&#x2014;properties that are expected in remotely collected mouse-trace images generated from diverse hardware and screen configurations. Transfer learning was applied by unfreezing the final 45 layers of each network and by replacing the classification heads for training. The third category of models consisted of multimodal models, which integrated both data types. Tabular features were passed through a feed-forward neural network, while image inputs were processed via the same pretrained backbones used in the image-based models. The resulting feature representations were concatenated and passed through additional hidden layers for classification. All models were trained as binary classifiers for up to 50 epochs, with early stopping applied using a patience of 5. By structuring the models consistently across these categories, we aimed to isolate and analyze the impact of each data modality and understand how individual components contribute to the performance of the multimodal architectures.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Model architectures. (A) Tabular data models; (B) Image data models; (C) Multimodal models. DenseNet-201: Densely Connected Convolutional Network-201; MobileNet V2: Mobile Network v2; ResNet-50: Residual Network-50; SwinT: Shifted Window Transformer; ViT: Vision Transformer.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig04.png"/></fig></sec><sec id="s2-5"><title>Data Splitting and Hyperparameter Tuning</title><p>We evaluated model performance across 3 experimental settings, with 1 primary experiment and 2 secondary analyses, designed to reflect different levels of diagnostic certainty and real-world deployment scenarios. The primary experiment focuses on assessing the feasibility of training models on patients who self-reported suspected PD and predicting diagnosed PD.</p><p>In the primary experiment, models were trained on participants with suspected PD and 60% of non-PD data and evaluated on all PD cases and the remaining 40% of non-PD samples, split equally into a test set and a validation set. This experiment directly addresses the central research objective by assessing whether models trained on low-specificity, community-recruited labels can generalize to predict diagnosed PD. To mitigate variability caused by nondeterministic behavior observed in some of our image-based and multimodal models, final performance was estimated by averaging results across 20 independently trained models, with average performance reported using 500 bootstrap resamples in each run. Model hyperparameters were tuned using Optuna [<xref ref-type="bibr" rid="ref46">46</xref>] over 30 trials.</p><p>In a secondary analysis, models were trained on all participants with self-reported PD and 60% of the samples without PD and evaluated on participants with suspected PD combined with the remaining 40% of non-PD data. This analysis was designed to assess whether models trained on patients diagnosed with PD can generalize to individuals with uncertain or emerging motor symptoms. Hyperparameters were tuned using Optuna over 30 trials, and final performance was estimated by averaging results across 20 independently trained models, each evaluated using 500 bootstrap resamples. This analysis is not part of the primary study objective and is included only to assess whether the learned signal is bidirectional.</p><p>In the cross-validation analysis, we included only participants labeled as either self-reported PD or non-PD, explicitly excluding those marked as suspected PD. Models were trained and evaluated using 5-fold cross-validation. Within each fold, hyperparameters were tuned using Optuna across 10 trials, and performance was estimated using 500 bootstrapped resamples per fold. We repeated each fold 10 times with independently initialized models, reporting average performance across runs. This experiment established a baseline for distinguishing controls with PD from controls without PD using stronger supervisory labels.</p><p>Bootstrapping across the different experiments was used to estimate variability and model stability under resampling. However, these approaches do not increase the amount of independent data and therefore do not fully capture uncertainty arising from the limited dataset size.</p></sec><sec id="s2-6"><title>Evaluation Metrics</title><p>To evaluate model performance, we used 4 commonly used classification metrics: sensitivity, specificity, accuracy, and <italic>F</italic><sub>1</sub>-score. These metrics were calculated using the confusion matrix derived from model predictions, consisting of the following:</p><list list-type="bullet"><list-item><p>True positives: cases correctly predicted as positive</p></list-item><list-item><p>True negatives: cases correctly predicted as negative</p></list-item><list-item><p>False positives: negative cases incorrectly predicted as positive</p></list-item><list-item><p>False negatives: positive cases incorrectly predicted as negative</p></list-item></list><p>From these values, we calculated the following metrics:</p><list list-type="bullet"><list-item><p>Sensitivity, the proportion of actual positive cases correctly identified, is defined as <inline-formula><mml:math id="ieqn1"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mtext>sensitivity</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>.</p></list-item><list-item><p>Specificity, the proportion of actual negative cases correctly classified, is defined as&#x202F;<inline-formula><mml:math id="ieqn2"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mtext>specificity</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>.</p></list-item><list-item><p>Accuracy, the overall proportion of correctly classified cases across both classes, is calculated as &#x202F;<inline-formula><mml:math id="ieqn3"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mtext>accuracy</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>.</p></list-item><list-item><p>The <italic>F</italic><sub>1</sub>-score, the harmonic mean of precision and recall, is particularly useful for imbalanced class distributions. The <italic>F</italic><sub>1</sub>-score is computed as&#x202F;<inline-formula><mml:math id="ieqn4"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mrow><mml:msub><mml:mi>F</mml:mi><mml:mn>1</mml:mn></mml:msub></mml:mrow><mml:mtext>-score</mml:mtext><mml:mo>=</mml:mo><mml:mn>2</mml:mn><mml:mo>&#x00D7;</mml:mo><mml:mfrac><mml:mrow><mml:mtext>Precision</mml:mtext><mml:mo>&#x00D7;</mml:mo><mml:mtext>Recall</mml:mtext></mml:mrow><mml:mrow><mml:mtext>Precision</mml:mtext><mml:mo>+</mml:mo><mml:mtext>Recall</mml:mtext></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>, where  <inline-formula><mml:math id="ieqn5"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mtext>precision</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula> and <inline-formula><mml:math id="ieqn6"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mtext>recall</mml:mtext><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">P</mml:mi></mml:mrow><mml:mo>+</mml:mo><mml:mrow><mml:mi mathvariant="normal">F</mml:mi><mml:mi mathvariant="normal">N</mml:mi></mml:mrow></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula>.</p></list-item></list><p>Each of these metrics was estimated using 500 bootstrapped resamples to compute both the mean and SD, providing a robust measure of model stability and generalizability. We used the mean <italic>F</italic><sub>1</sub>-score as the base metric to select the best performing models from our analysis. All metric values that we presented included the mean and SD of the metrics.</p></sec><sec id="s2-7"><title>Saliency Map and Feature Importance</title><p>To identify important features for the best performing model architectures, we created GradSHAP (Gradient Shapley Additive Explanations) saliency plots, as GradSHAP is optimized for identifying complex feature importances in deep-learning models [<xref ref-type="bibr" rid="ref47">47</xref>]. GradSHAP was applied to both the image and engineered tabular inputs to quantify their respective contributions to the model&#x2019;s predictions. For the image modality, attributions were computed separately for the sine, straight, and spiral images by comparing the model&#x2019;s output on actual inputs and shuffled versions of the same batch, used as baselines. Attribution values were summed across spatial dimensions to yield a single importance score for each image input. Importantly, the sign of each attribution was preserved to indicate the direction of influence: positive values reflect contributions toward a PD or suspected PD prediction, while negative values indicate support for a non-PD classification.</p></sec><sec id="s2-8"><title>Ethical Considerations</title><p>Our study was approved by the University of Hawaii Institutional Review Board (protocol 2022&#x2010;00857). We collected informed consent forms from all participants at the start of data collection on the website. All data used in this analysis were anonymized by default, as the assessment data did not include any personal information.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Dataset</title><p>We had 261 participants with completed attempts for the mouse-trace section of the website. Among the 261 participants, 73 self-reported as having PD, 155 as non-PD, and the remaining 33 as suspected PD. Attempts with data available for all 3 mouse-trace tasks, irrespective of the age group, were included. The characteristics of the collected data are shown in <xref ref-type="fig" rid="figure5">Figure 5</xref> and <xref ref-type="table" rid="table2">Table 2</xref>.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Participant distribution among the different classes: (A) Parkinson disease (PD), non-PD, and suspected PD, stratified by (B) device type, (C) dominant hand, and (D) age.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig05.png"/></fig><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Participant distribution among the different classes (Parkinson disease [PD], non-PD, and suspected PD) for age, dominant hand, and device type.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">Participants</td><td align="left" valign="bottom">PD</td><td align="left" valign="bottom">Non-PD</td><td align="left" valign="bottom">Suspected PD</td></tr></thead><tbody><tr><td align="left" valign="top">Age (y)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>23&#x2010;49</td><td align="left" valign="top">16</td><td align="left" valign="top">9</td><td align="left" valign="top">2</td><td align="left" valign="top">5</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>50&#x2010;59</td><td align="left" valign="top">113</td><td align="left" valign="top">15</td><td align="left" valign="top">97</td><td align="left" valign="top">1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>60&#x2010;69</td><td align="left" valign="top">126</td><td align="left" valign="top">46</td><td align="left" valign="top">53</td><td align="left" valign="top">27</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>70+</td><td align="left" valign="top">6</td><td align="left" valign="top">3</td><td align="left" valign="top">3</td><td align="left" valign="top">0</td></tr><tr><td align="left" valign="top">Dominant hand</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Right</td><td align="left" valign="top">185</td><td align="left" valign="top">55</td><td align="left" valign="top">99</td><td align="left" valign="top">31</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Left</td><td align="left" valign="top">76</td><td align="left" valign="top">18</td><td align="left" valign="top">56</td><td align="left" valign="top">2</td></tr><tr><td align="left" valign="top">Device type</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Windows</td><td align="left" valign="top">208</td><td align="left" valign="top">44</td><td align="left" valign="top">145</td><td align="left" valign="top">19</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mac</td><td align="left" valign="top">42</td><td align="left" valign="top">28</td><td align="left" valign="top">7</td><td align="left" valign="top">7</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Linux</td><td align="left" valign="top">11</td><td align="left" valign="top">1</td><td align="left" valign="top">3</td><td align="left" valign="top">7</td></tr><tr><td align="left" valign="top">Total</td><td align="left" valign="top">261</td><td align="left" valign="top">73</td><td align="left" valign="top">155</td><td align="left" valign="top">33</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>Performance Metrics</title><sec id="s3-2-1"><title>Primary Experiment: Training on Suspected PD vs Non-PD and Testing on PD vs Non-PD</title><p>In our primary experiment, where models trained on suspected PD and non-PD data were tested on patients diagnosed with PD and without PD, the multimodal ViT model performed best, achieving a mean <italic>F</italic><sub>1</sub>-score of 0.7619 (SD 0.0535) with balanced performance (accuracy: mean 0.7663, SD 0.0500; sensitivity: mean 0.5961, SD 0.0859; specificity: mean 0.9694, SD 0.0319). Overall, the performance improved as we moved from tabular to image data: the feed-forward neural network (<italic>F</italic><sub>1</sub>-score: mean 0.1022, SD 0.0654) achieved only 0.0551 (SD 0.0369) in sensitivity but 1.0000 (SD 0.0000) in specificity, indicating severe overfitting due to class imbalance. Looking at image-based models, ResNet-50 led the group (<italic>F</italic><sub>1</sub>: mean 0.7119, SD 0.0529; accuracy: mean 0.7236, SD 0.0455; sensitivity: mean 0.4921, SD 0.0836; specificity: mean 1.0000, SD 0.0000), while DenseNet-201 and MobileNet V2 performed more poorly (DenseNet-201 <italic>F</italic><sub>1</sub>: mean 0.5958, SD 0.0062; MobileNet V2 <italic>F</italic><sub>1</sub>: mean 0.6059, SD 0.0216). Adding engineered features to the image backbones produced mixed results for the <italic>F</italic><sub>1</sub>-score: ViT&#x2019;s <italic>F</italic><sub>1</sub>-score jumped from 0.4263 (SD 0.1504) to 0.7619 (SD 0.0535) and MobileNet V2 went from 0.6059 (SD 0.0216) to 0.6611 (SD 0.0549), but the <italic>F</italic><sub>1</sub>-score for DenseNet201, SwinT, and ResNet-50 actually dropped (DenseNet-201: from 0.5958, SD 0.0062 to 0.5383, SD 0.0553; SwinT: from 0.5026, SD 0.1076 to 0.3998, SD 0.0792; and ResNet-50: from 0.7119, SD 0.0529 to 0.4970, SD 0.0563). These results suggest that models trained on suspected PD samples can generalize to actual self-reported cases better than chance and that multimodal fusion provides meaningful gains for some backbones but not all. Complete performance metrics for this split are shown in <xref ref-type="table" rid="table3">Table 3</xref> and <xref ref-type="fig" rid="figure6">Figure 6A</xref>.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>The performance metrics for all models trained on suspected Parkinson disease (PD) and non-PD data, tested on PD and non-PD data with 500 bootstrap resampling.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Data type and model</td><td align="left" valign="bottom">Accuracy, mean (SD)</td><td align="left" valign="bottom">Sensitivity, mean (SD)</td><td align="left" valign="bottom">Specificity, mean (SD)</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>, mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top">Multimodal</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ViT<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="top">0.7663 (0.0500)</td><td align="left" valign="top">0.5961 (0.0859)</td><td align="left" valign="top">0.9694 (0.0319)</td><td align="left" valign="top">0.7619 (0.0535)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SwinT<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup></td><td align="left" valign="top">0.5023 (0.0477)</td><td align="left" valign="top">0.0934 (0.0960)</td><td align="left" valign="top">0.9902 (0.0182)</td><td align="left" valign="top">0.3998 (0.0792)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DenseNet-201<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup></td><td align="left" valign="top">0.5886 (0.0383)</td><td align="left" valign="top">0.2438 (0.0703)</td><td align="left" valign="top">1.0000 (0.0000)</td><td align="left" valign="top">0.5383 (0.0553)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ResNet-50<sup><xref ref-type="table-fn" rid="table3fn4">d</xref></sup></td><td align="left" valign="top">0.5610 (0.0365)</td><td align="left" valign="top">0.1931 (0.0671)</td><td align="left" valign="top">1.0000 (0.0000)</td><td align="left" valign="top">0.4970 (0.0563)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MobileNet V2<sup><xref ref-type="table-fn" rid="table3fn5">e</xref></sup></td><td align="left" valign="top">0.6752 (0.0444)</td><td align="left" valign="top">0.4778 (0.1149)</td><td align="left" valign="top">0.9108 (0.0985)</td><td align="left" valign="top">0.6611 (0.0549)</td></tr><tr><td align="left" valign="top">Images</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ViT</td><td align="left" valign="top">0.5415 (0.1018)</td><td align="left" valign="top">0.3599 (0.4091)</td><td align="left" valign="top">0.7582 (0.4094)</td><td align="left" valign="top">0.4263 (0.1504)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SwinT</td><td align="left" valign="top">0.5686 (0.0702)</td><td align="left" valign="top">0.3816 (0.3403)</td><td align="left" valign="top">0.7919 (0.2737)</td><td align="left" valign="top">0.5026 (0.1076)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DenseNet-201</td><td align="left" valign="top">0.6199 (0.0049)</td><td align="left" valign="top">0.3544 (0.0089)</td><td align="left" valign="top">0.9369 (0.0000)</td><td align="left" valign="top">0.5958 (0.0062)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ResNet-50</td><td align="left" valign="top">0.7236 (0.0455)</td><td align="left" valign="top">0.4921 (0.0836)</td><td align="left" valign="top">1.0000 (0.0000)</td><td align="left" valign="top">0.7119 (0.0529)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MobileNet V2</td><td align="left" valign="top">0.6330 (0.0159)</td><td align="left" valign="top">0.3510 (0.0292)</td><td align="left" valign="top">0.9695 (0.0000)</td><td align="left" valign="top">0.6059 (0.0216)</td></tr><tr><td align="left" valign="top">Engineered features</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FFNN<sup><xref ref-type="table-fn" rid="table3fn6">f</xref></sup></td><td align="left" valign="top">0.4859 (0.0201)</td><td align="left" valign="top">0.0551 (0.0369)</td><td align="left" valign="top">1.0000 (0.0000)</td><td align="left" valign="top">0.1022 (0.0654)</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>ViT: Vision Transformer.</p></fn><fn id="table3fn2"><p><sup>b</sup>SwinT: Shifted Window Transformer.</p></fn><fn id="table3fn3"><p><sup>c</sup>DenseNet-201: Densely Connected Convolutional Network-201.</p></fn><fn id="table3fn4"><p><sup>d</sup>ResNet-50: Residual Network-50.</p></fn><fn id="table3fn5"><p><sup>e</sup>MobileNet V2: Mobile Network v2.</p></fn><fn id="table3fn6"><p><sup>f</sup>FFNN: feed-forward neural network.</p></fn></table-wrap-foot></table-wrap><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Key performance metrics (<italic>F</italic><sub>1</sub>-score, sensitivity, and specificity) for all models. (A) Trained on suspected Parkinson disease (PD) versus non-PD and tested on PD versus non-PD data evaluated with 500 bootstraps resampling. (B) Trained on PD versus non-PD and tested on suspected PD versus non-PD data. (C) Trained and tested on PD versus non-PD data (on 5-fold cross-validation). The error bars represent SD values. DenseNet: densely connected convolutional network; FFNN: feed-forward neural network; MobileNet: Mobile Network; ResNet: Residual Network; SwinT: Shifted Window Transformer; ViT: Vision Transformer.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig06.png"/></fig></sec><sec id="s3-2-2"><title>Secondary Analysis: Training on PD vs Non-PD, Testing on Suspected PD vs Non-PD</title><p>In one of our secondary analyses, models were trained on PD and non-PD data and tested on suspected PD and non-PD data. The multimodal ResNet-50 model achieved the highest <italic>F</italic><sub>1</sub>-score (mean 0.9353, SD 0.0334), with balanced sensitivity (mean 1.0000, SD 0.0000) and specificity (mean 0.9045, SD 0.0506). The feed-forward neural network using only engineered features scored a mean <italic>F</italic><sub>1</sub> of 0.8523 (SD 0.0488; accuracy: mean 0.8746, SD 0.0474; sensitivity: mean 1.0000, SD 0.0000; specificity: mean 0.8058, SD 0.0734), showing that tabular data alone still carry useful signals but may not match multimodal models in this case. Among the image-based models, MobileNet V2 was the best, with a mean <italic>F</italic><sub>1</sub>-score of 0.8359 (SD 0.0560; accuracy: mean 0.8575, SD 0.0470; sensitivity: mean 0.7118, SD 0.1058; specificity: mean 0.9375, SD 0.0443). DenseNet-201 followed with mean <italic>F</italic><sub>1</sub> of 0.6809 (SD 0.0073; accuracy: mean 0.7507, SD 0.0043; sensitivity: mean 0.4137, SD 0.0122; specificity: mean 0.9355, SD 0.0000), while SwinT and ViT trailed (SwinT <italic>F</italic><sub>1</sub>: mean 0.5588, SD 0.2272; ViT <italic>F</italic><sub>1</sub>: mean 0.5467, SD 0.2659). Notably, ResNet-50 trained on images failed to detect any positives (sensitivity: mean 0.0000, SD 0.0000) and scored mean <italic>F</italic><sub>1</sub> of 0.3769 (SD 0.0108). Adding engineered features with image inputs produced positive effects for the <italic>F</italic><sub>1</sub>-score: ResNet-50 jumped from mean 0.3769 (SD 0.0108) to mean 0.9353 (SD 0.0334); DenseNet-201 jumped from mean 0.6809 (SD 0.0073) to mean 0.8712 (SD 0.0472); SwinT jumped from mean 0.5588 (SD 0.2272) to mean 0.8697 (SD 0.0380); and ViT went from mean 0.5467 (SD 0.2659) to mean 0.6726 (SD 0.2242). By contrast, the <italic>F</italic><sub>1</sub>-score of MobileNet V2 dipped from mean 0.8359 (SD 0.0560) to mean 0.7523 (SD 0.1336). These results indicate that while detecting early or ambiguous motor patterns in suspected PD, multimodal fusion can improve robustness and performance balance. Complete performance metrics for this split are shown in <xref ref-type="table" rid="table4">Table 4</xref>, and comparisons of <italic>F</italic><sub>1</sub>-score, sensitivity, and specificity are visualized in <xref ref-type="fig" rid="figure6">Figure 6B</xref>.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>The performance metrics for models trained on Parkinson disease (PD) and non-PD data, tested on suspected PD and non-PD data with 500 bootstrap resampling.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Data type and model</td><td align="left" valign="bottom">Accuracy, mean (SD)</td><td align="left" valign="bottom">Sensitivity, mean (SD)</td><td align="left" valign="bottom">Specificity, mean (SD)</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>, mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top">Multimodal</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ViT<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">0.7414 (0.1585)</td><td align="left" valign="top">0.6370 (0.3958)</td><td align="left" valign="top">0.7986 (0.2211)</td><td align="left" valign="top">0.6726 (0.2242)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SwinT<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="top">0.8782 (0.0369)</td><td align="left" valign="top">0.8801 (0.0501)</td><td align="left" valign="top">0.8771 (0.0528)</td><td align="left" valign="top">0.8697 (0.0380)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DenseNet-201<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">0.8768 (0.0465)</td><td align="left" valign="top">0.9371 (0.0561)</td><td align="left" valign="top">0.8438 (0.0645)</td><td align="left" valign="top">0.8712 (0.0472)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ResNet-50<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="top">0.9383 (0.0327)</td><td align="left" valign="top">1.0000 (0.0000)</td><td align="left" valign="top">0.9045 (0.0506)</td><td align="left" valign="top">0.9353 (0.0334)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MobileNet V2<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="top">0.8145 (0.0747)</td><td align="left" valign="top">0.5285 (0.2227)</td><td align="left" valign="top">0.9713 (0.0138)</td><td align="left" valign="top">0.7523 (0.1336)</td></tr><tr><td align="left" valign="top">Images</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ViT</td><td align="left" valign="top">0.6135 (0.2308)</td><td align="left" valign="top">0.7422 (0.3615)</td><td align="left" valign="top">0.5430 (0.4047)</td><td align="left" valign="top">0.5467 (0.2659)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SwinT</td><td align="left" valign="top">0.7263 (0.1106)</td><td align="left" valign="top">0.3119 (0.4256)</td><td align="left" valign="top">0.9535 (0.0675)</td><td align="left" valign="top">0.5588 (0.2272)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DenseNet-201</td><td align="left" valign="top">0.7507 (0.0043)</td><td align="left" valign="top">0.4137 (0.0122)</td><td align="left" valign="top">0.9355 (0.0000)</td><td align="left" valign="top">0.6809 (0.0073)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ResNet-50</td><td align="left" valign="top">0.6054 (0.0274)</td><td align="left" valign="top">0.0000 (0.0000)</td><td align="left" valign="top">0.9374 (0.0424)</td><td align="left" valign="top">0.3769 (0.0108)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MobileNet V2</td><td align="left" valign="top">0.8575 (0.0470)</td><td align="left" valign="top">0.7118 (0.1058)</td><td align="left" valign="top">0.9375 (0.0443)</td><td align="left" valign="top">0.8359 (0.0560)</td></tr><tr><td align="left" valign="top">Engineered features</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FFNN<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">0.8746 (0.0474)</td><td align="left" valign="top">1.0000 (0.0000)</td><td align="left" valign="top">0.8058 (0.0734)</td><td align="left" valign="top">0.8523 (0.0488)</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>ViT: Vision Transformer.</p></fn><fn id="table4fn2"><p><sup>b</sup>SwinT: Shifted Window Transformer.</p></fn><fn id="table4fn3"><p><sup>c</sup>DenseNet-201: Densely Connected Convolutional Network-201.</p></fn><fn id="table4fn4"><p><sup>d</sup>ResNet-50: Residual Network-50.</p></fn><fn id="table4fn5"><p><sup>e</sup>MobileNet V2: Mobile Network v2.</p></fn><fn id="table4fn6"><p><sup>f</sup>FFNN: feed-forward neural network.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2-3"><title>Cross-Validation Analysis: 5-Fold Cross-Validation Predicting PD vs Non-PD</title><p>We also conducted a cross-validation analysis using PD and non-PD data for both training and testing via 5-fold cross-validation. The image-based DenseNet-201 model achieved the highest <italic>F</italic><sub>1</sub>-score (mean 0.9027, SD 0.0332), alongside an accuracy of 0.9179 (SD 0.0288), a sensitivity of 0.8360 (SD 0.0713), and a specificity of 0.9557 (SD 0.0327). Overall, the pretrained CNNs (ResNet-50 <italic>F</italic><sub>1</sub>: mean 0.8986, SD 0.0413; MobileNet V2 <italic>F</italic><sub>1</sub>: mean 0.8355, SD 0.0410; and DenseNet-201 <italic>F</italic><sub>1</sub>: mean 0.9027, SD 0.0332) outperformed both transformer-based image models (ViT <italic>F</italic><sub>1</sub>: mean 0.7900, SD 0.0789; SwinT <italic>F</italic><sub>1</sub>: mean 0.7819, SD 0.0774) and the feed-forward neural network using only engineered features (<italic>F</italic><sub>1</sub>: mean 0.5558, SD 0.1161), which showed high specificity (mean 0.8993, SD 0.0419) but low sensitivity (mean 0.4955, SD 0.1583). When tabular features were added to the image data, multimodal SwinT led to a negligibly small <italic>F</italic><sub>1</sub> gain (around +0.0071). By contrast, all other multimodal models experienced <italic>F</italic><sub>1</sub> drops of approximately 0.001 to 0.0785. These results suggest that while image-based CNNs capture the majority of diagnostic signals from mouse-trace images, the marginal benefit of integrating engineered features is almost nonexistent for most of the architectures. Complete performance metrics for this split are provided in <xref ref-type="table" rid="table5">Table 5</xref> and <xref ref-type="fig" rid="figure6">Figure 6C</xref>.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>The performance metrics for models trained and tested on Parkinson disease (PD) and non-PD data, evaluated using 5-fold cross-validation with 500 bootstrap resampling.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Data type and model</td><td align="left" valign="bottom">Accuracy, mean (SD)</td><td align="left" valign="bottom">Sensitivity, mean (SD)</td><td align="left" valign="bottom">Specificity, mean (SD)</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>, mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top">Multimodal</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ViT<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup></td><td align="left" valign="top">0.8255 (0.0529)</td><td align="left" valign="top">0.7730 (0.1422)</td><td align="left" valign="top">0.8488 (0.0566)</td><td align="left" valign="top">0.7883 (0.0757)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SwinT<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup></td><td align="left" valign="top">0.8263 (0.0608)</td><td align="left" valign="top">0.6949 (0.1847)</td><td align="left" valign="top">0.8891 (0.0595)</td><td align="left" valign="top">0.7890 (0.0822)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DenseNet-201<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup></td><td align="left" valign="top">0.8654 (0.0638)</td><td align="left" valign="top">0.6809 (0.2060)</td><td align="left" valign="top">0.9507 (0.0134)</td><td align="left" valign="top">0.8242 (0.0968)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ResNet-50<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup></td><td align="left" valign="top">0.8727 (0.0260)</td><td align="left" valign="top">0.7547 (0.0905)</td><td align="left" valign="top">0.9286 (0.0266)</td><td align="left" valign="top">0.8476 (0.0341)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MobileNet V2<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup></td><td align="left" valign="top">0.8566 (0.0367)</td><td align="left" valign="top">0.7492 (0.1275)</td><td align="left" valign="top">0.9071 (0.0175)</td><td align="left" valign="top">0.8294 (0.0513)</td></tr><tr><td align="left" valign="top">Images</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ViT</td><td align="left" valign="top">0.8366 (0.0545)</td><td align="left" valign="top">0.7290 (0.1128)</td><td align="left" valign="top">0.8875 (0.0619)</td><td align="left" valign="top">0.7900 (0.0789)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>SwinT</td><td align="left" valign="top">0.8404 (0.0421)</td><td align="left" valign="top">0.6352 (0.1230)</td><td align="left" valign="top">0.9379 (0.0270)</td><td align="left" valign="top">0.7819 (0.0774)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>DenseNet-201</td><td align="left" valign="top">0.9179 (0.0288)</td><td align="left" valign="top">0.8360 (0.0713)</td><td align="left" valign="top">0.9557 (0.0327)</td><td align="left" valign="top">0.9027 (0.0332)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ResNet-50</td><td align="left" valign="top">0.9141 (0.0329)</td><td align="left" valign="top">0.8430 (0.0917)</td><td align="left" valign="top">0.9484 (0.0168)</td><td align="left" valign="top">0.8986 (0.0413)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>MobileNet V2</td><td align="left" valign="top">0.8629 (0.0319)</td><td align="left" valign="top">0.7359 (0.0865)</td><td align="left" valign="top">0.9220 (0.0183)</td><td align="left" valign="top">0.8355 (0.0410)</td></tr><tr><td align="left" valign="top">Engineered features</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>FFNN<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">0.7689 (0.0432)</td><td align="left" valign="top">0.4955 (0.1583)</td><td align="left" valign="top">0.8993 (0.0419)</td><td align="left" valign="top">0.5558 (0.1161)</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>ViT: Vision Transformer.</p></fn><fn id="table5fn2"><p><sup>b</sup>SwinT: Shifted Window Transformer.</p></fn><fn id="table5fn3"><p><sup>c</sup>DenseNet-201: Densely Connected Convolutional Network-201.</p></fn><fn id="table5fn4"><p><sup>d</sup>ResNet-50: Residual Network-50.</p></fn><fn id="table5fn5"><p><sup>e</sup>MobileNet V2: Mobile Network v2.</p></fn><fn id="table5fn6"><p><sup>f</sup>FFNN: feed-forward neural network.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s3-3"><title>Feature Importance Analysis of Multimodal Models</title><p>We selected the best-performing models from each experimental setting based on the highest mean <italic>F</italic><sub>1</sub>-scores achieved across runs. In the primary experiment, the multimodal ViT achieved the best performance, and in the secondary analysis, the multimodal ResNet-50 performed best. In the cross-validation analysis, the image-based DenseNet-201 model achieved the highest performance.</p><p>We conducted GradSHAP-based feature importance analysis on the 2 multimodal models from the primary experiment and the secondary analysis to better understand the relative contributions of image and engineered features. We did not perform the feature importance analysis on the image-based DenseNet-201 model, as such an analysis would provide limited additional insight: with no tabular features present, the dominance of image inputs is expected and not subject to comparison. Our goal was to explore how much influence tabular features or image features have in a multimodal setting and whether models rely solely on image inputs or leverage both data types.</p><p><xref ref-type="fig" rid="figure7">Figure 7</xref> depicts the feature importance analysis for the multimodal ViT model trained on suspected PD versus non-PD and tested on PD versus non-PD. We found that the model relied heavily on the images for prediction. However, in this case, the engineered features, especially the time required to trace the patterns, exhibited high SHAP (Shapley Additive Explanations) values. The height and width of the screen used by the participant also exhibited relatively high SHAP values.</p><p><xref ref-type="fig" rid="figure8">Figure 8</xref> depicts the feature importance analysis for the multimodal ResNet-50 model trained on PD versus non-PD and tested on suspected PD versus non-PD. We found that the model relied predominantly on image features for prediction, with the spiral, sine, and straight line images showing the highest SHAP values. Among the engineered features, only the time taken to trace the spiral and sine waves, as well as the straight line, exhibited significant SHAP values, while the rest of the tabular features had a negligible impact.</p><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Interpretability analysis of the multimodal Vision Transformer (ViT) model for the patients with self-reported Parkinson disease (PD) and without PD (trained on suspected PD and non-PD). (The x-axis range is set to [&#x2212;2, 2] in the figure for better comparison, and the outlier GradSHAP [Gradient Shapley Additive Explanations] values are removed from the figure.)</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig07.png"/></fig><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Interpretability analysis of the multimodal ResNet-50 (Residual Network-50) model for the patients with self-reported suspected Parkinson disease (PD) and without PD (trained on PD and non-PD). (The x-axis range is set to [&#x2212;4, 4] in the figure for better comparison, and the outlier GradSHAP [Gradient Shapley Additive Explanations] values are removed from the figure.)</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v10i1e81368_fig08.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Results</title><p>We sought to study the feasibility of training models using weak labels of &#x201C;suspected PD&#x201D; to predict confirmed PD in a community-recruited sample. We evaluated model performance using 1 primary experiment and 2 secondary analyses, each reflecting different assumptions about diagnostic certainty and real-world deployment scenarios. The primary experiment involved training models on participants with suspected PD and without PD and evaluating them on patients with self-reported PD and without PD, reflecting a real-world use case in which models trained on low-specificity, community-recruited labels are applied to identify diagnosed PD. We found that training models on patients with suspected PD yielded moderate yet meaningful performance in predicting patients with self-reported PD. These preliminary findings support the feasibility of leveraging community-recruited, low-specificity labels to learn patterns that generalize to predicting diagnosed PD. This suggests that, even in the presence of diagnostic uncertainty in labels, suspected PD data can possibly retain signals relevant to motor symptoms that may still be useful for developing scalable screening tools in global health contexts. However, we emphasize that this claim needs to be supported by future work involving participants with clinically confirmed diagnoses.</p><p>We also found that images derived from spiral, sine, and straight line tracing were the dominant contributors to model predictions for the multimodal models. Tabular features such as tracing time showed modest attribution in the ResNet-50 (secondary analysis), while showing much higher influence in ViT (primary analysis with suspected PD). Device-related features (screen height and width) played a minimal to nonexistent role. In the ViT model trained on patients with suspected PD, the increased influence of engineered features suggests that engineered data can complement visual patterns when used to train models to identify real patients with PD.</p></sec><sec id="s4-2"><title>Comparison to Previous Works</title><p>To the best of our knowledge, we conducted the first pilot feasibility study to assess whether lower-specificity weak labels of &#x201C;suspected PD&#x201D; can enable artificial intelligence models to learn useful motor signatures related to PD. From a computational methods perspective, our study also expands upon previous research by introducing an approach relying exclusively on mouse-trace data and images produced from a brief online test for PD classification through the use of deep-learning models. Unlike prior methods that have explored hand and finger movements, keyboard typing patterns, keystroke dynamics, speech analysis, handwriting, drawing tests, and sensor data from accelerometers, gyroscopes, and smartphone interactions, we specifically focus on the remote collection of mouse-tracing data, and our experiments demonstrate the potential of mouse-trace data collected from a heterogeneous array of devices to provide predictive power in classifying PD.</p><p>Previous studies by Gil-Martin et al [<xref ref-type="bibr" rid="ref48">48</xref>] and Pereira et al [<xref ref-type="bibr" rid="ref49">49</xref>] focused on hand movement dynamics from spiral, meander, and other drawing shapes for PD analysis. However, their data collection was not conducted remotely, and they did not consider handedness, unlike our study. Their best models achieved accuracies of 97.7% and 83.77%, respectively. Goel et al [<xref ref-type="bibr" rid="ref50">50</xref>] used pen-and-paper methods to collect spiral pattern data but also lacked remote testing and consideration of handedness, achieving an accuracy of 87.36%. Memedi et al [<xref ref-type="bibr" rid="ref51">51</xref>] used a remote data collection method involving a touchscreen tablet and web interface, but their study spanned 3 years and involved only 65 participants, resulting in an accuracy of around 84%. Wang et al [<xref ref-type="bibr" rid="ref52">52</xref>] achieved 96.2% accuracy using the data collected during the drawing of &#x03A0; and &#x03A0;&#x039B; shapes. However, their data collection method involved an iPad and stylus and was not conducted remotely. The classification model suggested by Gajos et al [<xref ref-type="bibr" rid="ref53">53</xref>] detected ataxia or parkinsonism with high sensitivity (0.91) and specificity (0.90) but included only 46 patients with PD in their dataset with 22,946 controls.</p><p>These studies served as important and inspirational foundational literature that we aimed to build upon. The results from most prior works were obtained under controlled conditions with specialized hardware; however, our remote approach trades some performance for scalability.</p><p>A previous pilot study of ours [<xref ref-type="bibr" rid="ref54">54</xref>], which explored the feasibility of an earlier version of our web application on a much smaller participant sample, achieved an accuracy of 74.29% and an <italic>F</italic><sub>1</sub>-score of 73.11% using classical machine-learning models. This work used both keyboard and mouse-trace data as engineered features and did not include patients with suspected PD in the data collection process. Our current models show marked improvements in performance compared to this prior pilot study, possibly due to either our novel machine-learning approach presented here or the significantly expanded dataset size.</p></sec><sec id="s4-3"><title>Clinical Implications and Further Validation</title><p>Our findings support 2 key observations. First, despite label noise, models trained using patients with &#x201C;suspected PD&#x201D; may retain sufficient motor signals to enable the meaningful prediction of diagnosed PD, supporting the feasibility of using community-recruited, low-specificity data for model development. Second, motor patterns observed in individuals with suspected PD share detectable similarities with those diagnosed with PD, allowing the models to generalize even when diagnostic certainty is low. However, several key validation steps are required to fully validate this approach, including evaluation using clinically confirmed prodromal PD cohorts and the inclusion of other related motor disorders for a more rigorous assessment of model specificity (ie, whether the models are actually identifying PD or reporting noise caused by motor dysfunctions). Ultimately, our findings should be interpreted as preliminary feasibility evidence to support further, larger-scale investigation.</p></sec><sec id="s4-4"><title>Limitations and Future Work</title><p>As a pilot feasibility study, this work has several limitations that should be considered in future research. First, the sample size of 261, split into 3 diagnostic categories, may not be sufficient to generalize the findings across a diverse population and heterogeneous disease stages. This limitation is particularly relevant for the suspected PD group, which contained only 33 participants. Although we tried to mitigate this through repeated training runs and evaluation across multiple splits, small sample sizes can still affect model generalizability and may have been the reason behind the occasional appearance of extreme values for sensitivity and specificity. Moreover, this small sample size for the suspected PD group limits the statistical power and generalizability of our findings. In the future, we plan to prioritize expanding recruitment and validating these findings in larger and more diverse cohorts. Moreover, while we performed hyperparameter tuning for each model, further optimization, especially regarding model architecture and data fusion strategies, could improve performance and generalization. Some models, particularly those involving image-based and multimodal inputs, exhibited nondeterministic behavior. These models produced variable results across repeated training runs on identical data splits, likely due to the stochastic nature of deep learning, their sensitivity to complex, high-dimensional input spaces, and resampling on the small sample sizes. This reinforces the importance of repeated experimentation and performance averaging in evaluating model robustness. We used a fixed sampling rate of 500 ms to store mouse positions on screen, resulting in some data points with only one time step represented. While we retained those data in this study, future work should explore more granular sampling rates (eg, 50/100 ms) and stricter exclusion criteria.</p><p>Notably, a key limitation of this study is that the &#x201C;suspected PD&#x201D; category was based solely on self-report and did not require clinical verification. Consequently, this group is heterogeneous and may include individuals with health anxiety, age-related motor conditions, or non-PD neurodegenerative disorders. Future work should incorporate longitudinal follow-up or clinician-verified diagnoses to better characterize which patients with suspected PD progress to PD and to refine early-stage prediction models.</p><p>Additionally, our focus on mouse-tracing data collected through a website does not fully capture all aspects of PD symptoms. Importantly, the study did not account for medication usage, specifically distinguishing the &#x201C;on&#x201D; phase versus the &#x201C;off&#x201D; phase, which can significantly influence the presence and severity of symptoms such as tremors [<xref ref-type="bibr" rid="ref55">55</xref>-<xref ref-type="bibr" rid="ref57">57</xref>]. Stress, which is known to exacerbate tremors, was also not accounted for, potentially affecting the results [<xref ref-type="bibr" rid="ref58">58</xref>]. All data were collected remotely using participants&#x2019; own devices, resulting in variability in devices, operating systems, and screen configurations. Participant characteristics, such as age and handedness, were not balanced across groups. These factors may introduce confounding effects, as differences in hardware, cursor behavior, or user interaction patterns could influence both engineered features and generated mouse-trace images. Furthermore, the impact of device type and handedness on the results remains unclear, as models trained on mouse-tracing data tend to reflect device type and handedness bias [<xref ref-type="bibr" rid="ref59">59</xref>]. In addition, PD often affects one side of the body more than the other, and it is not certain that participants&#x2019; dominant hands were the ones most affected by the disease. Future work should include controlled data collection using standardized hardware and display settings to calibrate model performance and validate findings under more reproducible conditions.</p></sec><sec id="s4-5"><title>Conclusions</title><p>In this early-stage pilot feasibility study, we provide exploratory and hypothesis-generating evidence that models trained using weaker labels of &#x201C;suspected PD&#x201D; from a community-recruited sample can capture motor patterns that generalize to predicting diagnosed PD. However, due to the use of self-reported and heterogeneous labels, particularly within the suspected PD group, these results should not be interpreted as evidence of clinical screening utility and should serve as a basis for future extramurally funded work conducted using clinically confirmed cohorts in conjunction with lower-resourced community samples.</p></sec></sec></body><back><ack><p>The authors are grateful to the participants in this study. Only the language and grammar of this manuscript were revised using artificial intelligence tools such as ChatGPT and Grammarly. However, the authors thoroughly refined the language following the stylistic revision suggestions provided by these tools.</p></ack><notes><sec><title>Funding</title><p>This research was, in part, funded by the National Institutes of Health (NIH) agreement number 1OT2OD032581-01. The views and conclusions contained in this document are those of the authors and should not be interpreted as representing the official policies, either expressed or implied, of the NIH.</p></sec><sec><title>Data Availability</title><p>We plan to release this dataset publicly through a separate dataset descriptor paper. Prior to publication of our dataset paper, which is currently under review, readers may contact the first author upon reasonable requests for dataset or code access and cite this publication when using the data.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: MRSZ, LS, ZNT, SP, PW</p><p>Data curation: MRSZ, ZNT, LS, SP</p><p>Formal analysis: MRSZ</p><p>Funding acquisition: PW</p><p>Supervision: PW</p><p>Visualization: MRSZ</p><p>Web development: MRSZ, SP, LS</p><p>Writing &#x2013; original draft: MRSZ</p><p>Writing &#x2013; review and editing: PW</p><p>All authors had full access to the data used in the study and had final responsibility for the decision to submit for publication.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CNN</term><def><p>convolutional neural network</p></def></def-item><def-item><term id="abb2">DenseNet-201</term><def><p>Densely Connected Convolutional Network-201</p></def></def-item><def-item><term id="abb3">FN</term><def><p>false negative</p></def></def-item><def-item><term id="abb4">FP</term><def><p>false positive</p></def></def-item><def-item><term id="abb5">GradSHAP</term><def><p>Gradient Shapley Additive Explanations</p></def></def-item><def-item><term id="abb6">MobileNet V2</term><def><p>Mobile Network v2</p></def></def-item><def-item><term id="abb7">PD</term><def><p>Parkinson disease</p></def></def-item><def-item><term id="abb8">ResNet-50</term><def><p>Residual Network-50</p></def></def-item><def-item><term id="abb9">SHAP</term><def><p>Shapley Additive Explanations</p></def></def-item><def-item><term id="abb10">SwinT</term><def><p>Shifted Window Transformer</p></def></def-item><def-item><term id="abb11">TN</term><def><p>true negative</p></def></def-item><def-item><term id="abb12">TP</term><def><p>true positive</p></def></def-item><def-item><term id="abb13">ViT</term><def><p>Vision Transformer</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Burke</surname><given-names>RE</given-names> </name></person-group><article-title>Evaluation of the Braak staging scheme for Parkinson&#x2019;s disease: introduction to a panel presentation</article-title><source>Mov Disord</source><year>2010</year><volume>25 Suppl 1</volume><issue>S1</issue><fpage>S76</fpage><lpage>S77</lpage><pub-id pub-id-type="doi">10.1002/mds.22783</pub-id><pub-id pub-id-type="medline">20187252</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Olanow</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Stern</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Sethi</surname><given-names>K</given-names> </name></person-group><article-title>The scientific and clinical basis for the treatment of Parkinson disease (2009)</article-title><source>Neurology</source><year>2009</year><month>05</month><day>26</day><volume>72</volume><issue>21 Suppl 4</issue><fpage>S1</fpage><lpage>136</lpage><pub-id pub-id-type="doi">10.1212/WNL.0b013e3181a1d44c</pub-id><pub-id pub-id-type="medline">19470958</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="web"><article-title>What is Parkinson&#x2019;s?</article-title><source>Parkinson&#x2019;s foundation</source><year>2024</year><access-date>2024-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.parkinson.org/understanding-parkinsons/what-is-parkinsons">https://www.parkinson.org/understanding-parkinsons/what-is-parkinsons</ext-link></comment></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="web"><article-title>Statistics</article-title><source>Parkinson&#x2019;s Foundation</source><access-date>2024-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.parkinson.org/understanding-parkinsons/statistics">https://www.parkinson.org/understanding-parkinsons/statistics</ext-link></comment></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pangman</surname><given-names>VC</given-names> </name><name name-style="western"><surname>Sloan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Guse</surname><given-names>L</given-names> </name></person-group><article-title>An examination of psychometric properties of the Mini-Mental State Examination and the standardized Mini-Mental State Examination: implications for clinical practice</article-title><source>Appl Nurs Res</source><year>2000</year><month>11</month><volume>13</volume><issue>4</issue><fpage>209</fpage><lpage>213</lpage><pub-id pub-id-type="doi">10.1053/apnr.2000.9231</pub-id><pub-id pub-id-type="medline">11078787</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hamzehei</surname><given-names>S</given-names> </name><name name-style="western"><surname>Akbarzadeh</surname><given-names>O</given-names> </name><name name-style="western"><surname>Attar</surname><given-names>H</given-names> </name><name name-style="western"><surname>Rezaee</surname><given-names>K</given-names> </name><name name-style="western"><surname>Fasihihour</surname><given-names>N</given-names> </name><name name-style="western"><surname>Khosravi</surname><given-names>MR</given-names> </name></person-group><article-title>Predicting the total Unified Parkinson&#x2019;s Disease Rating Scale (UPDRS) based on ML techniques and cloud-based update</article-title><source>J Cloud Comp</source><year>2023</year><month>01</month><day>21</day><volume>12</volume><issue>1</issue><fpage>12</fpage><pub-id pub-id-type="doi">10.1186/s13677-022-00388-1</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Myrberg</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hyd&#x00E9;n</surname><given-names>LC</given-names> </name><name name-style="western"><surname>Samuelsson</surname><given-names>C</given-names> </name></person-group><article-title>The Mini-Mental State Examination (MMSE) from a language perspective: an analysis of test interaction</article-title><source>Clin Linguist Phon</source><year>2020</year><month>07</month><day>2</day><volume>34</volume><issue>7</issue><fpage>652</fpage><lpage>670</lpage><pub-id pub-id-type="doi">10.1080/02699206.2019.1687757</pub-id><pub-id pub-id-type="medline">31739693</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nair</surname><given-names>P</given-names> </name><name name-style="western"><surname>Trisno</surname><given-names>R</given-names> </name><name name-style="western"><surname>Baghini</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Pendharkar</surname><given-names>G</given-names> </name><name name-style="western"><surname>Chung</surname><given-names>H</given-names> </name></person-group><article-title>Predicting early stage drug induced parkinsonism using unsupervised and supervised machine learning</article-title><source>Annu Int Conf IEEE Eng Med Biol Soc</source><year>2020</year><month>07</month><volume>2020</volume><fpage>776</fpage><lpage>779</lpage><pub-id pub-id-type="doi">10.1109/EMBC44109.2020.9175343</pub-id><pub-id pub-id-type="medline">33018101</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="web"><article-title>How Parkinson&#x2019;s disease is diagnosed</article-title><source>American Parkinson Disease Association</source><access-date>2026-05-23</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.apdaparkinson.org/what-is-parkinsons/diagnosing/">https://www.apdaparkinson.org/what-is-parkinsons/diagnosing/</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="web"><article-title>Diagnosing Parkinson&#x2019;s</article-title><source>Parkinson&#x2019;s Europe</source><access-date>2024-09-21</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.parkinsonseurope.org/about-parkinsons/diagnosis/how-is-parkinsons-diagnosed/">https://www.parkinsonseurope.org/about-parkinsons/diagnosis/how-is-parkinsons-diagnosed/</ext-link></comment></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Brooker</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Gonzalez-Latapi</surname><given-names>P</given-names> </name></person-group><article-title>Biomarkers in Parkinson&#x2019;s disease</article-title><source>Neurol Clin</source><year>2025</year><month>05</month><volume>43</volume><issue>2</issue><fpage>229</fpage><lpage>248</lpage><pub-id pub-id-type="doi">10.1016/j.ncl.2024.12.005</pub-id><pub-id pub-id-type="medline">40185520</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rovini</surname><given-names>E</given-names> </name><name name-style="western"><surname>Maremmani</surname><given-names>C</given-names> </name><name name-style="western"><surname>Cavallo</surname><given-names>F</given-names> </name></person-group><article-title>How wearable sensors can support Parkinson's disease diagnosis and treatment: a systematic review</article-title><source>Front Neurosci</source><year>2017</year><volume>11</volume><fpage>555</fpage><pub-id pub-id-type="doi">10.3389/fnins.2017.00555</pub-id><pub-id pub-id-type="medline">29056899</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Arroyo-Gallego</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ledesma-Carbayo</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Butterworth</surname><given-names>I</given-names> </name><etal/></person-group><article-title>Detecting motor impairment in early Parkinson&#x2019;s disease via natural typing interaction with keyboards: validation of the neuroQWERTY approach in an uncontrolled at-home setting</article-title><source>J Med Internet Res</source><year>2018</year><month>03</month><day>26</day><volume>20</volume><issue>3</issue><fpage>e89</fpage><pub-id pub-id-type="doi">10.2196/jmir.9462</pub-id><pub-id pub-id-type="medline">29581092</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Demir</surname><given-names>B</given-names> </name><name name-style="western"><surname>Ulukaya</surname><given-names>S</given-names> </name><name name-style="western"><surname>Erdem</surname><given-names>O</given-names> </name></person-group><article-title>Detection of Parkinson&#x2019;s disease with keystroke data</article-title><source>Comput Methods Biomech Biomed Eng</source><year>2023</year><month>10</month><volume>26</volume><issue>13</issue><fpage>1653</fpage><lpage>1667</lpage><pub-id pub-id-type="doi">10.1080/10255842.2023.2245516</pub-id><pub-id pub-id-type="medline">37599616</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tsanas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Little</surname><given-names>MA</given-names> </name><name name-style="western"><surname>McSharry</surname><given-names>PE</given-names> </name><name name-style="western"><surname>Ramig</surname><given-names>LO</given-names> </name></person-group><article-title>Accurate telemonitoring of Parkinson&#x2019;s disease progression by noninvasive speech tests</article-title><source>IEEE Trans Biomed Eng</source><year>2010</year><month>04</month><volume>57</volume><issue>4</issue><fpage>884</fpage><lpage>893</lpage><pub-id pub-id-type="doi">10.1109/TBME.2009.2036000</pub-id><pub-id pub-id-type="medline">19932995</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Del Din</surname><given-names>S</given-names> </name><name name-style="western"><surname>Elshehabi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Galna</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Gait analysis with wearables predicts conversion to Parkinson disease</article-title><source>Ann Neurol</source><year>2019</year><month>09</month><volume>86</volume><issue>3</issue><fpage>357</fpage><lpage>367</lpage><pub-id pub-id-type="doi">10.1002/ana.25548</pub-id><pub-id pub-id-type="medline">31294853</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Klucken</surname><given-names>J</given-names> </name><name name-style="western"><surname>Barth</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kugler</surname><given-names>P</given-names> </name><etal/></person-group><article-title>Unbiased and mobile gait analysis detects motor impairment in Parkinson&#x2019;s disease</article-title><source>PLoS ONE</source><year>2013</year><volume>8</volume><issue>2</issue><fpage>e56956</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0056956</pub-id><pub-id pub-id-type="medline">23431395</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cancela</surname><given-names>J</given-names> </name><name name-style="western"><surname>Pastorino</surname><given-names>M</given-names> </name><name name-style="western"><surname>Tzallas</surname><given-names>AT</given-names> </name><etal/></person-group><article-title>Wearability assessment of a wearable system for Parkinson&#x2019;s disease remote monitoring based on a body area network of sensors</article-title><source>Sensors (Basel)</source><year>2014</year><month>09</month><day>16</day><volume>14</volume><issue>9</issue><fpage>17235</fpage><lpage>17255</lpage><pub-id pub-id-type="doi">10.3390/s140917235</pub-id><pub-id pub-id-type="medline">25230307</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Patel</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lorincz</surname><given-names>K</given-names> </name><name name-style="western"><surname>Hughes</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Monitoring motor fluctuations in patients with Parkinson&#x2019;s disease using wearable sensors</article-title><source>IEEE Trans Inf Technol Biomed</source><year>2009</year><month>11</month><volume>13</volume><issue>6</issue><fpage>864</fpage><lpage>873</lpage><pub-id pub-id-type="doi">10.1109/TITB.2009.2033471</pub-id><pub-id pub-id-type="medline">19846382</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Giancardo</surname><given-names>L</given-names> </name><name name-style="western"><surname>S&#x00E1;nchez-Ferro</surname><given-names>A</given-names> </name><name name-style="western"><surname>Arroyo-Gallego</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Computer keyboard interaction as an indicator of early Parkinson&#x2019;s disease</article-title><source>Sci Rep</source><year>2016</year><month>10</month><day>5</day><volume>6</volume><issue>1</issue><fpage>34468</fpage><pub-id pub-id-type="doi">10.1038/srep34468</pub-id><pub-id pub-id-type="medline">27703257</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wylie</surname><given-names>SA</given-names> </name><name name-style="western"><surname>van den Wildenberg</surname><given-names>WPM</given-names> </name><name name-style="western"><surname>Ridderinkhof</surname><given-names>KR</given-names> </name><etal/></person-group><article-title>The effect of Parkinson&#x2019;s disease on interference control during action selection</article-title><source>Neuropsychologia</source><year>2009</year><month>01</month><volume>47</volume><issue>1</issue><fpage>145</fpage><lpage>157</lpage><pub-id pub-id-type="doi">10.1016/j.neuropsychologia.2008.08.001</pub-id><pub-id pub-id-type="medline">18761363</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Goni</surname><given-names>M</given-names> </name><name name-style="western"><surname>Eickhoff</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Far</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Patil</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Dukart</surname><given-names>J</given-names> </name></person-group><article-title>Smartphone-based digital biomarkers for Parkinson's disease in a remotely-administered setting</article-title><source>IEEE Access</source><year>2022</year><month>03</month><day>3</day><volume>10</volume><fpage>28361</fpage><lpage>28384</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2022.3156659</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Skaramagkas</surname><given-names>V</given-names> </name><name name-style="western"><surname>Andrikopoulos</surname><given-names>G</given-names> </name><name name-style="western"><surname>Kefalopoulou</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Polychronopoulos</surname><given-names>P</given-names> </name></person-group><article-title>A study on the essential and Parkinson's arm tremor classification</article-title><source>Signals</source><year>2021</year><volume>2</volume><issue>2</issue><fpage>201</fpage><lpage>224</lpage><pub-id pub-id-type="doi">10.3390/signals2020016</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schneider</surname><given-names>SA</given-names> </name><name name-style="western"><surname>Drude</surname><given-names>L</given-names> </name><name name-style="western"><surname>Kasten</surname><given-names>M</given-names> </name><name name-style="western"><surname>Klein</surname><given-names>C</given-names> </name><name name-style="western"><surname>Hagenah</surname><given-names>J</given-names> </name></person-group><article-title>A study of subtle motor signs in early Parkinson&#x2019;s disease</article-title><source>Mov Disord</source><year>2012</year><month>10</month><volume>27</volume><issue>12</issue><fpage>1563</fpage><lpage>1566</lpage><pub-id pub-id-type="doi">10.1002/mds.25161</pub-id><pub-id pub-id-type="medline">23032728</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Prince</surname><given-names>J</given-names> </name><name name-style="western"><surname>Andreotti</surname><given-names>F</given-names> </name><name name-style="western"><surname>De Vos</surname><given-names>M</given-names> </name></person-group><article-title>Multi-source ensemble learning for the remote prediction of Parkinson&#x2019;s disease in the presence of source-wise missing data</article-title><source>IEEE Trans Biomed Eng</source><year>2019</year><month>05</month><volume>66</volume><issue>5</issue><fpage>1402</fpage><lpage>1411</lpage><pub-id pub-id-type="doi">10.1109/TBME.2018.2873252</pub-id><pub-id pub-id-type="medline">30403615</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lim</surname><given-names>MD</given-names> </name><name name-style="western"><surname>Connie</surname><given-names>T</given-names> </name><name name-style="western"><surname>Goh</surname><given-names>MKO</given-names> </name><name name-style="western"><surname>Saedon</surname><given-names>NI</given-names> </name></person-group><article-title>Model-based feature extraction and classification for Parkinson disease screening using gait analysis: development and validation study</article-title><source>JMIR Aging</source><year>2025</year><month>04</month><day>8</day><volume>8</volume><fpage>e65629</fpage><pub-id pub-id-type="doi">10.2196/65629</pub-id><pub-id pub-id-type="medline">40198116</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Idrisoglu</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dallora</surname><given-names>AL</given-names> </name><name name-style="western"><surname>Anderberg</surname><given-names>P</given-names> </name><name name-style="western"><surname>Berglund</surname><given-names>JS</given-names> </name></person-group><article-title>Applied machine learning techniques to diagnose voice-affecting conditions and disorders: systematic literature review</article-title><source>J Med Internet Res</source><year>2023</year><month>07</month><day>19</day><volume>25</volume><fpage>e46105</fpage><pub-id pub-id-type="doi">10.2196/46105</pub-id><pub-id pub-id-type="medline">37467031</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vasquez-Correa</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Arias-Vergara</surname><given-names>T</given-names> </name><name name-style="western"><surname>Orozco-Arroyave</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Eskofier</surname><given-names>B</given-names> </name><name name-style="western"><surname>Klucken</surname><given-names>J</given-names> </name><name name-style="western"><surname>Noth</surname><given-names>E</given-names> </name></person-group><article-title>Multimodal assessment of Parkinson's disease: a deep learning approach</article-title><source>IEEE J Biomed Health Inform</source><year>2019</year><month>07</month><volume>23</volume><issue>4</issue><fpage>1618</fpage><lpage>1630</lpage><pub-id pub-id-type="doi">10.1109/JBHI.2018.2866873</pub-id><pub-id pub-id-type="medline">30137018</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kandori</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yokoe</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sakoda</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Quantitative magnetic detection of finger movements in patients with Parkinson&#x2019;s disease</article-title><source>Neurosci Res</source><year>2004</year><month>06</month><volume>49</volume><issue>2</issue><fpage>253</fpage><lpage>260</lpage><pub-id pub-id-type="doi">10.1016/j.neures.2004.03.004</pub-id><pub-id pub-id-type="medline">15140567</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bhattacharjee</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bandyopadhyay</surname><given-names>D</given-names> </name></person-group><article-title>Flexible paper touchpad for Parkinson's hand tremor detection</article-title><source>Sens Actuators A Phys</source><year>2019</year><month>08</month><volume>294</volume><fpage>164</fpage><lpage>172</lpage><pub-id pub-id-type="doi">10.1016/j.sna.2019.05.006</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lipsmeier</surname><given-names>F</given-names> </name><name name-style="western"><surname>Taylor</surname><given-names>KI</given-names> </name><name name-style="western"><surname>Kilchenmann</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Evaluation of smartphone-based testing to generate exploratory outcome measures in a phase 1 Parkinson&#x2019;s disease clinical trial</article-title><source>Mov Disord</source><year>2018</year><month>08</month><volume>33</volume><issue>8</issue><fpage>1287</fpage><lpage>1297</lpage><pub-id pub-id-type="doi">10.1002/mds.27376</pub-id><pub-id pub-id-type="medline">29701258</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Guizani</surname><given-names>M</given-names> </name></person-group><article-title>Deep multi-layer perceptron classifier for behavior analysis to estimate Parkinson's disease severity using smartphones</article-title><source>IEEE Access</source><year>2018</year><month>07</month><day>6</day><volume>6</volume><fpage>36825</fpage><lpage>36833</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2018.2851382</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lakshminarayana</surname><given-names>R</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Burn</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Using a smartphone-based self-management platform to support medication adherence and clinical consultation in Parkinson&#x2019;s disease</article-title><source>NPJ Parkinsons Dis</source><year>2017</year><volume>3</volume><fpage>2</fpage><pub-id pub-id-type="doi">10.1038/s41531-016-0003-z</pub-id><pub-id pub-id-type="medline">28649602</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Park</surname><given-names>KW</given-names> </name><name name-style="western"><surname>McKeown</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>ZJ</given-names> </name></person-group><article-title>Clinically informed automated assessment of finger tapping videos in Parkinson's disease</article-title><source>Sensors (Basel)</source><year>2023</year><month>11</month><day>13</day><volume>23</volume><issue>22</issue><fpage>9149</fpage><pub-id pub-id-type="doi">10.3390/s23229149</pub-id><pub-id pub-id-type="medline">38005535</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Pappas</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Boughanem</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Baudendistel</surname><given-names>ST</given-names> </name><etal/></person-group><article-title>Video-based clinical gait analysis in Parkinson&#x2019;s disease: a novel approach using frontal plane videos and machine learning</article-title><conf-name>2024 46th Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)</conf-name><conf-date>Jul 15-19, 2024</conf-date><pub-id pub-id-type="doi">10.1109/EMBC53108.2024.10781504</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jin</surname><given-names>B</given-names> </name><name name-style="western"><surname>Qu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>L</given-names> </name><name name-style="western"><surname>Gao</surname><given-names>Z</given-names> </name></person-group><article-title>Diagnosing Parkinson disease through facial expression recognition: video analysis</article-title><source>J Med Internet Res</source><year>2020</year><month>07</month><day>10</day><volume>22</volume><issue>7</issue><fpage>e18697</fpage><pub-id pub-id-type="doi">10.2196/18697</pub-id><pub-id pub-id-type="medline">32673247</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Qi</surname><given-names>W</given-names> </name><name name-style="western"><surname>Shen</surname><given-names>S</given-names> </name><name name-style="western"><surname>Dong</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Digital biomarkers for Parkinson disease: bibliometric analysis and a scoping review of deep learning for freezing of gait</article-title><source>J Med Internet Res</source><year>2025</year><month>05</month><day>20</day><volume>27</volume><fpage>e71560</fpage><pub-id pub-id-type="doi">10.2196/71560</pub-id><pub-id pub-id-type="medline">40392578</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Deng</surname><given-names>D</given-names> </name><name name-style="western"><surname>Ostrem</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Interpretable video-based tracking and quantification of parkinsonism clinical motor states</article-title><source>NPJ Parkinsons Dis</source><year>2024</year><month>06</month><day>25</day><volume>10</volume><issue>1</issue><fpage>122</fpage><pub-id pub-id-type="doi">10.1038/s41531-024-00742-x</pub-id><pub-id pub-id-type="medline">38918385</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Li</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zhu</surname><given-names>W</given-names> </name><name name-style="western"><surname>Dorsey</surname><given-names>ER</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>J</given-names> </name></person-group><article-title>Predicting parkinson&#x2019;s disease with multimodal irregularly collected longitudinal smartphone data</article-title><conf-name>2020 IEEE International Conference on Data Mining (ICDM)</conf-name><conf-date>Nov 17-20, 2020</conf-date><pub-id pub-id-type="doi">10.1109/ICDM50108.2020.00133</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="web"><source>Parkinson&#x2019;s Study</source><access-date>2025-07-17</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://parkinsonsurvey.github.io/">https://parkinsonsurvey.github.io/</ext-link></comment></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gaenslen</surname><given-names>A</given-names> </name><name name-style="western"><surname>Swid</surname><given-names>I</given-names> </name><name name-style="western"><surname>Liepelt-Scarfone</surname><given-names>I</given-names> </name><name name-style="western"><surname>Godau</surname><given-names>J</given-names> </name><name name-style="western"><surname>Berg</surname><given-names>D</given-names> </name></person-group><article-title>The patients&#x2019; perception of prodromal symptoms before the initial diagnosis of Parkinson&#x2019;s disease</article-title><source>Mov Disord</source><year>2011</year><month>03</month><volume>26</volume><issue>4</issue><fpage>653</fpage><lpage>658</lpage><pub-id pub-id-type="doi">10.1002/mds.23499</pub-id><pub-id pub-id-type="medline">21370256</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>de Lau</surname><given-names>LML</given-names> </name><name name-style="western"><surname>Koudstaal</surname><given-names>PJ</given-names> </name><name name-style="western"><surname>Hofman</surname><given-names>A</given-names> </name><name name-style="western"><surname>Breteler</surname><given-names>MMB</given-names> </name></person-group><article-title>Subjective complaints precede Parkinson disease: the Rotterdam study</article-title><source>Arch Neurol</source><year>2006</year><month>03</month><volume>63</volume><issue>3</issue><fpage>362</fpage><lpage>365</lpage><pub-id pub-id-type="doi">10.1001/archneur.63.3.noc50312</pub-id><pub-id pub-id-type="medline">16401729</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Valasaki</surname><given-names>M</given-names> </name></person-group><article-title>Constructing the detecting stage: social processes and the diagnostic journey of early onset Parkinson&#x2019;s disease</article-title><source>Sociol Health Illn</source><year>2023</year><month>05</month><volume>45</volume><issue>4</issue><fpage>872</fpage><lpage>889</lpage><pub-id pub-id-type="doi">10.1111/1467-9566.13622</pub-id><pub-id pub-id-type="medline">36762824</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zaman</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Ghahari</surname><given-names>S</given-names> </name><name name-style="western"><surname>McColl</surname><given-names>MA</given-names> </name></person-group><article-title>Barriers to accessing healthcare services for people with Parkinson's disease: a scoping review</article-title><source>J Parkinsons Dis</source><year>2021</year><volume>11</volume><issue>4</issue><fpage>1537</fpage><lpage>1553</lpage><pub-id pub-id-type="doi">10.3233/JPD-212735</pub-id><pub-id pub-id-type="medline">34308913</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fothergill-Misbah</surname><given-names>N</given-names> </name><name name-style="western"><surname>Walker</surname><given-names>R</given-names> </name><name name-style="western"><surname>Kwasa</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hooker</surname><given-names>J</given-names> </name><name name-style="western"><surname>Hampshire</surname><given-names>K</given-names> </name></person-group><article-title>&#x201C;Old people problems&#x201D;, uncertainty and legitimacy: challenges with diagnosing Parkinson&#x2019;s disease in Kenya</article-title><source>Soc Sci Med</source><year>2021</year><month>08</month><volume>282</volume><fpage>114148</fpage><pub-id pub-id-type="doi">10.1016/j.socscimed.2021.114148</pub-id><pub-id pub-id-type="medline">34153822</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Akiba</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sano</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yanase</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ohta</surname><given-names>T</given-names> </name><name name-style="western"><surname>Koyama</surname><given-names>M</given-names> </name></person-group><article-title>Optuna: a next-generation hyperparameter optimization framework</article-title><source>KDD &#x2019;19: Proceedings of the 25th ACM SIGKDD International Conference on Knowledge Discovery &#x0026; Data Mining</source><year>2019</year><month>07</month><fpage>2623</fpage><lpage>2631</lpage><pub-id pub-id-type="doi">10.1145/3292500.3330701</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><conf-name>31st International Conference on Neural Information Processing Systems</conf-name><conf-date>Dec 4-9, 2017</conf-date><pub-id pub-id-type="doi">10.5555/3295222.3295230</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gil-Mart&#x00ED;n</surname><given-names>M</given-names> </name><name name-style="western"><surname>Montero</surname><given-names>JM</given-names> </name><name name-style="western"><surname>San-Segundo</surname><given-names>R</given-names> </name></person-group><article-title>Parkinson&#x2019;s disease detection from drawing movements using convolutional neural networks</article-title><source>Electronics (Basel)</source><year>2019</year><month>08</month><day>17</day><volume>8</volume><issue>8</issue><fpage>907</fpage><pub-id pub-id-type="doi">10.3390/electronics8080907</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Pereira</surname><given-names>CR</given-names> </name><name name-style="western"><surname>Weber</surname><given-names>SAT</given-names> </name><name name-style="western"><surname>Hook</surname><given-names>C</given-names> </name><name name-style="western"><surname>Rosa</surname><given-names>GH</given-names> </name><name name-style="western"><surname>Papa</surname><given-names>JP</given-names> </name></person-group><article-title>Deep learning-aided Parkinson&#x2019;s disease diagnosis from handwritten dynamics</article-title><conf-name>2016 29th SIBGRAPI Conference on Graphics, Patterns and Images (SIBGRAPI)</conf-name><conf-date>Oct 4-7, 2016</conf-date><pub-id pub-id-type="doi">10.1109/SIBGRAPI.2016.054</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Goel</surname><given-names>N</given-names> </name><name name-style="western"><surname>Khanna</surname><given-names>A</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>N</given-names> </name></person-group><article-title>Detection of Parkinson&#x2019;s disease using machine learning techniques for voice and handwriting features</article-title><conf-name>International Conference on Innovative Computing and Communications</conf-name><conf-date>Mar 21-22, 2019</conf-date><pub-id pub-id-type="doi">10.1007/978-981-15-1286-5_56</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Memedi</surname><given-names>M</given-names> </name><name name-style="western"><surname>Sadikov</surname><given-names>A</given-names> </name><name name-style="western"><surname>Groznik</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Automatic spiral analysis for objective assessment of motor symptoms in Parkinson's disease</article-title><source>Sensors (Basel)</source><year>2015</year><month>09</month><day>17</day><volume>15</volume><issue>9</issue><fpage>23727</fpage><lpage>23744</lpage><pub-id pub-id-type="doi">10.3390/s150923727</pub-id><pub-id pub-id-type="medline">26393595</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Huang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Chatzakou</surname><given-names>M</given-names> </name><etal/></person-group><article-title>LSTM-CNN: an efficient diagnostic network for Parkinson&#x2019;s disease utilizing dynamic handwriting analysis</article-title><source>Comput Methods Programs Biomed</source><year>2024</year><month>04</month><volume>247</volume><fpage>108066</fpage><pub-id pub-id-type="doi">10.1016/j.cmpb.2024.108066</pub-id><pub-id pub-id-type="medline">38364361</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gajos</surname><given-names>KZ</given-names> </name><name name-style="western"><surname>Reinecke</surname><given-names>K</given-names> </name><name name-style="western"><surname>Donovan</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Computer mouse use captures ataxia and parkinsonism, enabling accurate measurement and detection</article-title><source>Mov Disord</source><year>2020</year><month>02</month><volume>35</volume><issue>2</issue><fpage>354</fpage><lpage>358</lpage><pub-id pub-id-type="doi">10.1002/mds.27915</pub-id><pub-id pub-id-type="medline">31769069</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Parab</surname><given-names>S</given-names> </name><name name-style="western"><surname>Boster</surname><given-names>J</given-names> </name><name name-style="western"><surname>Washington</surname><given-names>P</given-names> </name></person-group><article-title>Parkinson disease recognition using a gamified website: machine learning development and usability study</article-title><source>JMIR Form Res</source><year>2023</year><month>09</month><day>29</day><volume>7</volume><fpage>e49898</fpage><pub-id pub-id-type="doi">10.2196/49898</pub-id><pub-id pub-id-type="medline">37773607</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sieberts</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Schaff</surname><given-names>J</given-names> </name><name name-style="western"><surname>Duda</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Crowdsourcing digital health measures to predict Parkinson&#x2019;s disease severity: the Parkinson&#x2019;s disease digital biomarker DREAM Challenge</article-title><source>NPJ Digit Med</source><year>2021</year><month>03</month><day>19</day><volume>4</volume><issue>1</issue><fpage>53</fpage><pub-id pub-id-type="doi">10.1038/s41746-021-00414-7</pub-id><pub-id pub-id-type="medline">33742069</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Severson</surname><given-names>KA</given-names> </name><name name-style="western"><surname>Chahine</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Smolensky</surname><given-names>LA</given-names> </name><etal/></person-group><article-title>Discovery of Parkinson&#x2019;s disease states and disease progression modelling: a longitudinal data study using machine learning</article-title><source>Lancet Digit Health</source><year>2021</year><month>09</month><volume>3</volume><issue>9</issue><fpage>e555</fpage><lpage>e564</lpage><pub-id pub-id-type="doi">10.1016/S2589-7500(21)00101-1</pub-id><pub-id pub-id-type="medline">34334334</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roussos</surname><given-names>G</given-names> </name><name name-style="western"><surname>Herrero</surname><given-names>TR</given-names> </name><name name-style="western"><surname>Hill</surname><given-names>DL</given-names> </name><etal/></person-group><article-title>Identifying and characterising sources of variability in digital outcome measures in Parkinson&#x2019;s disease</article-title><source>NPJ Digit Med</source><year>2022</year><month>07</month><day>15</day><volume>5</volume><issue>1</issue><fpage>93</fpage><pub-id pub-id-type="doi">10.1038/s41746-022-00643-4</pub-id><pub-id pub-id-type="medline">35840653</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rochester</surname><given-names>L</given-names> </name><name name-style="western"><surname>Hetherington</surname><given-names>V</given-names> </name><name name-style="western"><surname>Jones</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Attending to the task: interference effects of functional tasks on walking in Parkinson&#x2019;s disease and the roles of cognition, depression, fatigue, and balance</article-title><source>Arch Phys Med Rehabil</source><year>2004</year><month>10</month><volume>85</volume><issue>10</issue><fpage>1578</fpage><lpage>1585</lpage><pub-id pub-id-type="doi">10.1016/j.apmr.2004.01.025</pub-id><pub-id pub-id-type="medline">15468014</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tumpa</surname><given-names>ZN</given-names> </name><name name-style="western"><surname>Zawad</surname><given-names>MRS</given-names> </name><name name-style="western"><surname>Sollis</surname><given-names>L</given-names> </name><name name-style="western"><surname>Parab</surname><given-names>S</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>IY</given-names> </name><name name-style="western"><surname>Washington</surname><given-names>P</given-names> </name></person-group><article-title>Quantifying device type and handedness biases in a remote Parkinson&#x2019;s disease AI-powered assessment</article-title><source>NPJ Digit Med</source><year>2025</year><month>08</month><day>27</day><volume>8</volume><issue>1</issue><fpage>550</fpage><pub-id pub-id-type="doi">10.1038/s41746-025-01934-2</pub-id><pub-id pub-id-type="medline">40866555</pub-id></nlm-citation></ref></ref-list></back></article>