<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e64082</article-id><article-id pub-id-type="doi">10.2196/64082</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Acceptability of Active and Passive Data Collection Methods for Mobile Health Research: Cross-Sectional Survey of an Online Adult Sample in the United States</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Roque</surname><given-names>Nelson</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Felt</surname><given-names>John</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Center for Healthy Aging, The Pennsylvania State University</institution><addr-line>422 Biobehavioral Health Building</addr-line><addr-line>University Park</addr-line><addr-line>PA</addr-line><country>United States</country></aff><aff id="aff2"><institution>Department of Psychology, University of Central Florida</institution><addr-line>Orlando</addr-line><addr-line>FL</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Wu</surname><given-names>Chaoyi</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zandesh</surname><given-names>Zahra</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Nelson Roque, PhD, Center for Healthy Aging, The Pennsylvania State University, 422 Biobehavioral Health Building, University Park, PA, 16801, United States, 1 814-863-7502; <email>nur375@psu.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>12</day><month>9</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e64082</elocation-id><history><date date-type="received"><day>09</day><month>07</month><year>2024</year></date><date date-type="rev-recd"><day>30</day><month>05</month><year>2025</year></date><date date-type="accepted"><day>02</day><month>06</month><year>2025</year></date></history><copyright-statement>&#x00A9; Nelson Roque, John Felt. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 12.9.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e64082"/><abstract><sec><title>Background</title><p>Digital health technologies, including wearable devices and app-based cognitive and health assessments, are pervasive and crucial to better understanding important public health problems (eg, Alzheimer&#x2019;s disease and related dementias). Central to understanding mechanisms driving individuals&#x2019; willingness to share various data streams are concerns regarding data privacy, security, and control over generated data.</p></sec><sec><title>Objective</title><p>This survey was designed to learn more about attitudes and opinions related to digital health technologies and the sharing of associated data.</p></sec><sec sec-type="methods"><title>Methods</title><p>A total of 1509 adults were recruited from Prolific to complete an online survey via Qualtrics. Of these, 1489 participants provided valid data for analyses. Participants completed a structured survey consisting of multiple modules after informed consent was provided. These included: (1) demographic characteristics; (2) prior research experience; (3) mobility factors (eg, use of mobility aids, driving frequency); (4) technology ownership (eg, smartphones, tablets, home Wi-Fi); (5) social media use (eg, frequency of engagement with platforms such as Facebook, Instagram, and TikTok); (6) willingness to contribute different types of data across categories, including activities, sensors, and metadata; (7) opinions about data control and privacy options (eg, data deletion, stream-specific control); and (8) willingness to interact with assistive technologies such as robots, for Instrumental Activities of Daily Living.</p></sec><sec sec-type="results"><title>Results</title><p>The final cohort (N=1489) had a mean age of 35.5 years (SD 12.0), was 44% female (n=652), and predominantly identified as White (76%, n=1134), with high rates of smartphone ownership (99%, n=1479) and home Wi-Fi access (98%, n=1464). Participants were most willing to share data streams with clear health implications and least willing to share data streams with greater privacy or reidentification potential (eg, GPS location, in-vehicle dashcam footage). On average, people were willing to complete ambulatory cognitive assessments for 56.7 (SD 36.2) days, air quality monitoring for 58.1 (SD 37.7) days, and GPS location monitoring for 37 (SD 39.0) days. People expected control over their data, including the ability to delete all or specific streams of the data contributed for research. Most participants prioritized control over their data, with 71% (n=1061) favoring the ability to delete all data contributed for research purposes. Stream-specific data deletion (65%, n=960) and time-specific deletion (44%, n=653) were also valued; interest in sharing data with insurance providers (30%, n=453) or caregivers (26%, n=384) was notably lower.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Findings have implications for the design of digital health technologies and education-related to the use and implications of collected data.</p></sec></abstract><kwd-group><kwd>mHealth</kwd><kwd>privacy</kwd><kwd>smartphones</kwd><kwd>sensors</kwd><kwd>acceptability</kwd><kwd>mobile health</kwd><kwd>attitudes</kwd><kwd>opinions</kwd><kwd>digital health technologies</kwd><kwd>online survey</kwd><kwd>surveys</kwd><kwd>data privacy</kwd><kwd>questionnaires</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>Digital health technologies, including app-based cognitive and psychosocial assessments and wearable sensor-based health monitoring devices, are pervasive and crucial for better understanding and predicting trajectories related to important public health outcomes such as Alzheimer&#x2019;s disease and related dementias. The availability of detailed sensor data streams and data available via application programming interfaces creates new opportunities for scientific discovery, especially considering that passively collected data may be more robust for measuring aspects of daily life that can be influenced by observation, memory interference, or retrospective biases. The increase in easily shareable metadata (eg, Google Takeout) also creates a new fruitful avenue for research, however the extent public awareness and willingness to share these data and from other data streams remains unclear. Past studies have shown that in general, the overall acceptance for various smartphone-based tasks and sensing modalities is low, with variations in type of activity and sensor [<xref ref-type="bibr" rid="ref1">1</xref>, <xref ref-type="bibr" rid="ref2">2</xref>]. However, repeated prompting for specific data streams has been shown to increase willingness to share [<xref ref-type="bibr" rid="ref3">3</xref>]. In general, participants are interested in learning from their own data, and a proportion of these are also interested in sharing their information with a health care provider [<xref ref-type="bibr" rid="ref4">4</xref>].</p></sec><sec id="s1-2"><title>Privacy, Security, and Data Controls</title><p>Critical to understanding mechanisms driving willingness to share various data streams are concerns about data privacy, security, and control over generated data [<xref ref-type="bibr" rid="ref3">3</xref>, <xref ref-type="bibr" rid="ref5">5</xref>]Once the data are collected, different members of a research team, often across different institutions, work with deidentified versions of the datasets. In some cases, data are stored indefinitely for algorithm development&#x2014;seeking new purposes or uses for the data that were not originally considered. In other cases, advances in machine learning have made it possible to reidentify individuals with enough precision to warrant security concerns over warehousing sensitive data without appropriate deidentification procedures [<xref ref-type="bibr" rid="ref6">6</xref>]). As such, it is imperative to consider the most important stakeholder, the respondent and to assess their expectations regarding the data they generate for research and the level of controls they expect.</p></sec><sec id="s1-3"><title>Assessment: Active vs Passive?</title><p>To answer important scientific questions, researchers are interested in collecting data across the spectrum of participant involvement and burden, ranging from active data collection activities (eg, completing a survey, cognitive assessments), to passive data collection (eg, extracting sensor data streams, reading existing metadata [<xref ref-type="bibr" rid="ref7">7</xref>]; <xref ref-type="fig" rid="figure1">Figure 1</xref>). Passive data collection methods refer to data captured automatically without participant effort (eg, sensors, metadata), whereas active methods require participant involvement (eg, completing surveys or assessments). Active data collection also requires input from the respondent in a manner that makes the goal of the research more apparent. On the other hand, passive assessment does not requiring respondent burden or input, but rather, relies on data that is collected continuously in the background.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Active-passive continuum of research data streams: activities, sensors, and metadata (examples listed for each data stream category).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e64082_fig01.png"/></fig><p>In general, the mechanisms driving willingness to contribute various data, irrespective of specific study demands, sponsors, and incentives [<xref ref-type="bibr" rid="ref5">5</xref>] remain unclear. From the general patterns of attrition observed in longitudinal studies, it is apparent that a subset of participants may have a multitude of reasons for choosing to not engage in certain research activities.</p></sec><sec id="s1-4"><title>This Study</title><p>The purpose of this study is to investigate the acceptability of active and passive data collection methods in mobile health research. This survey was designed to explore attitudes and opinions related to digital health technologies and willingness to share related data. The three research questions guiding this work are:</p><list list-type="order"><list-item><p>RQ1: What types of data are people willing to contribute?</p></list-item><list-item><p>RQ2: For how long are people willing to contribute critical data streams?</p></list-item><list-item><p>RQ3: What type of data control and feedback do people expect?</p></list-item></list></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Participants</title><p>A total of 1509 adults were recruited from Prolific [<xref ref-type="bibr" rid="ref8">8</xref>]. The Prolific platform allows researchers to post a &#x2018;task&#x2019; with a short description for potential participants to review before beginning. In addition to the study background language, we the potential participants were informed: &#x201C;This survey is designed to learn more about your attitudes and opinions related to digital health technologies and related data/data-sharing.&#x201D; Two participants did not consent to participate, and 18 did not complete the survey and were dropped from the study, resulting in a total of 1489 participants with a mean age of 35.5 (SD 11.97) years.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>This work was carried out in accordance with The Code of Ethics of the World Medical Association (Declaration of Helsinki). The Institutional Review Board (IRB) at the University of Central Florida approved the study protocol described in this manuscript (IRB No: STUDY00002281). The survey was pilot tested by members of the research laboratory conducting the study, for issues of usability and technical functioning. The IRB determined this study as exempt from regulation for human subjects research. Participants were provided an opportunity to accept or refuse consent before beginning this voluntary survey. The consent form indicated the expected time commitment, compensation, and nature of study. If consent was refused, the survey would close for that participant. Participants received US $2 after completing the survey on the Prolific Research Platform. All data was deidentified; the authors are accountable for all aspects of the work (including full data access, integrity of the data and the accuracy of the data analysis) in ensuring that questions related to the accuracy or integrity of any part of the work are appropriately investigated and resolved.</p></sec><sec id="s2-3"><title>Materials and Design</title><p>Participants completed a battery of questionnaires via the Qualtrics survey platform, designed to assess sample demographic characteristics (eg, technology ownership, mobility), opinions about data control, and willingness to contribute various data for research. These modules were designed to assess various facets of attitudes and behavior relevant to longitudinal observational research, to determine heterogeneity in willingness to use devices or share data.</p></sec><sec id="s2-4"><title>Procedures</title><p>The participants completed a questionnaire via the Qualtrics survey platform, where the first page displayed the consent form and a radio button to select regarding consent. If participants consented, they were presented with modules on separate pages assessing: (1) demographic characteristics; (2) prior research experience; (3) mobility (ie, use of aids; driving frequency); (4) tech ownership (ie, own a tablet, smartphone, home Wi-Fi); (5) social media usage (ie, frequency of using Facebook, Twitter, Snapchat, Instagram, TikTok, WhatsApp); (6) willingness and extent of contributing various data (ie, across categories of activities, sensors, metadata); (7) opinions about data controls; and (8) willingness to use a robot for Instrumental Activities of Daily Living (IADLs). This survey totaled 52 questions over 12 pages presented in the same order for all participants (see <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> for full survey). Questions for demographic reporting required responses, while all other items only suggested responses. Participants were only able to navigate forward and not backward through the survey.</p></sec><sec id="s2-5"><title>Data Preparation and Analysis Plan</title><p>This study reports findings related to the willingness and extent of contributing various data and opinions about data controls. All data were processed using R software (version 4.0.2; R Foundation for Statistical Computing) [<xref ref-type="bibr" rid="ref9">9</xref>], using the <italic>tidyverse</italic> package [<xref ref-type="bibr" rid="ref10">10</xref>], including <italic>ggplot2</italic> for data visualization [<xref ref-type="bibr" rid="ref11">11</xref>] and <italic>dplyr</italic> for data wrangling [<xref ref-type="bibr" rid="ref12">12</xref>].</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Sample Characteristics</title><p>The sample was 44% female (n=652), with a mean age of 36 (SD 11.97, 20-84). A total of 99% (n=1479) of the individuals owned a mobile phone and 98% (n=1464) had access to home Wi-Fi (<xref ref-type="table" rid="table1">Table 1</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Sample characteristics from online study.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">Participants (N=1489)</td></tr></thead><tbody><tr><td align="left" valign="top">Age (years), mean (SD; range)</td><td align="left" valign="top">36.5 (12.0; 20-84)</td></tr><tr><td align="left" valign="top">Age &#x2265;50, years, n (%)</td><td align="left" valign="top">224 (15.04)</td></tr><tr><td align="left" valign="top">Past research experience, n (%)</td><td align="left" valign="top">1238 (83.14)</td></tr><tr><td align="left" valign="top" colspan="2">Sex, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="left" valign="top">811 (54.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">652 (43.7)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other</td><td align="left" valign="top">19 (1.27)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Proportion Unspecified + No Report</td><td align="left" valign="top">4 (0.2)</td></tr><tr><td align="left" valign="top" colspan="2">Race/Ethnicity, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Hispanic</td><td align="left" valign="top">116 (7.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>White</td><td align="left" valign="top">1134 (76.15)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Black</td><td align="left" valign="top">156 (10.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Asian</td><td align="left" valign="top">193 (12.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>American Indian, Alaska Native</td><td align="left" valign="top">22 (1.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Other</td><td align="left" valign="top">27 (1.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Average miles driven per week, mean (SD)</td><td align="left" valign="top">78 (181.9)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median miles driven per week, IQR</td><td align="left" valign="top">29 (5-80)</td></tr><tr><td align="left" valign="top" colspan="2">Technology ownership, n (%)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Tablet</td><td align="left" valign="top">929 (62.39)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Smartphone</td><td align="left" valign="top">1479 (99.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Activity tracker</td><td align="left" valign="top">660 (44.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Home Wi-Fi</td><td align="left" valign="top">1464 (98.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Home Assistant (eg, Alexa)</td><td align="left" valign="top">812 (54.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Awareness regarding Google Takeout</td><td align="left" valign="top">217 (14.6)</td></tr></tbody></table></table-wrap></sec><sec id="s3-2"><title>RQ1: What Data Are People Willing to Contribute?</title><sec id="s3-2-1"><title>Overview</title><p>For each category of data, the sections below report the most and least endorsed options, as summarized in <xref ref-type="fig" rid="figure2">Figure 2</xref>.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>(A) Respondents&#x2019; willingness to complete various activities in the context of research; (B) Respondents&#x2019; willingness to wear various sensors in the context of research; (C) Respondents&#x2019; willingness to share various metadata in the context of research.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e64082_fig02.png"/></fig></sec><sec id="s3-2-2"><title>Activities</title><p>Among the activities assessed that could potentially take place in the context of research, 15-minute video or phone calls were the least endorsed options. Respondents were most willing to complete daily surveys about stress, mood, and emotions, as well as daily cognitive assessments.</p></sec><sec id="s3-2-3"><title>Sensors</title><p>Of the sensors assessed that could be worn in the context of research, whole home real-time location sensors and in-cabin, driver-facing dashcams were the three least endorsed options. In contrast, the respondents were most willing to wear an activity tracker, a heart rate monitor, and air quality sensors.</p></sec><sec id="s3-2-4"><title>Metadata</title><p>Of the metadata assessed that may be requested in the context of research, a Google Search history export as well as keystroke data (from computer or mobile phone) were the least endorsed. In contrast, the respondents were most willing to share data from smartphone activity trackers as well as phone and SMS metadata (number and duration of calls).</p></sec></sec><sec id="s3-3"><title>RQ2: For How Long Are People Willing to Contribute Critical Data Streams?</title><p>Participants were asked to consider a hypothetical study in which they were asked to complete three activities (queried independently), and rate how long in days they would be willing to complete each activity, for a maximum of 100 days (see <xref ref-type="other" rid="box1">Textbox 1</xref> for full questions): (1) daily assessments of cognition; (2) wear and charge an air quality or pollution sensor; and (3) wear and charge a GPS location sensor.</p><boxed-text id="box1"><title> Questions posed to participants in regard to three data collection activities (ie, cognitive assessments, air quality sensing, GPS location sensing).</title><p>Question</p><p>Imagine a study, where you were asked to complete daily assessments of your cognition, via short "&#x201C;brain games"&#x201D; or "&#x201C;mini-video games"&#x201D;. For how many days might you be willing to complete these assessments (up to 100 days d)?</p><p>Imagine a study, where you were asked to wear an air pollution sensor daily, clipping it to a work bag or to your clothing. For how many days might you be willing to wear and charge this device (up to 100 days d)?</p><p>Imagine a study, where you were asked to wear a GPS location sensor daily, clipping it to a work bag or to your clothing. For how many days might you be willing to wear and charge this device (up to 100 days d)?</p></boxed-text><p>Paired sample <italic>t</italic> tests were conducted to assess the differential willingness to share data from these three critical data streams, each previously implicated in cognitive health research (ie, mobile cognitive assessments, location data (GPS), and ambulatory air quality monitoring). On average, people were willing to complete ambulatory cognitive assessments for 56.7 (SD 36.2) days, air quality monitoring for 58.1 (SD 37.7) days, and GPS location monitoring for 37 (SD 39.0) days. Comparing mobile cognitive assessments and air quality monitoring&#x2014;participants were willing to complete each for a similar period of time (ie, mean difference of approximately 1.4 d; <italic>t</italic><sub>1488</sub>=&#x2212;1.44; <italic>P</italic>=.14). Upon comparing mobile cognitive assessments and GPS location monitoring, participants were willing to complete cognitive assessments for close to 20 more days than GPS location monitoring (ie, mean difference of approximately 19.7 d; <italic>t</italic><sub>1483</sub>=&#x2212;17.89; <italic>P</italic>&#x003C;.001). Comparing mobile air quality monitoring and GPS location monitoring &#x2013; participants were willing to complete air quality monitoring for close to 21 more days than GPS location monitoring (ie, mean difference of approximately 21 days; <italic>t</italic><sub>1483</sub>=&#x2212;20.65; <italic>P</italic>&#x003C;.001).</p></sec><sec id="s3-4"><title>RQ3: What Do People Expect From Their Data?</title><p>Participants were asked: &#x201C;Please select the types of control you expect to have over the data submitted as part of a research study&#x201D; Among the data control and sharing aspects assessed, 1042 (70%) participants were most interested in the ability to delete all their contributed research data, followed by the ability to select specific data streams for deletion (65%, 960) and deleting a specific moment in time (44%, 653). Respondents were least interested in the ability to share data with their insurance providers and caregivers (n=453, 30% and n=384, 25%, respectively; <xref ref-type="fig" rid="figure3">Figure 3</xref>).</p><p>When asked &#x201C;Please rate how comfortable (5-point scale, from extremely comfortable to extremely uncomfortable) you would feel about each of the following situations related to your hypothetical data,&#x201D; participant responses varied by data usage scenario (see <xref ref-type="fig" rid="figure4">Figure 4</xref>): (1) data used only for the purpose of the original study; (2) data used to develop algorithms; (3) data used by outside institutions collaborating on this research; (4) data used indefinitely for purposes unknown today; (5) data used to identify the participant; (6) data used to solve a public health problem; (7) data used to develop therapies and diagnoses. Unsurprisingly, participants were mostly uncomfortable with reidentification and with data being used for unspecified future purposes.. Respondents were mixed in regard to data being used by external collaborations. Participants were mostly comfortable with data being used for the original purpose, to develop therapies and diagnoses, and for algorithm development.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Respondents&#x2019; expectations for data controls as it relates to research.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e64082_fig03.png"/></fig><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Proportion of sample respondents reporting their comfort levels with various aspects of data usage. The x-axis categorizes different data usage aspects. The y-axis represents the proportion of respondents. Responses range from &#x201C;Extremely uncomfortable&#x201D; to &#x201C;Extremely comfortable,&#x201D; indicated by different shades of gray.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e64082_fig04.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Summary of the Findings</title><sec id="s4-1-1"><title>RQ1: What Data Are People Willing to Contribute?</title><p>Overall, participants were most willing to share data streams that have clear health implications (eg, activity sensor, heart rate monitors, air quality monitors) and least willing to share sensitive data streams (eg, GPS locations, driver/passenger-facing dashcam footage, Google search history). Participants were most willing to share data from active data collection activities and were least willing to share passive data streams (eg, sensors, metadata). People&#x2019;s willingness to share data that has obvious health implications replicates prior findings in this area [<xref ref-type="bibr" rid="ref4">4</xref>] and underscores the necessity of education on the relevance of each data stream to health outcomes, if it is to be considered and adopted by research participants.</p></sec><sec id="s4-1-2"><title>RQ2: How Long Are People Willing to Contribute Critical Data Streams?</title><p>On average, participants are willing to share data for up to 37 days, though this varied by data stream assessed. Willingness to share GPS location data was lowest, highlighting participant privacy concerns associated with data that may be more sensitive or identifiable, as was seen with the Strava data leak [<xref ref-type="bibr" rid="ref6">6</xref>]). In contrast, daily cognitive assessments and ambulatory air quality monitoring, were similarly endorsed, further supporting engagement with data streams with clear health implications.</p></sec><sec id="s4-1-3"><title>RQ3: What Controls and Feedback Do People Expect From Their Data?</title><p>Most participants endorsed the desire to delete all or specific streams of research data contributed by them. Although these data-related protections are required as per IRB regulations, most digital health technologies used for research do not necessarily have a straightforward method using which a person may delete their contributed data. This often requires a direct communication with the research group and a manual backend process. Future iterations of app- and cloud-based digital health technologies may want to consider affording the data provider (ie, the participant) more control over their data, including ways to download, remove data as desired, as well as mechanisms by which they can easily share data with key stakeholders in their life (eg, family or physician). Google Takeout is a platform through which Google account users can export all data originating from Google applications. In this study, only 14% individuals were aware of this tool, highlighting the need for data sharing education. Regarding various data usage scenarios, participants were mostly uncomfortable with unknown data use scenarios and reidentification, and comfortable with data being used to develop therapies and diagnoses, especially for the original purpose. Interestingly, participants reported mixed responses about their ratings of comfort, in regard to data being used by external collaborators. These findings highlight the importance of being transparent with participants on the various ways the data are being used&#x2014;as not all data use scenarios are seemingly acceptable.</p></sec></sec><sec id="s4-2"><title>Limitations and Future Directions</title><p>Although a large sample (ie, of approximately 1500 respondents) was recruited for this study, a major limitation is that participant demographics indicate a recruitment bias toward midlife, highly educated (69% have associates degree or higher), White participants (76%, n = 1134), and individuals active on online research platforms. As participation required familiarity with digital interfaces and online survey platforms, the sample may not adequately reflect the views of individuals with low technology adoption rates&#x2014;particularly those in rural or socioeconomically disadvantaged communities [<xref ref-type="bibr" rid="ref13">13</xref>]. Future research should consider probing similar research questions, leveraging a representative and more diverse sample of respondents, especially considering past research has shown differential willingness to share various data as a function of education and minority status. The extent to which older adults (ie, &#x003E;60 years) are aware of and are willing to participate by sharing sensor data and metadata is unclear. Older adults were sparsely represented in this sample, limiting insight into the acceptability of sensor-based monitoring among individuals most likely to benefit from digital health interventions (eg, including those aimed at chronic disease mitigation or cognitive decline). Age-related factors such as cognitive load, sensory impairments, or comfort with technology may interact with perceived burden; however, these nuances were not explored in this study.</p><p>In addition, this study did not directly measure aspects of personality, or expectations for data privacy&#x2014;two factors likely to explain variance in willingness to share data across the spectrum of participant burden. Participants&#x2019; decisions may have been influenced by recent media exposure or personal experiences related to data breaches or algorithmic discrimination, but these factors were not assessed. It is expected that awareness of specific events that highlight the reidentification potential of various sensitive data (eg, GPS) may moderate willingness to share sensitive data, along with the personality constructs of openness and consciousness [<xref ref-type="bibr" rid="ref14">14</xref>]).</p></sec><sec id="s4-3"><title>Conclusions</title><p>Importantly, the study relies on self-reported, hypothetical willingness to share data, which may not correspond with real-world behavior, particularly when actual study conditions involve real data collection amidst daily life schedules and hassles. Future work should validate these findings in live digital health trials to assess whether stated willingness translates to actual participation and data-sharing compliance. This study aimed to elucidate the types of data and control measures that participants expect in research. These findings can guide the optimization of study protocols to enhance participant engagement, data quality, and minimize participant burden. Ensuring participant privacy is paramount, and researchers have a duty to transparently communicate the rationale for data collection and its potential benefits. As researchers intend to collect rich data across the Active-Passive data continuum (see <xref ref-type="fig" rid="figure1">Figure 1</xref>), our participant&#x2019;s privacy comes first, and it is our duty to inform them why we collect the data we do. This approach will foster trust and encourage greater participation in research involving potentially sensitive data streams.</p></sec></sec></body><back><ack><p>NR was previously affiliated with the University of Central Florida and is now at Penn State University. This work was supported in part by funding from a UCF startup.</p></ack><notes><sec><title>Data Availability</title><p>The data that support the findings of this study are available in a public repository on GitHub [<xref ref-type="bibr" rid="ref15">15</xref>]. The repository includes deidentified datasets, code for data preprocessing and analysis, and documentation to facilitate reuse.</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">IRB</term><def><p>institutional review board</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Revilla</surname><given-names>M</given-names> </name><name name-style="western"><surname>Couper</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Ochoa</surname><given-names>C</given-names> </name></person-group><article-title>Willingness of online panelists to perform additional tasks</article-title><source>Methods, Data, Analyses: A Journal for Quantitative Methods and Survey Methodology (Mda)</source><year>2019</year><volume>13</volume><issue>2</issue><fpage>223</fpage><lpage>252</lpage><pub-id pub-id-type="doi">10.12758/mda.2018.01</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wenz</surname><given-names>A</given-names> </name><name name-style="western"><surname>J&#x00E4;ckle</surname><given-names>A</given-names> </name><name name-style="western"><surname>Couper</surname><given-names>MP</given-names> </name></person-group><article-title>Willingness to use mobile technologies for data collection in a probability household panel</article-title><source>Surv Res Methods</source><year>2019</year><volume>13</volume><issue>1</issue><fpage>1</fpage><lpage>22</lpage><pub-id pub-id-type="doi">10.18148/srm/2019.v1i1.7298</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Struminskaya</surname><given-names>B</given-names> </name><name name-style="western"><surname>Lugtig</surname><given-names>P</given-names> </name><name name-style="western"><surname>Toepoel</surname><given-names>V</given-names> </name><name name-style="western"><surname>Schouten</surname><given-names>B</given-names> </name><name name-style="western"><surname>Giesen</surname><given-names>D</given-names> </name><name name-style="western"><surname>Dolmans</surname><given-names>R</given-names> </name></person-group><article-title>Sharing data collected with smartphone sensors: willingness, participation, and nonparticipation bias</article-title><source>Public Opin Q</source><year>2021</year><volume>85</volume><issue>Suppl 1</issue><fpage>423</fpage><lpage>462</lpage><pub-id pub-id-type="doi">10.1093/poq/nfab025</pub-id><pub-id pub-id-type="medline">34602867</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Seltzer</surname><given-names>E</given-names> </name><name name-style="western"><surname>Goldshear</surname><given-names>J</given-names> </name><name name-style="western"><surname>Guntuku</surname><given-names>SC</given-names> </name><etal/></person-group><article-title>Patients&#x2019; willingness to share digital health and non-health data for research: a cross-sectional study</article-title><source>BMC Med Inform Decis Mak</source><year>2019</year><month>08</month><day>8</day><volume>19</volume><issue>1</issue><fpage>157</fpage><pub-id pub-id-type="doi">10.1186/s12911-019-0886-9</pub-id><pub-id pub-id-type="medline">31395102</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Keusch</surname><given-names>F</given-names> </name><name name-style="western"><surname>Wenz</surname><given-names>A</given-names> </name><name name-style="western"><surname>Conrad</surname><given-names>F</given-names> </name></person-group><article-title>Do you have your smartphone with you? Behavioral barriers for measuring everyday activities with smartphone sensors</article-title><source>Comput Human Behav</source><year>2022</year><month>02</month><volume>127</volume><fpage>107054</fpage><pub-id pub-id-type="doi">10.1016/j.chb.2021.107054</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Hsu</surname><given-names>J</given-names> </name></person-group><article-title>The strava heat map shows even militaries can&#x2019;t keep secrets from social data</article-title><source>Wired</source><access-date>2025-04-21</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.wired.com/story/strava-heat-map-military-bases-fitness-trackers-privacy/">https://www.wired.com/story/strava-heat-map-military-bases-fitness-trackers-privacy/</ext-link></comment></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hysong</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Petersen</surname><given-names>LA</given-names> </name></person-group><article-title>Passive monitoring versus active assessment of clinical performance: impact on measured quality of care</article-title><source>Med Care</source><year>2011</year><month>10</month><volume>49</volume><issue>10</issue><fpage>883</fpage><lpage>890</lpage><pub-id pub-id-type="doi">10.1097/MLR.0b013e318222a36c</pub-id><pub-id pub-id-type="medline">21918399</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="web"><article-title>Quality data from real people for faster breakthroughs</article-title><source>Prolific</source><access-date>2025-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://www.prolific.co">www.prolific.co</ext-link></comment></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="web"><article-title>The R Project for Statistical Computing</article-title><source>The R Foundation</source><year>2021</year><access-date>2025-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.R-project.org/">https://www.R-project.org/</ext-link></comment></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wickham</surname><given-names>H</given-names> </name><name name-style="western"><surname>Averick</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bryan</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Welcome to the Tidyverse</article-title><source>JOSS</source><year>2019</year><volume>4</volume><issue>43</issue><fpage>1686</fpage><pub-id pub-id-type="doi">10.21105/joss.01686</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wickham</surname><given-names>H</given-names> </name></person-group><article-title>ggplot2</article-title><source>WIREs Computational Stats</source><year>2011</year><month>03</month><volume>3</volume><issue>2</issue><fpage>180</fpage><lpage>185</lpage><pub-id pub-id-type="doi">10.1002/wics.147</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Wickham</surname><given-names>H</given-names> </name><name name-style="western"><surname>Francois</surname><given-names>R</given-names> </name><name name-style="western"><surname>Henry</surname><given-names>L</given-names> </name><name name-style="western"><surname>M&#x00FC;ller</surname><given-names>K</given-names> </name><collab>Dplyr</collab></person-group><article-title>Dplyr: A Grammar of Data Manipulation. R Package Version 0.8.4.</article-title><year>2014</year><access-date>2020-08-12</access-date><publisher-name>R project</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://CRAN.R-project.org/package=dplyr">https://CRAN.R-project.org/package=dplyr</ext-link></comment></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pethig</surname><given-names>F</given-names> </name><name name-style="western"><surname>Kroenung</surname><given-names>J</given-names> </name><name name-style="western"><surname>Noeltner</surname><given-names>M</given-names> </name></person-group><article-title>A stigma power perspective on digital government service avoidance</article-title><source>Gov Inf Q</source><year>2021</year><month>04</month><volume>38</volume><issue>2</issue><fpage>101545</fpage><pub-id pub-id-type="doi">10.1016/j.giq.2020.101545</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Linek</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Fecher</surname><given-names>B</given-names> </name><name name-style="western"><surname>Friesike</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hebing</surname><given-names>M</given-names> </name></person-group><article-title>Data sharing as social dilemma: Influence of the researcher&#x2019;s personality</article-title><source>PLOS ONE</source><year>2017</year><volume>12</volume><issue>8</issue><fpage>e0183216</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0183216</pub-id><pub-id pub-id-type="medline">28817642</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="web"><article-title>Nelsonroque/cascadelab_apdcm_mhealth</article-title><source>GitHub</source><access-date>2025-08-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/nelsonroque/cascadelab_apdcm_mhealth">https://github.com/nelsonroque/cascadelab_apdcm_mhealth</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Data for the willingness to participate, and share various streams.</p><media xlink:href="formative_v9i1e64082_app1.docx" xlink:title="DOCX File, 26 KB"/></supplementary-material></app-group></back></article>