<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v10i1e79315</article-id>
      <article-id pub-id-type="pmid">42140619</article-id>
      <article-id pub-id-type="doi">10.2196/79315</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Evaluating Crowdsourced Data Collection for Carceral Death Surveillance: Pilot Study Using Amazon Mechanical Turk</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Sarvestan</surname>
            <given-names>Javad</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Hagan</surname>
            <given-names>Liesl M</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Wang</surname>
            <given-names>Emily</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0314-2464</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Healey-Parera</surname>
            <given-names>Julia</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0004-1523-8799</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Duan</surname>
            <given-names>Amy</given-names>
          </name>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-0928-5489</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Cloud</surname>
            <given-names>David H</given-names>
          </name>
          <degrees>PhD, JD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Population Health Sciences</institution>
            <institution>School of Medicine</institution>
            <institution>Duke University</institution>
            <addr-line>215 Morris Street</addr-line>
            <addr-line>Suite 210, Box 104023</addr-line>
            <addr-line>Durham, NC, 27701</addr-line>
            <country>United States</country>
            <phone>1 919 681 6801</phone>
            <email>david.cloud@duke.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-5270-4171</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Fliss</surname>
            <given-names>Mike Dolan</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3194-7171</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Brinkley-Rubinstein</surname>
            <given-names>Lauren</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2191-6240</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Population Health Sciences</institution>
        <institution>School of Medicine</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Injury Prevention Research Center</institution>
        <institution>University of North Carolina at Chapel Hill</institution>
        <addr-line>Chapel Hill, NC</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: David H Cloud <email>david.cloud@duke.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2026</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>15</day>
        <month>5</month>
        <year>2026</year>
      </pub-date>
      <volume>10</volume>
      <elocation-id>e79315</elocation-id>
      <history>
        <date date-type="received">
          <day>19</day>
          <month>6</month>
          <year>2025</year>
        </date>
        <date date-type="rev-request">
          <day>21</day>
          <month>8</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>10</day>
          <month>2</month>
          <year>2026</year>
        </date>
        <date date-type="accepted">
          <day>16</day>
          <month>2</month>
          <year>2026</year>
        </date>
      </history>
      <copyright-statement>©Emily Wang, Julia Healey-Parera, Amy Duan, David H Cloud, Mike Dolan Fliss, Lauren Brinkley-Rubinstein. Originally published in JMIR Formative Research (https://formative.jmir.org), 15.05.2026.</copyright-statement>
      <copyright-year>2026</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2026/1/e79315" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>People who are incarcerated face significantly higher health risks than the general population, yet deaths in custody remain underreported and poorly monitored by public health systems. Although the federal Death in Custody Reporting Act requires reporting of all deaths in correctional facilities to the US Department of Justice, reporting has been inconsistent, delayed, and often publicly inaccessible. Consequently, researchers have turned to press releases issued by correctional agencies as one of the few timely sources of information on deaths in custody. However, these press releases vary widely in content and structure, making standardized data extraction difficult. Crowdsourcing platforms such as Amazon Mechanical Turk (MTurk) may offer a faster, low-cost method for gathering data, but their utility in this setting remains untested.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This pilot study evaluated whether MTurk could be used to extract structured information from press releases about deaths in custody.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We selected 144 press releases describing deaths between 2000 and 2023 from state prison systems and Immigration and Customs Enforcement. Each press release was assigned to 3 MTurk crowd workers (who were required to be English speaking and located in the United States), resulting in 432 individual responses. Workers were informed in advance that the task involved reviewing sensitive content related to deaths in custody. Crowd workers completed a 16-question form aligned with Death in Custody Reporting Act variables, including age, race and ethnicity, date of death, and facility location. Data quality was assessed using strict concordance (all 3 responses matched), 2-way concordance (2 of 3 responses matched), and qualitative review of common errors. Task completion time was also recorded. Sampling included complete subsets of selected press releases and a stratified subset from systems with more complex reporting formats.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>All 144 entries were completed within 48 hours. However, agreement across crowd workers was low: strict concordance was 14.2% (20/144) for age, 12.3% (18/144) for race or ethnicity, and 11.4% (16/144) for date of birth. Qualitative review identified frequent errors, missing data, and inattentive or automated responses. Crowd workers often misinterpreted system-specific terminology or copied placeholders instead of extracting information from the source. The low agreement indicated that this baseline MTurk configuration produced insufficient data quality for more resource-intensive use.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>MTurk enabled rapid task completion but produced low-quality results when applied to extracting structured data from carceral press releases. These findings suggest that general crowdsourcing platforms are poorly suited to complex data abstraction tasks without additional training or oversight. With improved task design or support from artificial intelligence tools, crowdsourcing may help address gaps in the surveillance of deaths in custody. Long-term improvements will require consistent, transparent, and standardized reporting practices across correctional institutions.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>carceral health</kwd>
        <kwd>deaths in custody</kwd>
        <kwd>mortality surveillance</kwd>
        <kwd>crowdsourcing</kwd>
        <kwd>Amazon Mechanical Turk</kwd>
        <kwd>structured data abstraction</kwd>
        <kwd>digital epidemiology</kwd>
        <kwd>health equity</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>With more than 1.2 million people held in state and federal prisons, the United States operates the most expansive prison system in the world [<xref ref-type="bibr" rid="ref1">1</xref>]. As mass incarceration has grown, premature deaths in custody have emerged as a mounting public health crisis, increasing in scale while receiving limited attention from public health systems [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. People who are incarcerated experience substantial health disparities shaped by the conditions of confinement [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Overcrowding, idleness, unsanitary living spaces, inadequate nutrition, limited access to medical and mental health care, isolation, and exposure to violence all contribute to worsening health and increased risk of premature death [<xref ref-type="bibr" rid="ref2">2</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. Since 2001, the prison mortality rate has increased by 77%, with particularly steep rises in suicides and drug- and alcohol-related deaths. Between 2001 and 2018, drug- and alcohol-related deaths increased more than sixfold, and suicides rose by more than 85% [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>].</p>
      <p>Despite the growing number of deaths in US jails and prisons, the nation lacks a coordinated public health and policy infrastructure for tracking, reporting, and responding to carceral mortality [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. The Death in Custody Reporting Act (DCRA) requires state and local agencies, as well as federal agencies within the Department of Justice, to report all deaths in custody to the Attorney General, including deaths occurring during arrest; in transit; and within correctional facilities such as jails, prisons, and juvenile detention centers. However, DCRA does not apply to agencies outside the Department of Justice, such as US Immigration and Customs Enforcement (ICE), which is housed within the Department of Homeland Security and governed instead by internal policies and congressional directives requiring separate public reporting [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>].</p>
      <p>This fragmented jurisdictional landscape contributes to persistent gaps, delays, and inconsistencies in mortality data, which undermine efforts to track trends, hold institutions accountable for conditions that contribute to preventable deaths in custody, and seek justice for those who die behind bars and their families [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. A recent national study found that only 1 prison system, Iowa, publicly releases death data that are both timely and complete under DCRA standards. Over one-third of systems release no individual-level death data at all, while most others either publish information with substantial delays or omit essential details such as age, cause of death, or facility [<xref ref-type="bibr" rid="ref11">11</xref>].</p>
      <p>Although incarceration is a key structural determinant of health inequities in the United States [<xref ref-type="bibr" rid="ref4">4</xref>], responsibility for tracking deaths in custody has largely remained outside the public health system. Surveillance of deaths in jails, prisons, and other detention facilities is not integrated into Centers for Disease Control and Prevention mortality systems, and carceral health research receives minimal support from the National Institutes of Health [<xref ref-type="bibr" rid="ref13">13</xref>]. This lack of public health ownership is reflected in vital records systems, including death certificates, which do not consistently indicate whether a death occurred in custody. Although adding a standardized field or checkbox has been proposed, it has not been implemented nationally [<xref ref-type="bibr" rid="ref2">2</xref>]. Because federal funding priorities shape state and local public health capacity, these gaps further constrain the ability of public health systems to monitor and respond to carceral mortality [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p>
      <p>In 2019, federal responsibility for collecting deaths-in-custody data shifted from the Bureau of Justice Statistics, a statistical agency with a mandate for public reporting, to the Bureau of Justice Assistance, a grant-making agency with less experience in data collection and analysis. This transition raised concerns about data quality and transparency. Although Bureau of Justice Assistance began publishing carceral mortality dashboards in 2024, the datasets contain clear errors and omissions, including states listed as having no deaths and entries missing key information such as cause of death or demographic characteristics [<xref ref-type="bibr" rid="ref14">14</xref>]. These shortcomings have further weakened confidence in federal oversight of deaths in custody.</p>
      <p>Surveillance, transparency, and accountability are closely linked in the context of carceral mortality. Transparency depends on timely, public reporting of deaths by correctional systems, yet official data sources often fail to meet this standard [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. National analyses of DCRA compliance show that 39% of prison systems release no individual-level death data. Among systems that do report deaths, only Iowa publishes complete and timely information that includes all DCRA-required elements within the federal 3-month reporting window [<xref ref-type="bibr" rid="ref11">11</xref>]. Because official carceral mortality data are frequently delayed or incomplete, press releases issued by carceral systems often provide the earliest publicly available information about deaths in custody. However, both the availability and content of these press releases vary widely across jurisdictions.</p>
      <p>This study builds on the work of the Third City Project at Duke University, which was launched during the COVID-19 pandemic to improve transparency in carceral health data. While initially focused on tracking infectious disease outbreaks in prisons and jails, the project later expanded to address broader gaps in mortality reporting. Through manual review and coding of hundreds of press releases, the research team found that although these documents often contain valuable information, extracting structured data from them is labor intensive and difficult to scale [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref14">14</xref>].</p>
      <p>These constraints prompted consideration of alternative approaches that might support more timely data abstraction without relying exclusively on trained research staff. One such approach is crowdsourcing, which has been increasingly used in health and social science research to complete discrete, repeatable tasks at scale. Platforms such as Amazon Mechanical Turk (MTurk) and Prolific are commonly used to recruit participants for surveys and behavioral experiments, offering speed, relatively low cost, and access to large respondent pools [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref19">19</xref>]. In public health, crowdsourcing has been applied to studies of vaccine attitudes [<xref ref-type="bibr" rid="ref20">20</xref>], substance use [<xref ref-type="bibr" rid="ref21">21</xref>], and disability [<xref ref-type="bibr" rid="ref22">22</xref>], as well as in criminology to research on public attitudes toward incarceration and punishment [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>].</p>
      <p>Beyond survey-based research, crowdsourcing has also been used for content-focused tasks in fields such as computer science, information science, and the digital humanities, including annotating scientific abstracts, labeling archival materials, and coding legal or biomedical texts [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. In these applications, crowd workers extract or classify information from existing documents rather than generate original responses. Such studies typically rely on relatively controlled source materials with consistent formats, specialized vocabularies, and detailed task instructions or training.</p>
      <p>By contrast, press releases reporting deaths in custody vary widely in structure, language, and level of detail; often include institution-specific terminology; and reflect differing norms around transparency and disclosure across carceral systems [<xref ref-type="bibr" rid="ref11">11</xref>]. These features introduce challenges that may limit the effectiveness of general-purpose crowdsourcing approaches designed for more standardized materials.</p>
      <p>At the same time, press releases are among the few mechanisms through which individual-level information about deaths in custody enters the public record within days or weeks of a death, despite substantial variation in content and completeness [<xref ref-type="bibr" rid="ref11">11</xref>]. Consequently, they represent a constrained but potentially valuable data source for improving the timeliness of carceral mortality surveillance.</p>
      <p>This pilot study examines the use of MTurk to extract structured mortality information from press releases describing deaths in custody, using a basic task design and minimal crowd worker screening or training to characterize baseline performance.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Study Design and Data Sources</title>
        <p>As part of its ongoing work to improve transparency around carceral health outcomes, the Third City Project systematically collects and standardizes data on in-custody deaths reported through state prison system press releases [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. Press releases were selected from a broader dataset of carceral mortality notifications compiled by the Third City Project, which includes public announcements from state Departments of Corrections; the Federal Bureau of Prisons; ICE; and select territories such as Washington, District of Columbia, and Puerto Rico.</p>
        <p>For this pilot study, we analyzed 144 press releases from state prison systems and ICE. Press releases from jails, the Federal Bureau of Prisons, Washington, District of Columbia, and Puerto Rico were not included. Consequently, the MTurk sample represents deaths occurring in state prisons and immigration detention but not in jails or federal prisons.</p>
        <p>Press releases were sourced from official Department of Corrections websites, agency social media accounts, and periodic bulletins. Relevant information was manually extracted and entered into standardized, state-specific Qualtrics (Qualtrics Inc) forms capturing variables such as the decedent’s name, demographic characteristics, date and location of death, cause of death, facility name, and incarceration date. In some cases, states also maintained dashboards or published aggregate mortality statistics. The dataset was cleaned and standardized using custom R scripts prior to analysis.</p>
      </sec>
      <sec>
        <title>Crowdsourcing Platform and Procedure</title>
        <p>MTurk is a web-based crowdsourcing platform that allows employers, known as requesters, to post microtasks online—called human intelligence tasks (HITs)—for human workers, or “turkers,” to complete in exchange for compensation. Each HIT is a self-contained assignment, such as identifying content in a photo, extracting information from a document, or answering survey questions. Once an HIT is completed, the requester reviews the quality of the submission and determines whether the work meets standards for payment.</p>
        <p>In July 2024, we conducted a pilot study using MTurk to evaluate whether crowd workers could extract structured data from publicly available prison death press releases. Each HIT required workers to complete a structured 16-question form based on a single press release. For each entry, workers were provided the decedent’s name, a direct link to the press release, the correctional system involved, and system-specific instructions. Variables aligned with DCRA requirements and included age, race or ethnicity, date and location of death, cause of death, and facility name. Workers were instructed to leave fields blank if information was not reported.</p>
        <p>Each press release was independently assigned to 3 crowd workers to enable comparison across responses. Task instructions were intentionally brief, and no formal attention checks were embedded, to observe baseline performance under low-barrier conditions. Because ICE press releases often include more detailed immigration and medical histories, a supplemental survey containing 8 additional questions was deployed for ICE entries only. Crowd workers were informed prior to task acceptance that the assignment involved reviewing a press release describing a death in custody and could decline participation without penalty.</p>
      </sec>
      <sec>
        <title>Sampling</title>
        <p>Entries were selected by taking a complete sample of press releases published in 2023 from the larger Third City dataset (n=7184 as of August 2024), supplemented by a stratified subsample of up to 5 press releases from each of 5 systems with more complex reporting formats: Arkansas, Florida, Montana, Texas, and ICE.</p>
        <p>Because this pilot was designed to assess feasibility rather than generate population-level estimates, we did not aim for a balanced or representative sample. Instead, we deliberately oversampled systems with more complex reporting structures to ensure inclusion of both straightforward and challenging cases. This design should be interpreted as a feasibility test rather than as representative of typical state prison press releases.</p>
      </sec>
      <sec>
        <title>Data Quality Assessment and Statistical Analysis</title>
        <p>To assess data quality, we conducted a concordance analysis comparing responses submitted by the 3 crowd workers assigned to each press release. Analyses focused on variables required under the DCRA, as these fields are central to carceral mortality surveillance.</p>
        <p>We calculated the percentage of entries in which all 3 crowd workers provided the same response (strict concordance) and the percentage in which 2 of 3 responses matched (2-way concordance). These measures reflect complete and majority agreement, respectively, and exclude partial matches. CIs were calculated for all concordance estimates. Discrepancies were reviewed qualitatively to identify common sources of error, including missing or skipped fields, inconsistent interpretation of press release content, and copying of placeholder examples rather than source material.</p>
        <p>To limit risks of misclassification, MTurk outputs were treated strictly as data extraction measures rather than definitive classifications of press release content. Crowd worker responses were compared to data manually extracted by Third City Project research assistants as a reference point for identifying discrepancies, rather than as a formal gold standard validation. Assigning multiple independent crowd workers to each press release allowed us to quantify uncertainty and identify entries with high disagreement. Variables were defined using language commonly used in press releases (eg, “facility housed” and “press release date”) to avoid binary or morally loaded classifications.</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study involved analysis of publicly available press releases and was reviewed and approved by the Duke University Institutional Review Board (Pro00111898). All source materials were published by correctional agencies and accessed through official public channels. No private or nonpublic records were used.</p>
        <p>Decedent names and links to press releases were retained because they were part of the original public disclosures and were necessary to assess whether identifying information was consistently reported and could be reliably extracted across systems. No additional personal information was collected, inferred, or linked beyond what was included in the publicly released materials.</p>
        <p>Crowd workers were informed prior to task acceptance that the assignment involved reviewing a press release describing a death in custody. This warning appeared in the task title and description on the MTurk marketplace, allowing workers to opt out without penalty if they did not wish to engage with the content. All press releases were reviewed in advance by Third City Project research assistants to screen for graphic or disturbing material before inclusion in the task.</p>
        <p>Compensation was set based on task length and complexity and benchmarked against prevailing MTurk rates to ensure payment above the platform average for comparable tasks. The study did not require workers to generate original content or make judgments about responsibility or cause beyond extracting information explicitly stated in the source material.</p>
        <p>To limit the risk of misclassification that could affect public narratives about deaths in custody, MTurk outputs were treated as data extraction rather than definitive classifications. Each press release was reviewed by multiple independent crowd workers, and disagreement across responses was used to identify uncertainty rather than to assert accuracy. Results were reported in aggregate, and high-disagreement cases were flagged for review rather than interpreted as definitive records.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>The MTurk pilot demonstrated that while crowdsourcing offers a rapid turnaround for data collection, it yielded low-quality results when applied to carceral death press releases. All 144 assigned tasks were completed within 2 days, reflecting the efficiency of the platform. However, concordance analysis revealed low consistency across crowd worker responses.</p>
      <p><xref ref-type="table" rid="table1">Table 1</xref> presents 2-way (2-of-3) concordance for variables aligned with DCRA reporting requirements, along with 95% CIs. Two-way concordance captures how often independently submitted responses converged on the same value for a given field.</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Two-way concordance of Amazon Mechanical Turk crowd worker responses for variables extracted from prison mortality press releases.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="500"/>
          <col width="500"/>
          <thead>
            <tr valign="top">
              <td>Variable</td>
              <td>Two-way concordance (95% CI)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>First name</td>
              <td>0.7092 (0.6268-0.7826)</td>
            </tr>
            <tr valign="top">
              <td>Last name</td>
              <td>0.6596 (0.5751-0.7372)</td>
            </tr>
            <tr valign="top">
              <td>Race or ethnicity</td>
              <td>0.6738 (0.5898-0.7503)</td>
            </tr>
            <tr valign="top">
              <td>Age</td>
              <td>0.5532 (0.4672-0.6369)</td>
            </tr>
            <tr valign="top">
              <td>Gender</td>
              <td>0.5957 (0.5099-0.6775)</td>
            </tr>
            <tr valign="top">
              <td>Location of death</td>
              <td>0.3688 (0.2892-0.4541)</td>
            </tr>
            <tr valign="top">
              <td>Date of death</td>
              <td>0.4255 (0.3427-0.5115)</td>
            </tr>
            <tr valign="top">
              <td>Cause of death</td>
              <td>0.3050 (0.2303-0.3880)</td>
            </tr>
            <tr valign="top">
              <td>Facility housed</td>
              <td>0.5035 (0.4182-0.5888)</td>
            </tr>
            <tr valign="top">
              <td>Press release date</td>
              <td>0.4751 (0.3905-0.5609)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>Two-way concordance was highest for basic identifying information. Matching responses were most common for first name (0.7092, 95% CI 0.6268-0.7826), last name (0.6596, 95% CI 0.5751-0.7372), and race or ethnicity (0.6738, 95% CI 0.5898-0.7503). Moderate levels of concordance were observed for age (0.5532, 95% CI 0.4672-0.6369), gender (0.5957, 95% CI 0.5099-0.6775), and facility housed (0.5035, 95% CI 0.4182-0.5888).</p>
      <p>Lower 2-way concordance was observed for variables that were inconsistently reported or embedded within narrative text. These included date of death (0.4255, 95% CI 0.3427-0.5115), press release date (0.4751, 95% CI 0.3905-0.5609), location of death (0.3688, 95% CI 0.2892-0.4541), and cause of death (0.3050, 95% CI 0.2303-0.3880). Overall, convergence across independent responses was higher for discrete, clearly labeled fields than for information requiring interpretation across multiple sections of a press release.</p>
      <p><xref ref-type="table" rid="table2">Table 2</xref> presents strict 3-way concordance, defined as identical responses across all 3 independent crowd workers for a given field. This measure represents a conservative benchmark of consistency and reflects the upper bound of agreement achievable without review or correction.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Three-way concordance of Amazon Mechanical Turk crowd worker responses for variables extracted from prison mortality press releases.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="500"/>
          <col width="500"/>
          <thead>
            <tr valign="top">
              <td>Variable</td>
              <td>Three-way concordance (95% CI)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>First name</td>
              <td>0.2553 (0.1857-0.3355)</td>
            </tr>
            <tr valign="top">
              <td>Last name</td>
              <td>0.2340 (0.1669-0.3127)</td>
            </tr>
            <tr valign="top">
              <td>Race or ethnicity</td>
              <td>0.1277 (0.0774-0.1942)</td>
            </tr>
            <tr valign="top">
              <td>Age</td>
              <td>0.1418 (0.0888-0.2105)</td>
            </tr>
            <tr valign="top">
              <td>Gender</td>
              <td>0.0639 (0.0296-0.1177)</td>
            </tr>
            <tr valign="top">
              <td>Location of death</td>
              <td>0.0567 (0.0248-0.1087)</td>
            </tr>
            <tr valign="top">
              <td>Date of death</td>
              <td>0.2553 (0.0345-0.1266)</td>
            </tr>
            <tr valign="top">
              <td>Cause of death</td>
              <td>0.0425 (0.0158-0.0903)</td>
            </tr>
            <tr valign="top">
              <td>Facility housed</td>
              <td>0.1277 (0.0774-0.1942)</td>
            </tr>
            <tr valign="top">
              <td>Press release date</td>
              <td>0.1206 (0.0718-0.1860)</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p>For demographic and contextual fields, 3-way concordance was substantially lower. Concordance for age (0.1418, 95% CI 0.0888-0.2105), race or ethnicity (0.1277, 95% CI 0.0774-0.1942), and facility housed (0.1277, 95% CI 0.0774-0.1942) indicated limited consistency across independently submitted responses. The lowest levels of 3-way concordance were observed for cause of death (0.0425, 95% CI 0.0158-0.0903), location of death (0.0567, 95% CI 0.0248-0.1087), and gender (0.0639, 95% CI 0.0296-0.1177), all of which were frequently missing, inconsistently reported, or embedded within narrative text.</p>
      <p>Qualitative review identified several common sources of error. First, some crowd workers submitted inaccurate data across multiple fields. For instance, several age and race entries appeared to be inferred from photographs in the press release rather than stated information. Second, crowd workers often skipped fields that were present in the source or copied placeholder examples instead of completing the form. Finally, for systems with more complex reporting formats, such as ICE or Texas, crowd workers sometimes returned overly specific but incorrect facility names, suggesting reliance on external sources or automated tools rather than the press release itself.</p>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <p>This study assessed whether MTurk could serve as a scalable tool to support the timely collection of carceral mortality data, a need made urgent by persistent delays, data gaps, and inconsistent reporting across carceral systems [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Although crowdsourcing platforms are widely used in public health research for their speed and low cost, their performance in complex data abstraction tasks is less well understood. Therefore, we conducted a feasibility study using a deliberately low-barrier task design, with minimal instructions and no enhanced crowd worker screening or training, to characterize baseline performance under conditions that might be considered for rapid, low-cost deployment. Under these conditions, MTurk enabled rapid task completion but produced low concordance across key mortality fields.</p>
      <p>Crowdsourcing has gained traction in public health for tasks such as disease surveillance, participatory epidemiology, and outbreak monitoring due to its capacity to generate large volumes of timely data at low cost [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>]. While their speed and scalability are appealing, researchers have raised concerns about data quality, sampling bias, and crowd worker attentiveness, especially in studies requiring accurate or complex data, where these tools may introduce significant limitations [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>]. Our findings are consistent with these concerns.</p>
      <p>Across many variables required under the DCRA, concordance between independently submitted crowd worker responses was low. Even for core DCRA fields such as age, race or ethnicity, and date of birth, strict 3-way agreement occurred in fewer than 15% (20/144, 18/144, and 37/144, respectively) of cases. These results indicate substantial inconsistency in how crowd workers interpreted and extracted information from the same press releases and suggest that baseline MTurk configurations are poorly suited for unreviewed abstraction of mortality data intended to support surveillance or accountability.</p>
      <p>One factor contributing to these limitations appears to be the specialized nature of carceral press releases. These documents often contain system-specific terminology, unclear abbreviations, and facility naming conventions that may be unfamiliar to general audiences. Crowd workers without prior experience or training appeared to struggle with these features, leading to errors even when the correct information was present. Errors were particularly common for variables that are central to DCRA reporting but inconsistently labeled in press releases, such as cause and location of death. In some cases, responses were overly specific but incorrect, suggesting reliance on external searches or automated tools rather than the press release itself.</p>
      <p>Despite these limitations, MTurk may have limited utility if applied in more constrained or carefully designed ways. More selective worker eligibility criteria, such as higher approval thresholds or prior experience with similar tasks, could improve performance. Providing clearer field-level guidance or brief tutorials tailored to carceral terminology may also reduce misinterpretation. For complex or sensitive variables, hybrid approaches that combine crowdsourcing with trained review may be necessary [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p>
      <p>Alternative platforms such as Prolific may offer stronger infrastructure for academic research. Prolific provides tools for prescreening, attention checks, and improved compensation, which have been associated with higher-quality data in survey-based studies. Some evidence suggests that experienced crowd workers may be migrating away from MTurk in favor of platforms with better pay and task design [<xref ref-type="bibr" rid="ref16">16</xref>]. Past public health studies have successfully used Prolific to conduct psychometrically oriented substance use research and administer surveys to determine perceptions of COVID-19 among the public [<xref ref-type="bibr" rid="ref25">25</xref>-<xref ref-type="bibr" rid="ref27">27</xref>]. However, it remains unclear whether these advantages would translate to complex data abstraction tasks involving heterogeneous and institutionally specific source materials, such as carceral death press releases.</p>
      <p>Emerging applications of large language models (LLMs) also merit consideration. LLMs are increasingly used to extract information from unstructured text and may offer potential for processing press releases and other narrative data related to carceral deaths [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. Exploring the use of LLMs for carceral mortality surveillance may be a worthwhile direction for future research.</p>
      <p>Our pilot used a low-barrier approach to assess baseline feasibility for a specific research objective to identify limitations and guide future applications of this method. Several strategies may improve the reliability of future efforts to extract structured data from press releases reporting deaths in custody. Dividing the task into smaller components may help crowd workers navigate complex narratives more effectively. Providing field-specific examples and a brief tutorial could improve clarity and reduce misinterpretation. Limiting participation to crowd workers with higher approval ratings or prior experience in similar tasks may also enhance consistency [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref32">32</xref>].</p>
      <p>Several limitations should be considered when interpreting these findings. First, the analysis relied on a single crowdsourcing platform and reflects the performance of its general worker pool without enhanced screening or training. Second, the pilot included a relatively small sample of 144 entries and intentionally oversampled systems with more complex reporting formats. As a result, the findings describe this specific feasibility test and should not be generalized to all state prison press releases. Third, the source materials themselves varied widely in structure and completeness, with essential information often missing or ambiguously reported. Fourth, although concordance was assessed across multiple workers, we did not validate MTurk outputs against a gold standard dataset coded by trained experts. Future studies should directly compare crowdsourced extraction to expert abstraction to better assess accuracy. Finally, this pilot was not designed to evaluate how task-level factors, such as compensation, task length, or worker background, affected performance. Examining these factors is an important direction for future work.</p>
      <p>Crowdsourcing methods also raise ethical concerns. These platforms often rely on low-paid labor to perform tasks requiring sustained attention and judgment. Asking untrained workers to process sensitive information about deaths in custody raises concerns about fairness, emotional burden, and responsibility in digital labor. In addition, this approach carries a risk of misclassifying carceral death data, which can have serious consequences. Records of deaths in custody carry legal, political, and public health significance, and inaccuracies may have unintended downstream effects.</p>
      <p>As deaths in custody remain an urgent but undermonitored public health concern, there is growing interest in approaches that could improve the timeliness of mortality data consistent with DCRA requirements. In this feasibility pilot, MTurk enabled rapid task completion but produced data with limited reliability for extracting several key mortality variables. These findings reflect the specific low-barrier task design and conditions tested here and indicate that caution is warranted when applying general-purpose crowdsourcing platforms to carceral mortality surveillance. Future research should examine whether more targeted task design, alternative platforms, or complementary automated approaches can improve performance, alongside continued efforts to strengthen standardized and transparent public reporting of deaths in custody.</p>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">DCRA</term>
          <def>
            <p>Death in Custody Reporting Act</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">HIT</term>
          <def>
            <p>human intelligence task</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">ICE</term>
          <def>
            <p>Immigration and Customs Enforcement</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">MTurk</term>
          <def>
            <p>Amazon Mechanical Turk</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>The authors are grateful to the Data+ program at Duke University for supporting undergraduate student involvement in the Third City Project.</p>
    </ack>
    <notes>
      <sec>
        <title>Funding</title>
        <p>This work was supported by the Robert Wood Johnson Foundation. The funder had no role in the design, analysis, interpretation, or publication of this study.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sawyer</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Mass incarceration: the whole pie 2024</article-title>
          <source>Prison Policy Initiative</source>
          <year>2024</year>
          <access-date>2026-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.prisonpolicy.org/factsheets/pie2024_allimages.pdf">https://www.prisonpolicy.org/factsheets/pie2024_allimages.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mitchell</surname>
              <given-names>RA Jr</given-names>
            </name>
            <name name-style="western">
              <surname>Aronson</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <source>Death in Custody: How America Ignores the Truth and What We Can Do about It</source>
          <year>2023</year>
          <month>09</month>
          <day>05</day>
          <publisher-loc>Baltimore, MD</publisher-loc>
          <publisher-name>Johns Hopkins University Press</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Binswanger</surname>
              <given-names>IA</given-names>
            </name>
            <name name-style="western">
              <surname>Kinner</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Deaths in custody and following release</article-title>
          <source>J Health Hum Serv Adm</source>
          <year>2019</year>
          <month>12</month>
          <day>01</day>
          <volume>41</volume>
          <issue>4</issue>
          <fpage>45</fpage>
          <lpage>84</lpage>
          <pub-id pub-id-type="doi">10.1177/107937391904100403</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Brinkley-Rubinstein</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Berk</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>BA</given-names>
            </name>
          </person-group>
          <article-title>Carceral health care</article-title>
          <source>N Engl J Med</source>
          <year>2025</year>
          <month>02</month>
          <day>27</day>
          <volume>392</volume>
          <issue>9</issue>
          <fpage>892</fpage>
          <lpage>901</lpage>
          <pub-id pub-id-type="doi">10.1056/NEJMra2212149</pub-id>
          <pub-id pub-id-type="medline">40009808</pub-id>
          <pub-id pub-id-type="pmcid">PMC11995879</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cloud</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Grossman</surname>
              <given-names>IR</given-names>
            </name>
            <name name-style="western">
              <surname>Armstrong</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Public health and prisons: priorities in the age of mass incarceration</article-title>
          <source>Annu Rev Public Health</source>
          <year>2023</year>
          <month>04</month>
          <day>03</day>
          <volume>44</volume>
          <fpage>407</fpage>
          <lpage>28</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.annualreviews.org/content/journals/10.1146/annurev-publhealth-071521-034016?crawler=true&#38;mimetype=application/pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.1146/annurev-publhealth-071521-034016</pub-id>
          <pub-id pub-id-type="medline">36542770</pub-id>
          <pub-id pub-id-type="pmcid">PMC10128126</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wildeman</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Fitzpatrick</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Goldman</surname>
              <given-names>AW</given-names>
            </name>
          </person-group>
          <article-title>Conditions of confinement in American prisons and jails</article-title>
          <source>Annu Rev Law Soc Sci</source>
          <year>2018</year>
          <volume>14</volume>
          <fpage>29</fpage>
          <lpage>47</lpage>
          <pub-id pub-id-type="doi">10.1146/annurev-lawsocsci-101317-031025</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carson</surname>
              <given-names>EA</given-names>
            </name>
          </person-group>
          <article-title>Mortality in state and federal prisons, 2001–2019 – statistical tables</article-title>
          <source>Bureau of Justice Statistics</source>
          <year>2021</year>
          <access-date>2026-04-09</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bjs.ojp.gov/library/publications/mortality-state-and-federal-prisons-2001-2019-statistical-tables">https://bjs.ojp.gov/library/publications/mortality-state-and-federal-prisons-2001-2019-statistical-tables</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carson</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Mortality in Correctional Institutions (MCI) (formerly Deaths in Custody Reporting Program (DCRP))</article-title>
          <source>Bureau of Justice Statistics</source>
          <year>2019</year>
          <access-date>2025-03-31</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bjs.ojp.gov/data-collection/mortality-correctional-institutions-mci-formerly-deaths-custody-reporting-program">https://bjs.ojp.gov/data-collection/mortality-correctional-institutions-mci-formerly-deaths-custody-reporting-program</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Armstrong</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>No prisoner left behind? Enhancing public transparency of penal institutions</article-title>
          <source>Stanf Law Policy Rev</source>
          <year>2018</year>
          <volume>25</volume>
          <fpage>435</fpage>
          <lpage>76</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://law.stanford.edu/wp-content/uploads/2018/03/armstrong.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.2139/ssrn.2324387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cullins</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Behne</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkley-Rubinstein</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>The current state of carceral health data: an analysis of "listening sessions" with stakeholders</article-title>
          <source>Health Justice</source>
          <year>2023</year>
          <month>09</month>
          <day>28</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>40</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.doi.org/10.1186/s40352-023-00239-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40352-023-00239-4</pub-id>
          <pub-id pub-id-type="medline">37768431</pub-id>
          <pub-id pub-id-type="pii">10.1186/s40352-023-00239-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC10537811</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fliss</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Lao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Behne</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkley-Rubinstein</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Few prison systems release individual death data: death in custody reporting act completeness, speed, and compliance</article-title>
          <source>J Public Health Manag Pract</source>
          <year>2024</year>
          <volume>30</volume>
          <issue>3</issue>
          <fpage>424</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1097/PHH.0000000000001893</pub-id>
          <pub-id pub-id-type="medline">38603750</pub-id>
          <pub-id pub-id-type="pii">00124784-202405000-00017</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="web">
          <article-title>Uncounted deaths in America’s prisons and jails: how the Department of Justice failed to implement the Death in Custody Reporting Act</article-title>
          <source>United States Senate</source>
          <year>2022</year>
          <month>09</month>
          <day>20</day>
          <access-date>2026-04-08</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.hsgac.senate.gov/wp-content/uploads/imo/media/doc/2022-09-20%20PSI%20Staff%20Report%20-%20Uncounted%20Deaths%20in%20America's%20Prisons%20and%20Jails.pdf">https://tinyurl.com/2mu6eud2f</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Boch</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Murnan</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Nidey</surname>
              <given-names>NL</given-names>
            </name>
            <name name-style="western">
              <surname>Hardy</surname>
              <given-names>RY</given-names>
            </name>
            <name name-style="western">
              <surname>Iruka</surname>
              <given-names>IU</given-names>
            </name>
          </person-group>
          <article-title>Assessment of US federal funding of incarceration-related research, 1985 to 2022</article-title>
          <source>JAMA Netw Open</source>
          <year>2023</year>
          <month>02</month>
          <day>01</day>
          <volume>6</volume>
          <issue>2</issue>
          <fpage>e230803</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36848087"/>
          </comment>
          <pub-id pub-id-type="doi">10.1001/jamanetworkopen.2023.0803</pub-id>
          <pub-id pub-id-type="medline">36848087</pub-id>
          <pub-id pub-id-type="pii">2801711</pub-id>
          <pub-id pub-id-type="pmcid">PMC9972190</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cloud</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Cullins</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Armstrong</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brinkley-Rubinstein</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Who counts, who's accountable: independent scholarship and the future of carceral mortality oversight</article-title>
          <source>Am J Public Health</source>
          <year>2026</year>
          <month>04</month>
          <volume>116</volume>
          <issue>4</issue>
          <fpage>552</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.2105/AJPH.2025.308360</pub-id>
          <pub-id pub-id-type="medline">41610387</pub-id>
          <pub-id pub-id-type="pmcid">PMC12981183</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aguinis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Villamor</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Ramani</surname>
              <given-names>RS</given-names>
            </name>
          </person-group>
          <article-title>MTurk research: review and recommendations</article-title>
          <source>J Manag</source>
          <year>2020</year>
          <month>11</month>
          <day>19</day>
          <volume>47</volume>
          <issue>4</issue>
          <fpage>823</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1177/0149206320969787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stritch</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Pedersen</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Taggart</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>The opportunities and limitations of using Mechanical Turk (MTurk) in public administration and management scholarship</article-title>
          <source>Int Public Manag J</source>
          <year>2017</year>
          <month>01</month>
          <day>19</day>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>489</fpage>
          <lpage>511</lpage>
          <pub-id pub-id-type="doi">10.1080/10967494.2016.1276493</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hunt</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Scheetz</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Using MTurk to distribute a survey or experiment: methodological considerations</article-title>
          <source>J Inf Syst</source>
          <year>2019</year>
          <month>03</month>
          <day>01</day>
          <volume>33</volume>
          <issue>1</issue>
          <fpage>43</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.2308/isys-52021</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arditte</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Çek</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Timpano</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>The importance of assessing clinical phenomena in Mechanical Turk research</article-title>
          <source>Psychol Assess</source>
          <year>2016</year>
          <month>06</month>
          <volume>28</volume>
          <issue>6</issue>
          <fpage>684</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1037/pas0000217</pub-id>
          <pub-id pub-id-type="medline">26302105</pub-id>
          <pub-id pub-id-type="pii">2015-38662-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cobanoglu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Cavusoglu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Turktarhan</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A beginner’s guide and best practices for using crowdsourcing platforms for survey research: the case of Amazon Mechanical Turk (MTurk)</article-title>
          <source>J Glob Bus Insights</source>
          <year>2021</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>92</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.5038/2640-6489.6.1.1177</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Geldsetzer</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Use of rapid online surveys to assess people's perceptions during infectious disease outbreaks: a cross-sectional survey on COVID-19</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>04</month>
          <day>02</day>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>e18790</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/4/e18790/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/18790</pub-id>
          <pub-id pub-id-type="medline">32240094</pub-id>
          <pub-id pub-id-type="pii">v22i4e18790</pub-id>
          <pub-id pub-id-type="pmcid">PMC7124956</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strickland</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Stoops</surname>
              <given-names>WW</given-names>
            </name>
          </person-group>
          <article-title>The use of crowdsourcing in addiction science research: Amazon Mechanical Turk</article-title>
          <source>Exp Clin Psychopharmacol</source>
          <year>2019</year>
          <month>02</month>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>18</lpage>
          <pub-id pub-id-type="doi">10.1037/pha0000235</pub-id>
          <pub-id pub-id-type="medline">30489114</pub-id>
          <pub-id pub-id-type="pii">2018-58865-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Sabat</surname>
              <given-names>IE</given-names>
            </name>
            <name name-style="western">
              <surname>Martinez</surname>
              <given-names>LR</given-names>
            </name>
            <name name-style="western">
              <surname>Weaver</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A convenient solution: using MTurk to sample from hard-to-reach populations</article-title>
          <source>Ind Organ Psychol</source>
          <year>2015</year>
          <month>07</month>
          <day>28</day>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>220</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1017/iop.2015.29</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Pickett</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>Are relational inferences from crowdsourced and opt-in samples generalizable? Comparing criminal justice attitudes in the GSS and five online samples</article-title>
          <source>J Quant Criminol</source>
          <year>2019</year>
          <month>11</month>
          <day>13</day>
          <volume>36</volume>
          <fpage>907</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1007/s10940-019-09436-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>LaBranche</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Labrecque</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Public support for solitary confinement: a randomized experiment of belief updating and confirmation bias</article-title>
          <source>Victims Offenders</source>
          <year>2020</year>
          <month>07</month>
          <day>27</day>
          <volume>16</volume>
          <issue>2</issue>
          <fpage>266</fpage>
          <lpage>81</lpage>
          <pub-id pub-id-type="doi">10.1080/15564886.2020.1795766</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Stein</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Day</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Bien-Gund</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Mathews</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>PZ</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bayus</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Tucker</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Crowdsourcing in health and medical research: a systematic review</article-title>
          <source>Infect Dis Poverty</source>
          <year>2020</year>
          <month>01</month>
          <day>20</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://idpjournal.biomedcentral.com/articles/10.1186/s40249-020-0622-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40249-020-0622-9</pub-id>
          <pub-id pub-id-type="medline">31959234</pub-id>
          <pub-id pub-id-type="pii">10.1186/s40249-020-0622-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC6971908</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wazny</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Applications of crowdsourcing in health: an overview</article-title>
          <source>J Glob Health</source>
          <year>2018</year>
          <month>06</month>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>010502</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29564087"/>
          </comment>
          <pub-id pub-id-type="doi">10.7189/jogh.08.010502</pub-id>
          <pub-id pub-id-type="medline">29564087</pub-id>
          <pub-id pub-id-type="pii">jogh-08-010502</pub-id>
          <pub-id pub-id-type="pmcid">PMC5840433</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="web">
          <article-title>Mortality</article-title>
          <source>Third City Project</source>
          <access-date>2025-04-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://3rdcityproject.com/index.php/mortality_data/">https://3rdcityproject.com/index.php/mortality_data/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Albert</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Smilek</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Comparing attentional disengagement between Prolific and MTurk samples</article-title>
          <source>Sci Rep</source>
          <year>2023</year>
          <month>11</month>
          <day>23</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>20574</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-023-46048-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-023-46048-5</pub-id>
          <pub-id pub-id-type="medline">37996446</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-023-46048-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC10667324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stanton</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Carpenter</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Nance</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sturgeon</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Villalongo Andino</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A multisample demonstration of using the prolific platform for repeated assessment and psychometric substance use research</article-title>
          <source>Exp Clin Psychopharmacol</source>
          <year>2022</year>
          <month>08</month>
          <volume>30</volume>
          <issue>4</issue>
          <fpage>432</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1037/pha0000545</pub-id>
          <pub-id pub-id-type="medline">35025585</pub-id>
          <pub-id pub-id-type="pii">2022-20692-001</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ovadje</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Al-Garadi</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Evaluating large language models for health-related text classification tasks with public social media data</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2024</year>
          <month>10</month>
          <day>01</day>
          <volume>31</volume>
          <issue>10</issue>
          <fpage>2181</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocae210</pub-id>
          <pub-id pub-id-type="medline">39121174</pub-id>
          <pub-id pub-id-type="pii">7731085</pub-id>
          <pub-id pub-id-type="pmcid">PMC11413434</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weng</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Large language models in biomedicine and health: current research landscape and future directions</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2024</year>
          <month>09</month>
          <day>01</day>
          <volume>31</volume>
          <issue>9</issue>
          <fpage>1801</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocae202</pub-id>
          <pub-id pub-id-type="medline">39169867</pub-id>
          <pub-id pub-id-type="pii">7737335</pub-id>
          <pub-id pub-id-type="pmcid">PMC11339542</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Vosgerau</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Acquisti</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Reputation as a sufficient condition for data quality on Amazon Mechanical Turk</article-title>
          <source>Behav Res Methods</source>
          <year>2014</year>
          <month>12</month>
          <volume>46</volume>
          <issue>4</issue>
          <fpage>1023</fpage>
          <lpage>31</lpage>
          <pub-id pub-id-type="doi">10.3758/s13428-013-0434-y</pub-id>
          <pub-id pub-id-type="medline">24356996</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
