<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id><journal-id journal-id-type="publisher-id">formative</journal-id><journal-id journal-id-type="index">27</journal-id><journal-title>JMIR Formative Research</journal-title><abbrev-journal-title>JMIR Form Res</abbrev-journal-title><issn pub-type="epub">2561-326X</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e70853</article-id><article-id pub-id-type="doi">10.2196/70853</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Misrepresentation of Overall and By-Gender Mortality Causes in Film Using Online, Crowd-Sourced Data: Quantitative Analysis</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Beauregard</surname><given-names>Calla Glavin</given-names></name><degrees>MPhil</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Danforth</surname><given-names>Christopher M</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Dodds</surname><given-names>Peter Sheridan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff5">5</xref><xref ref-type="aff" rid="aff6">6</xref></contrib></contrib-group><aff id="aff1"><institution>Computational Story Lab, University of Vermont</institution><addr-line>Burlington</addr-line><addr-line>VT</addr-line><country>United States</country></aff><aff id="aff2"><institution>MassMutual Center of Excellence, Vermont Complex Systems Institute, University of Vermont</institution><addr-line>89 University Place</addr-line><addr-line>Burlington</addr-line><addr-line>VT</addr-line><country>United States</country></aff><aff id="aff3"><institution>Department of Mathematics and Statistics, University of Vermont</institution><addr-line>Burlington</addr-line><addr-line>VT</addr-line><country>United States</country></aff><aff id="aff4"><institution>Vermont Advanced Computing Center, University of Vermont</institution><addr-line>Burlington</addr-line><addr-line>VT</addr-line><country>United States</country></aff><aff id="aff5"><institution>Department of Computer Science, University of Vermont</institution><addr-line>Burlington</addr-line><addr-line>VT</addr-line><country>United States</country></aff><aff id="aff6"><institution>Santa Fe Institute</institution><addr-line>Santa Fe</addr-line><addr-line>NM</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Mavragani</surname><given-names>Amaryllis</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Shaw</surname><given-names>Kirsten</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Riffe</surname><given-names>Tim</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Calla Glavin Beauregard, MPhil, MassMutual Center of Excellence, Vermont Complex Systems Institute, University of Vermont, 89 University Place, Burlington, VT, 05452, United States, 1 (802) 656-3392; <email>calla.beauregard@uvm.edu</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>24</day><month>6</month><year>2025</year></pub-date><volume>9</volume><elocation-id>e70853</elocation-id><history><date date-type="received"><day>03</day><month>01</month><year>2025</year></date><date date-type="rev-recd"><day>10</day><month>04</month><year>2025</year></date><date date-type="accepted"><day>30</day><month>04</month><year>2025</year></date></history><copyright-statement>&#x00A9; Calla Glavin Beauregard, Christopher M Danforth, Peter Sheridan Dodds. Originally published in JMIR Formative Research (<ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>), 24.6.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://formative.jmir.org">https://formative.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://formative.jmir.org/2025/1/e70853"/><abstract><sec><title>Background</title><p>The common phrase &#x201C;representation matters&#x201D; asserts that media has a measurable and important impact on civic society&#x2019;s perception of self and others. The representation of health in media, in particular, may reflect and perpetuate a society&#x2019;s disease burden.</p></sec><sec><title>Objective</title><p>In this study, for the top 10 major causes of death in the United States, we aimed to examine how cinematic representation overall and by-gender mortality diverges from reality.</p></sec><sec sec-type="methods"><title>Methods</title><p>Using crowd-sourced data on over 68,000 film deaths from Cinemorgue Wiki, we employ natural language processing techniques to analyze shifts in representation of deaths in movies versus the 2021 National Vital Statistics Survey top 10 mortality causes. We parsed, stemmed, and classified each film death database entry, and then categorized film deaths by gender using a specifically trained gender text classifier.</p></sec><sec sec-type="results"><title>Results</title><p>Overall, movies strongly overrepresent suicide and, to a lesser degree, accidents. In terms of gender, movies overrepresent men and underrepresent women for nearly every major mortality cause, including heart disease and cerebrovascular disease (chi-square test, <italic>P</italic>&#x003C;.001); 73.6% (477/648) of film deaths from heart disease were men (vs 384,866/695,547, 55.4% in real life) and 69.4% (50/72) of film deaths from cerebrovascular disease were men (vs 70,852/162,890, 43.5% in real life). The 2 exceptions for which women were overrepresented are suicide and accidents (chi-square test, <italic>P</italic>&#x003C;.001), with 39.7% (945/2382) deaths from suicide in film being women (vs 9825/48,183, 20.4% in real life) and 38.8% (485/1250) deaths from accidents in film being women (vs 75,333/225,935, 33.5% in real life).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>We discuss the implications of under- and overrepresenting causes of death overall and by gender, as well as areas of future research.</p></sec></abstract><kwd-group><kwd>media representation</kwd><kwd>gender</kwd><kwd>mortality</kwd><kwd>natural language processing</kwd><kwd>NLP</kwd><kwd>data science</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Cardiovascular disease is the number one cause of death in both men and women in the United States according to the National Survey of Vital Statistics (NVSS), published annually by the Centers for Disease Control and Prevention (CDC) [<xref ref-type="bibr" rid="ref1">1</xref>]. However, men and women can experience different risk factors related to cardiovascular disease, as well as present different symptoms when experiencing a cardiovascular event [<xref ref-type="bibr" rid="ref2">2</xref>]. In recent years, the American Heart Association has highlighted the importance of understanding these differences with calls for an overhaul in how physicians consider gender in the diagnosis of cardiovascular disease [<xref ref-type="bibr" rid="ref3">3</xref>].</p><p>Representation in media is central to how we perceive our society, including health. Media portrayal and representation influence thoughts, behaviors, and actions toward certain groups, ideas, and phenomena, that is, the &#x201C;[m]edia, in short, [is] central to what ultimately come to represent our social realities&#x201D; [<xref ref-type="bibr" rid="ref4">4</xref>]. This connection has been studied across many demographic categories and aspects of social reality. Broadly, narratives delivered by film and other forms of media influence beliefs, which has been theorized as a &#x201C;dual empathy&#x201D; pathway wherein viewers process their feelings and thoughts while also perspective sharing with fictional characters [<xref ref-type="bibr" rid="ref5">5</xref>]. Salient media stories in both film and books impact identity formation in both middle-age and young adults when relating their own life stories [<xref ref-type="bibr" rid="ref6">6</xref>].</p><p>A subset of narrative theory is transportation theory, which purports that individuals who experience greater narrative transportation in response to fictional and nonfictional media are more likely to change their behaviors and beliefs and identify fewer factual inconsistencies in that media [<xref ref-type="bibr" rid="ref7">7</xref>]. Research has explored the connection of transportation in film with a variety of health conditions and behaviors; the depiction of smoking in entertainment film increased tobacco use behaviors in adolescents [<xref ref-type="bibr" rid="ref8">8</xref>], public awareness films improved young adult attitudes toward older adults [<xref ref-type="bibr" rid="ref9">9</xref>], drunk driving film scenarios reduced self-risk assessment in drunk-driving [<xref ref-type="bibr" rid="ref10">10</xref>], and a film depicting individuals with taboo chronic gut conditions improved understanding of the conditions and increased likeliness of discussing these conditions with friends and family pre- and postsurvey [<xref ref-type="bibr" rid="ref11">11</xref>]. In summary, film depictions influence viewer perception and beliefs across areas of health.</p><p>Outside of transportation theory, there is ample research regarding the media&#x2019;s representation and impact on health via other pathways. A recent study examined how acute myocardial infarction (eg, a heart attack) was portrayed in 100 popular films, demonstrating the general inaccuracy of its depiction of symptoms as well as its depiction by gender [<xref ref-type="bibr" rid="ref12">12</xref>]. Aside from that study, in terms of gender demographics, most research tends to focus on negative representation of woman in media, specifically in terms of sexual objectification; &#x201C;very few studies appear to be available on the relationship between media representation and non-sexual objectification&#x201D; of women [<xref ref-type="bibr" rid="ref13">13</xref>]. Similarly, many aspects of social reality, such as economic, health, and well-being outcomes, have been studied with respect to media representation (although not explicitly through the lens of gender). For example, there is a rich history of research on how representation in the media influences the commission of intentional self-harm [<xref ref-type="bibr" rid="ref14">14</xref>]. In summary, the media typically does not accurately portray official suicide data, and the most comprehensive systematic review on the topic links media reporting and suicidality, with current evidence suggesting increased suicidality trends with increased reporting of suicide [<xref ref-type="bibr" rid="ref14">14</xref>].</p><p>Aside from suicidality, there is a diversity of studies on health issues and their media depiction; a nonexhaustive survey of the literature includes a study on the depiction of obesity in media and mortality in Indigenous Australians [<xref ref-type="bibr" rid="ref15">15</xref>], a study of how bisexual individuals&#x2019; mental health is impacted by depictions of bisexual people in media [<xref ref-type="bibr" rid="ref16">16</xref>], and globally, a scoping review on how media representation of major corporations influence noncommunicable disease risk assessment and public health policy-making related to consumer products [<xref ref-type="bibr" rid="ref17">17</xref>]. Thus, while there is research on how narrative influences health [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>], and research on health representation and gender representation in media [<xref ref-type="bibr" rid="ref18">18</xref>-<xref ref-type="bibr" rid="ref23">23</xref>], there is little research that explores the overlap between health outcomes and gender representation in media, a gap we aimed to address in this study.</p><p>To examine the connection between media and mortality in this study, we downloaded counts by year of all-time cinematic deaths (referred to here as film deaths) from the crowd-sourced Cinemorgue Wiki database [<xref ref-type="bibr" rid="ref24">24</xref>] and compared them with the 2021 NVSS [<xref ref-type="bibr" rid="ref1">1</xref>] counts of top 10 causes of mortality by gender. Using natural language processing, we extracted the Cinemorgue counts, classified the deaths by gender, and consolidated these data against the NVSS counts. We then analyzed the comparative ratios by gender between real life and film and considered significant differences in these ratios using the chi-square test. The aim of this study is to understand the extent to which cinematic deaths in Cinemorgue reflect real-world mortality by gender and cause of death.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><p>There are 2 main data sources for this project: the Cinemorgue Wiki database of film deaths [<xref ref-type="bibr" rid="ref24">24</xref>] and the 2021 NVSS Leading Causes of Mortality Report [<xref ref-type="bibr" rid="ref1">1</xref>].</p><sec id="s2-1"><title>Collecting and Cleaning Data</title><p>First, we identified all-time film deaths using the Cinemorgue Wiki [<xref ref-type="bibr" rid="ref24">24</xref>] which is a crowd-sourced database that allows any members of Fandom to update death by cause by film and film year (1895&#x2010;2023), with a short description of the death. The site is organized by death type or by actor (not by character) and each entry is a short 1&#x2010;2 sentence description of the film death. It is inclusive of any movies publicly entered, and thus not limited to American film deaths only. Conveniently, Cinemorgue has historically provided an .xml download of their entire website (as of August 16, 2023) and other researchers have previously classified cinematic deaths using Federal Bureau of Investigation (FBI) homicide specifications [<xref ref-type="bibr" rid="ref25">25</xref>]. Refer to <xref ref-type="table" rid="table1">Table 1</xref> for a basic description of the database entries.</p><p>Using this existing script, we adjusted the classifying portion to identify deaths according to the CDC NVSS&#x2019;s top mortality causes by year for 2021 [<xref ref-type="bibr" rid="ref1">1</xref>]. Our script parsed the description of each film and reduced it to word stems by film entry. We used generally broad word stems that captured the colloquial terms describing different mortality causes (eg, &#x201C;heart attack&#x201D; and &#x201C;heart failure&#x201D;). We then categorized film deaths by gender using a reasonably comprehensive and inclusive classifier from PyPi project gender-guesser, which was trained on a representative international database of names that were independently validated by native speakers of many languages [<xref ref-type="bibr" rid="ref26">26</xref>]. When applying gender-guesser in this study, all 40,000 plus names were included to account for various languages and ethnic backgrounds of actors represented in film (the Cinemorgue Wiki includes movies from many different countries). Furthermore, the code allowed for the classification of mostly male, mostly female, androgynous, and unknown names. <xref ref-type="table" rid="table2">Table 2</xref> enumerates the initial name classification.</p><p>Based on a random manual review of classification, &#x201C;mostly male&#x201D; and &#x201C;mostly female&#x201D; seemed to accurately categorize well-known actors, &#x201C;mostly male&#x201D; was grouped with male, and &#x201C;mostly female&#x201D; was grouped with female. Based on the size of the data and this classifier, we removed androgynous or unknown names (collectively referred to here as &#x201C;other&#x201D;), discussed in the Limitations section. The 2021 top 10 leading causes of death in the United States are depicted in <xref ref-type="table" rid="table3">Table 3</xref> [<xref ref-type="bibr" rid="ref1">1</xref>]. This list actually comprises 13 leading causes of death because the ninth and tenth leading causes of death by gender differ, and a category of &#x201C;other&#x201D; is including to reflect the remaining causes. If absent from the official report, these data were queried directly from the CDC WONDER database [<xref ref-type="bibr" rid="ref27">27</xref>] using the same <italic>International Classification of Diseases, Tenth Revision</italic> (<italic>ICD-10</italic>) parameters from the NVSS [<xref ref-type="bibr" rid="ref1">1</xref>]. We calculated the ratio of mortality by gender by performing a simple ratio of male or female deaths by mortality cause over total deaths by that cause. It is important to note that the top 10 leading mortality causes differ year-to-year, and 2021 was the second year to include COVID-19 deaths. In addition, the medical terms describing these causes of death are extensive and often highly technical; for ease of understanding, we provide additional notations to specify the colloquial terms for these diseases.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>All film death entries by year percentiles as per Cinemorgue (total deaths=68,535).</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Percentile</td><td align="left" valign="bottom">Year</td></tr></thead><tbody><tr><td align="left" valign="top">Minimum</td><td align="left" valign="top">1895</td></tr><tr><td align="left" valign="top">25th</td><td align="left" valign="top">1976</td></tr><tr><td align="left" valign="top">50th</td><td align="left" valign="top">1995</td></tr><tr><td align="left" valign="top">75th</td><td align="left" valign="top">2010</td></tr><tr><td align="left" valign="top">Maximum</td><td align="left" valign="top">2023</td></tr></tbody></table></table-wrap><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Results of the gender classifier, gender-guesser, used on all Cinemorgue data, before and after consolidation.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Gender</td><td align="left" valign="bottom">Count before, n</td><td align="left" valign="bottom">Count after, n</td></tr></thead><tbody><tr><td align="left" valign="top">Women</td><td align="left" valign="top">15,673</td><td align="left" valign="top">17,451</td></tr><tr><td align="left" valign="top">Men</td><td align="left" valign="top">39,627</td><td align="left" valign="top">42,458</td></tr><tr><td align="left" valign="top">Unknown</td><td align="left" valign="top">7383</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td></tr><tr><td align="left" valign="top">Mostly men</td><td align="left" valign="top">2831</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Mostly women</td><td align="left" valign="top">1778</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Androgynous</td><td align="left" valign="top">1243</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Nonmale or nonfemale<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">8626</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Categories collapsed after consolidation.</p></fn><fn id="table2fn2"><p><sup>b</sup>For the purposes of this table, the terms &#x201C;male&#x201D; and &#x201C;female&#x201D; are used to be consistent with the name classification package configuration.</p></fn></table-wrap-foot></table-wrap><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Percentage by gender of the National Vital Statistics System 2021 leading causes of mortality in the United States.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Mortality cause, type (women rank, men rank)</td><td align="left" valign="bottom">Total, n</td><td align="left" valign="bottom" colspan="2">Female, n (%)</td><td align="left" valign="bottom" colspan="2">Male, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Diseases of the heart (1, 1)</td><td align="left" valign="top">695,547</td><td align="left" valign="top" colspan="2">310,661 (44.6)</td><td align="left" valign="top" colspan="2">384,886 (55.4)</td></tr><tr><td align="left" valign="top">Malignant neoplasm, cancer<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> (2, 2)</td><td align="left" valign="top">605,213</td><td align="left" valign="top" colspan="2">286,543 (47.3)</td><td align="left" valign="top" colspan="2">318,670 (52.7)</td></tr><tr><td align="left" valign="top">COVID-19 (3, 3)</td><td align="left" valign="top">416,893</td><td align="left" valign="top" colspan="2">180,283 (43.2)</td><td align="left" valign="top" colspan="2">236,610 (56.8)</td></tr><tr><td align="left" valign="top">Accidents, unintentional injuries (6, 4)</td><td align="left" valign="top">224,935</td><td align="left" valign="top" colspan="2">75,333 (33.5)</td><td align="left" valign="top" colspan="2">149,602 (66.5)</td></tr><tr><td align="left" valign="top">Cerebrovascular disease, stroke<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup>, brain hemorrhage<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> (4, 5)</td><td align="left" valign="top">162,890</td><td align="left" valign="top" colspan="2">92,038 (56.5)</td><td align="left" valign="top" colspan="2">70,852 (43.5)</td></tr><tr><td align="left" valign="top">Chronic lower respiratory disease, COPD<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup><sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup>, emphysema<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> (7, 6)</td><td align="left" valign="top">142,342</td><td align="left" valign="top" colspan="2">74,814 (52.6)</td><td align="left" valign="top" colspan="2">67,528 (47.4)</td></tr><tr><td align="left" valign="top">Alzheimer disease (5, 8)</td><td align="left" valign="top">119,399</td><td align="left" valign="top" colspan="2">82,424 (69)</td><td align="left" valign="top" colspan="2">36,975 (31)</td></tr><tr><td align="left" valign="top">Diabetes mellitus (8, 7)</td><td align="left" valign="top">103,294</td><td align="left" valign="top" colspan="2">44,666 (43.2)</td><td align="left" valign="top" colspan="2">56,628 (54.8)</td></tr><tr><td align="left" valign="top">Chronic liver disease and cirrhosis (11, 9)</td><td align="left" valign="top">56,585</td><td align="left" valign="top" colspan="2">20,878 (36.9)</td><td align="left" valign="top" colspan="2">35,707 (63.1)</td></tr><tr><td align="left" valign="top">Nephritis (9, 10)</td><td align="left" valign="top">54,358</td><td align="left" valign="top" colspan="2">25,769 (47.4)</td><td align="left" valign="top" colspan="2">28,589 (52.6)</td></tr><tr><td align="left" valign="top">Suicide, intentional self-harm (15, 8)</td><td align="left" valign="top">48,183</td><td align="left" valign="top" colspan="2">9825 (20.4)</td><td align="left" valign="top" colspan="2">38,358 (79.6)</td></tr><tr><td align="left" valign="top">Essential hypertension (10, 15)</td><td align="left" valign="top">42,816</td><td align="left" valign="top" colspan="2">22,730 (53.1)</td><td align="left" valign="top" colspan="2">20,086 (46.9)</td></tr><tr><td align="left" valign="top">Other</td><td align="left" valign="top">791,776</td><td align="left" valign="top" colspan="2">400,159 (50.5)</td><td align="left" valign="top" colspan="2">391,617 (49.5)</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>Colloquial term.</p></fn><fn id="table3fn2"><p><sup>b</sup>COPD: chronic obstructive pulmonary disease.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-2"><title>Analysis of Gender Ratios: Visualization and Chi-Square Testing</title><p>In both datasets, we calculated the ratio of mortality by gender by cause by performing a simple ratio of male death (or female death) by mortality cause over total deaths by that cause. Thus, the sum of all ratios should equal 1. From the ratios of mortality by gender in film and NVSS data, we constructed a bar graph visualization. Then, we explored the significance of the difference in gender ratio by cause of death between film and real life using the Pearson chi-square test [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref29">29</xref>].</p><p>It is important to underscore how to interpret significant <italic>P</italic> values in this context [<xref ref-type="bibr" rid="ref30">30</xref>-<xref ref-type="bibr" rid="ref32">32</xref>]. Accordingly, <italic>P</italic> values &#x003C;.5 do not &#x201C;measure the probability that the studied hypothesis is true, or the probability that the data were produced by random chance alone&#x201D;, and are merely &#x201C;one approach to summarizing the incompatibility between a particular set of data and a proposed model for the data&#x201D; [<xref ref-type="bibr" rid="ref30">30</xref>]. That is, if there is a significant <italic>P</italic> value for the chi-square test for any given cause of mortality, this means that the data seem to suggest there is a significant difference between expected and observed frequencies of causes of death by gender between film and real-life but does not establish causality.</p></sec><sec id="s2-3"><title>Ethical Considerations</title><p>All US mortality data used for this study are publicly available, anonymous, and consolidated at the national level. All data have been deidentified. Cinemorgue data comprise fictional, in-film deaths. This study is exempt from ethical approval, as the research involves the analysis of large-scale, publicly available datasets that are legally accessible to the public and do not require any special access or permissions. The data do not include any information through which individuals can be readily identified, either directly or indirectly. Because the data are both publicly available and do not involve interaction or intervention with human participants, nor do they involve the collection of private, identifiable information, this study qualifies for exemption from institutional review board oversight.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><p>In general, the Cinemorgue dataset underrepresents most real-life leading mortality causes as compared with cinematic mortality causes by proportion of deaths in the database. There are 2 exceptions where suicide and accidents are overrepresented. <xref ref-type="fig" rid="figure1">Figure 1</xref> depicts the identity line or line of no difference at which representation would be equal between both sources.</p><p>When considering gender in addition to raw count by database, the differences between film and real life are also apparent. <xref ref-type="fig" rid="figure2">Figure 2</xref> is a subplot panel depicting the relative proportions of 2021 NVSS leading causes of mortality by gender versus all-time film deaths by gender from Cinemorgue. Across almost all causes of death except cancer and chronic liver disease, there are visible and apparent shifts between film representation and real-life representation, with women underrepresented in film across nearly all categories except for suicide. Diabetes and essential hypertension are not represented in the cleaned Cinemorgue dataset. The counts used to construct the ratio shift figure are contained in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><p>In <xref ref-type="table" rid="table4">Table 4</xref>, we show the significance (if observed frequency <italic>&#x003E;</italic>5) of the ratio shift for each cause of death. The ratios by gender of accidents, cerebrovascular disease, diseases of the heart, suicide (intentional self-harm), and the combined category of all other causes of mortality for film deviates significantly from that in real life. As previously mentioned, men are overrepresented in film as compared with women for each of the aforementioned causes of mortality, barring suicide.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Overall number of total deaths in Cinemorgue versus number of recorded deaths in the United States, National Vital Statistics Survey 2021 by cause of mortality. Of total film deaths, suicide and accidents are overrepresented; all other causes of death are underrepresented in film. The identity line depicted the boundary between over- and underrepresentation; causes of death above the line are overrepresented, and causes of death beneath the line are underrepresented in film.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e70853_fig01.png"/></fig><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Top 10 mortality causes by gender in film versus real life. Count and proportion of deaths by gender (blue for men, mauve for women) are shown by mortality cause for film and for real life. Women suicide deaths and accidents are overrepresented in film. Men are overrepresented in all other causes of death. We only included causes of death present in the Cinemorgue dataset.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="formative_v9i1e70853_fig02.png"/></fig><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Chi-square test: statistic and <italic>P</italic> values. Each cause of death and its corresponding chi-square test by gender proportion is depicted, with its significance value.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Cause of death</td><td align="left" valign="bottom">Chi-square (<italic>df</italic>)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Accidents<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">15.81 (1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Alzheimer disease</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">COVID-19</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Cancer</td><td align="left" valign="top">0.29 (1)</td><td align="left" valign="top">.59</td></tr><tr><td align="left" valign="top">Cerebrovascular disease<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">19.72 (1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Chronic liver disease</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Chronic lower respiratory diseases</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Diseases of heart<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">87.57 (1)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Nephritis</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Other<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">10,832.92 (1)</td><td align="left" valign="top"><italic>&#x003C;</italic>.001</td></tr><tr><td align="left" valign="top">Suicide<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup></td><td align="left" valign="top">545.54 (1)</td><td align="left" valign="top"><italic>&#x003C;</italic>.001</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>Significant findings (where film deaths by gender are not representative of real life). There is a significant difference in representation for accidents, cerebrovascular disease, diseases of the heart, suicide, and all other causes.</p></fn><fn id="table4fn2"><p><sup>b</sup>Cause of death categories in which there were less than 5 observations in films, and thus the chi-square test was not appropriate [<xref ref-type="bibr" rid="ref25">25</xref>].</p></fn></table-wrap-foot></table-wrap></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Film and real-life mortality differ significantly for some, but not all, leading causes of death. As expected, film is not representative of real life even setting aside gender considerations. From a practical perspective, this makes sense in the context that high-tempo, salacious, or dramatic deaths are likely far more interesting to an audience than everyday causes of mortality. In film, for example, the proportion of &#x201C;other&#x201D; deaths represented far outpaces the actual leading cause of death (diseases of the heart) at a factor of over 800. When considering gender, there are significant differences in the ratio of represented death for accidents, cerebrovascular disease, diseases of the heart, suicide (intentional self-harm) and all other deaths not captured using the top 10 leading causes of death classifier, among sufficiently large samples within the Cinemorgue Wiki database.</p><p>While our results do not indicate causality, they provide insight to the representation of mortality in popular media. From visualizations and statistical comparison of ratios, there is meaningful descriptive power in the ratios of film versus real-life representation of mortality by gender. In view of recent efforts by the American Heart Association to provide better equality of cardiovascular care for women [<xref ref-type="bibr" rid="ref3">3</xref>] as well as general research regarding treatment differences by gender [<xref ref-type="bibr" rid="ref33">33</xref>], the underrepresentation of film deaths by gender demonstrate that death is also lacking in equitable representation on screen. As there is a general consensus in the literature that stereotypes can be exceedingly harmful and contribute to sexism, harassment, and violence against women [<xref ref-type="bibr" rid="ref13">13</xref>] as well as other gender identities [<xref ref-type="bibr" rid="ref34">34</xref>], it is reasonable to postulate that a lack of representation in film could exacerbate the public&#x2019;s misunderstanding of disease burden and processes, and could hinder the recognition of gender-specific health issues among not only the public but potentially among health care professionals.</p><p>By cause of mortality, some interesting patterns emerge. For the category of &#x201C;other,&#x201D; men are overrepresented in the Cinemorgue Wiki, which is consistent with their overrepresentation writ large in the Wiki (regardless of cause of death). This could indicate that men are represented more often on screen generally, and represented more often in violent deaths, as previously discussed. For diseases of the heart, men are seemingly overrepresented in film, which agrees with the American Heart Association&#x2019;s recent findings on underrepresentation and lack of understanding of women experiencing heart disease [<xref ref-type="bibr" rid="ref3">3</xref>]. Likewise, men are overrepresented for death by cerebrovascular disease. However, suicide and accidents are overrepresented for women in film. Based on the suggestibility and risk associated with suicide representations [<xref ref-type="bibr" rid="ref14">14</xref>], this pattern indicates that future follow-up is needed to understand the relationship between representation and acts of suicide in women.</p></sec><sec id="s4-2"><title>Limitations</title><p>Limitations of this study center on the classification and cleaning of the Cinemorgue film death dataset, as well as the data itself. First, we used only film deaths in this study, on the assumption that films generally have wider ranges of audiences (not confined to certain streaming platforms) and have a similar format. However, the Cinemorgue Wiki database includes all manners of video-represented deaths, including television and video games, which were excluded in this study based on the assumption that video game deaths may overrepresent homicides, due to the violent nature of many video games. Furthermore, we compare the Cinemorgue Wiki database all-time counts with single point-in-time (2021 NVSS) mortality counts; considering that movies are not only watched in the year in which they are filmed, we consider this a reasonable assumption even though movie popularity changes over time. In addition, in <xref ref-type="table" rid="table1">Table 1</xref>, we report that 50% (34,268/68,535) of the film deaths in our dataset are from 1995 and later, with 25% (17,132/68,535) occurring between 2010 and 2023, showing that the preponderance of films occur relatively close to the point-in-time mortality counts with many being topically contemporary to the year in which they were filmed.</p><p>In addition, our removal of androgynous names may have skewed the resultant data; as illustrated previously in <xref ref-type="table" rid="table2">Table 2</xref>, 13% of data are effectively &#x201C;thrown out&#x201D; of the analysis because it was not classifiable as &#x201C;female&#x201D; or &#x201C;mostly female&#x201D; or &#x201C;male&#x201D; or &#x201C;mostly male&#x201D;. While using binary categories is consistent with the CDC&#x2019;s current reporting causes by mortality, reducing gender to solely men and women does not capture the diversity of gender identities. Considering the connection between media representation and suicide, as well as the significantly higher instances of suicidal ideation in transgender and nonbinary youth than cisgender youth [<xref ref-type="bibr" rid="ref35">35</xref>], indicates that further research beyond this study is important for understanding the representation of health outcomes for transgender and nonbinary individuals. In terms of classifying cause of mortality in the Cinemorgue Wiki database, the search terms used on the stemmed text were specific but very broad in order to prevent an undercount of deaths, which could have skewed resultant counts. Intrinsically, the Cinemorgue Wiki database is also subject to the normal risks of crowd-sourced data. Members of the public that are heterogeneous in knowledge, skill, and geographical location comprise the crowd [<xref ref-type="bibr" rid="ref36">36</xref>] that generates the entries in the Cinemorgue Wiki; biases in any of these characteristics could contribute to a geographically skewed or low-fidelity dataset. While CDC data from the United States were used to calculate gender proportions, every film death in the database was included, even if the film was not English-language. Accordingly, while some films may better represent certain realities than others, research has shown that even explicitly far-fetched or out-of-reality story lines can influence beliefs via transportation [<xref ref-type="bibr" rid="ref37">37</xref>], so we have retained all films regardless of location of origin or setting.</p></sec><sec id="s4-3"><title>Future Work</title><p>Future research should further detail the corpus of cinematic mortality, and incorporate additional features of each film (eg, age of actors, setting, location, audience scores, and critic reviews) from film encyclopedias and rating websites. This will further elucidate the nature of mortality representation in film relative to viewership. In addition, future work should examine mortality representation across all forms of media, including books, songs, and social media. This would provide a more global perspective on the impact of media&#x2014;writ large&#x2014;and capture populations that may not interact with cinematic media. With enough data, the Granger causality test&#x2014;used to forecast time series from other time series [<xref ref-type="bibr" rid="ref38">38</xref>]&#x2014;could be used to understand whether media representation of death by gender lags or leads actual causes of mortality by gender. This would contribute to a better understanding of the interplay between media representation and health outcomes over time. Relatedly, visualizations like a Sankey flow diagram&#x2014;which provides visualization of time-series-type data in lieu of a formal time series analysis [<xref ref-type="bibr" rid="ref39">39</xref>]&#x2014;could provide further opportunities for interpretation of how gender representation has morphed over time. Randomized controlled trials centering on these ideas (perhaps priming viewers with biased images of disease before surveying them on perceived prevalence of disease by gender) could provide support for the case of causality between representation and understanding of society&#x2019;s disease burden.</p></sec><sec id="s4-4"><title>Conclusions</title><p>Our study compared mortality causes by gender in film and real life using Cinemorgue Wiki data on all-time film deaths and NVSS mortality by cause data from 2021 in the United States. Based on the comparison of gender ratios by cause of death, we identified significant differences in representation for accidents, cerebrovascular disease, diseases of the heart, and suicide (intentional self-harm). Considering current struggles in appropriately managing diagnosis and treatment of disease by gender, highlighting how representation of mortality is skewed by gender in films may encourage a more equitable culture surrounding gender and health. Future work should expand this query to include other forms of media to understand the interplay of representation and mortality.</p></sec></sec></body><back><ack><p>The authors are grateful for support from the National Science Foundation (award #2242829) and the Massachusetts Mutual Life Insurance Company. We thank Story Lab members Ashley Fehr and Julia Zimmerman for their feedback on ideas presented in this manuscript. The authors attest that there was no use of generative artificial intelligence technology in the generation of texts, figures, or other informational content of this manuscript.</p></ack><notes><sec><title>Data Availability</title><p>The datasets generated and analyzed during this study are available in the University of Vermont Story Lab repository [<xref ref-type="bibr" rid="ref40">40</xref>].</p></sec></notes><fn-group><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">CDC</term><def><p>Centers for Disease Control and Prevention</p></def></def-item><def-item><term id="abb2"><italic>ICD-10</italic></term><def><p><italic>International Classification of Diseases, Tenth Revision</italic></p></def></def-item><def-item><term id="abb3">NVSS</term><def><p>National Survey of Vital Statistics</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Curtin</surname><given-names>SC</given-names> </name><name name-style="western"><surname>Tejada-Vera</surname><given-names>B</given-names> </name><name name-style="western"><surname>Bastian</surname><given-names>BA</given-names> </name></person-group><article-title>Deaths: leading causes for 2021</article-title><source>Natl Vital Stat Rep</source><year>2024</year><access-date>2025-05-29</access-date><volume>73</volume><issue>4</issue><comment><ext-link ext-link-type="uri" xlink:href="https://www.cdc.gov/nchs/data/nvsr/nvsr73/nvsr73-04.pdf">https://www.cdc.gov/nchs/data/nvsr/nvsr73/nvsr73-04.pdf</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Isakadze</surname><given-names>N</given-names> </name><name name-style="western"><surname>Mehta</surname><given-names>PK</given-names> </name><name name-style="western"><surname>Law</surname><given-names>K</given-names> </name><name name-style="western"><surname>Dolan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Lundberg</surname><given-names>GP</given-names> </name></person-group><article-title>Addressing the gap in physician preparedness to assess cardiovascular risk in women: a comprehensive approach to cardiovascular risk assessment in women</article-title><source>Curr Treat Options Cardiovasc Med</source><year>2019</year><month>07</month><day>29</day><volume>21</volume><issue>9</issue><fpage>47</fpage><pub-id pub-id-type="doi">10.1007/s11936-019-0753-0</pub-id><pub-id pub-id-type="medline">31359165</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wenger</surname><given-names>NK</given-names> </name><name name-style="western"><surname>Lloyd-Jones</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Elkind</surname><given-names>MSV</given-names> </name><etal/></person-group><article-title>Call to action for cardiovascular disease in women: epidemiology, awareness, access, and delivery of equitable health care: a Presidential Advisory from the American Heart Association</article-title><source>Circulation</source><year>2022</year><month>06</month><day>7</day><volume>145</volume><issue>23</issue><fpage>e1059</fpage><lpage>e1071</lpage><pub-id pub-id-type="doi">10.1161/CIR.0000000000001071</pub-id><pub-id pub-id-type="medline">35531777</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Brooks</surname><given-names>D</given-names> </name><name name-style="western"><surname>H&#x00E9;bert</surname><given-names>L</given-names> </name></person-group><article-title>Gender, race, and media representation</article-title><source>The SAGE Handbook of Gender and Communication</source><year>2006</year><publisher-name>SAGE Publications</publisher-name><pub-id pub-id-type="doi">10.4135/9781412976053.n16</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dill&#x2010;Shackleford</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Vinney</surname><given-names>C</given-names> </name><name name-style="western"><surname>Hopper&#x2010;Losenicky</surname><given-names>K</given-names> </name></person-group><article-title>Connecting the dots between fantasy and reality: the social psychology of our engagement with fictional narrative and its functional value</article-title><source>Social &#x0026; Personality Psych</source><year>2016</year><month>11</month><volume>10</volume><issue>11</issue><fpage>634</fpage><lpage>646</lpage><pub-id pub-id-type="doi">10.1111/spc3.12274</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Breen</surname><given-names>AV</given-names> </name><name name-style="western"><surname>McLean</surname><given-names>KC</given-names> </name><name name-style="western"><surname>Cairney</surname><given-names>K</given-names> </name><name name-style="western"><surname>McAdams</surname><given-names>DP</given-names> </name></person-group><article-title>Movies, books, and identity: exploring the narrative ecology of the self</article-title><source>Qualitative Psychology</source><year>2017</year><volume>4</volume><issue>3</issue><fpage>243</fpage><lpage>259</lpage><pub-id pub-id-type="doi">10.1037/qup0000059</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Green</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Brock</surname><given-names>TC</given-names> </name></person-group><article-title>The role of transportation in the persuasiveness of public narratives</article-title><source>J Pers Soc Psychol</source><year>2000</year><volume>79</volume><issue>5</issue><fpage>701</fpage><lpage>721</lpage><pub-id pub-id-type="doi">10.1037/0022-3514.79.5.701</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Green</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Clark</surname><given-names>JL</given-names> </name></person-group><article-title>Transportation into narrative worlds: implications for entertainment media influences on tobacco use</article-title><source>Addiction</source><year>2013</year><month>03</month><volume>108</volume><issue>3</issue><fpage>477</fpage><lpage>484</lpage><pub-id pub-id-type="doi">10.1111/j.1360-0443.2012.04088.x</pub-id><pub-id pub-id-type="medline">22994374</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kubrak</surname><given-names>T</given-names> </name></person-group><article-title>Impact of films: changes in young people&#x2019;s attitudes after watching a movie</article-title><source>Behav Sci (Basel)</source><year>2020</year><month>05</month><day>2</day><volume>10</volume><issue>5</issue><fpage>86</fpage><pub-id pub-id-type="doi">10.3390/bs10050086</pub-id><pub-id pub-id-type="medline">32370280</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gebbers</surname><given-names>A</given-names> </name></person-group><article-title>Transportation into narrative worlds and the motivation to change health-related behavior</article-title><source>International Journal of Communication</source><year>2020</year><volume>14</volume><fpage>6977</fpage><lpage>2203</lpage><pub-id pub-id-type="doi">10.31235/1234567</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gomes</surname><given-names>D</given-names> </name><name name-style="western"><surname>Loth</surname><given-names>A</given-names> </name><name name-style="western"><surname>Hockley</surname><given-names>JRF</given-names> </name><name name-style="western"><surname>John Smith</surname><given-names>E</given-names> </name></person-group><article-title>Gut reaction: the impact of a film on public understanding of gastrointestinal conditions</article-title><source>Scientific Communication and Education</source><year>2022</year><pub-id pub-id-type="doi">10.1101/2021.09.05.459031</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaw</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Harris</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Diedrich</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Portrayal of acute myocardial infarction in popular film: a review of gender, race, and ethnicity</article-title><source>J Am Heart Assoc</source><year>2024</year><month>08</month><day>20</day><volume>13</volume><issue>16</issue><fpage>e034222</fpage><pub-id pub-id-type="doi">10.1161/JAHA.123.034222</pub-id><pub-id pub-id-type="medline">39140282</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Santoniccolo</surname><given-names>F</given-names> </name><name name-style="western"><surname>Trombetta</surname><given-names>T</given-names> </name><name name-style="western"><surname>Paradiso</surname><given-names>MN</given-names> </name><name name-style="western"><surname>Roll&#x00E8;</surname><given-names>L</given-names> </name></person-group><article-title>Gender and media representations: a review of the literature on gender stereotypes, objectification and sexualization</article-title><source>Int J Environ Res Public Health</source><year>2023</year><month>05</month><day>9</day><volume>20</volume><issue>10</issue><fpage>5770</fpage><pub-id pub-id-type="doi">10.3390/ijerph20105770</pub-id><pub-id pub-id-type="medline">37239498</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sisask</surname><given-names>M</given-names> </name><name name-style="western"><surname>V&#x00E4;rnik</surname><given-names>A</given-names> </name></person-group><article-title>Media roles in suicide prevention: a systematic review</article-title><source>Int J Environ Res Public Health</source><year>2012</year><month>01</month><volume>9</volume><issue>1</issue><fpage>123</fpage><lpage>138</lpage><pub-id pub-id-type="doi">10.3390/ijerph9010123</pub-id><pub-id pub-id-type="medline">22470283</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Islam</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fitzgerald</surname><given-names>L</given-names> </name></person-group><article-title>Indigenous obesity in the news: a media analysis of news representation of obesity in Australia&#x2019;s Indigenous population</article-title><source>BMC Obes</source><year>2016</year><volume>3</volume><fpage>30</fpage><pub-id pub-id-type="doi">10.1186/s40608-016-0109-1</pub-id><pub-id pub-id-type="medline">27354919</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johnson</surname><given-names>HJ</given-names> </name></person-group><article-title>Bisexuality, mental health, and media representation</article-title><source>J Bisex</source><year>2016</year><month>07</month><day>2</day><volume>16</volume><issue>3</issue><fpage>378</fpage><lpage>396</lpage><pub-id pub-id-type="doi">10.1080/15299716.2016.1168335</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weishaar</surname><given-names>H</given-names> </name><name name-style="western"><surname>Dorfman</surname><given-names>L</given-names> </name><name name-style="western"><surname>Freudenberg</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Why media representations of corporations matter for public health policy: a scoping review</article-title><source>BMC Public Health</source><year>2016</year><month>08</month><day>30</day><volume>16</volume><issue>1</issue><fpage>899</fpage><pub-id pub-id-type="doi">10.1186/s12889-016-3594-8</pub-id><pub-id pub-id-type="medline">27577053</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bamman</surname><given-names>D</given-names> </name><name name-style="western"><surname>Samberg</surname><given-names>R</given-names> </name><name name-style="western"><surname>So</surname><given-names>RJ</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>N</given-names> </name></person-group><article-title>Measuring diversity in Hollywood through the large-scale computational analysis of film</article-title><source>Proc Natl Acad Sci USA</source><year>2024</year><month>11</month><day>12</day><volume>121</volume><issue>46</issue><fpage>e2409770121</fpage><pub-id pub-id-type="doi">10.1073/pnas.2409770121</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bleakley</surname><given-names>A</given-names> </name><name name-style="western"><surname>Jamieson</surname><given-names>PE</given-names> </name><name name-style="western"><surname>Romer</surname><given-names>D</given-names> </name></person-group><article-title>Trends of sexual and violent content by gender in top-grossing U.S. films, 1950-2006</article-title><source>J Adolesc Health</source><year>2012</year><month>07</month><volume>51</volume><issue>1</issue><fpage>73</fpage><lpage>79</lpage><pub-id pub-id-type="doi">10.1016/j.jadohealth.2012.02.006</pub-id><pub-id pub-id-type="medline">22727080</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Anderson</surname><given-names>H</given-names> </name><name name-style="western"><surname>Daniels</surname><given-names>M</given-names> </name></person-group><article-title>The largest analysis of film dialogue by gender, ever</article-title><source>The Pudding</source><year>2016</year><access-date>2024-12-12</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://pudding.cool/2017/03/film-dialogue">https://pudding.cool/2017/03/film-dialogue</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Smith</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Choueiti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pieper</surname><given-names>K</given-names> </name></person-group><article-title>Gender bias without borders: an investigation of female characters in popular films across 11 countries</article-title><year>2014</year><publisher-name>Geena Davis Institute on Gender in Media</publisher-name></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="report"><person-group person-group-type="author"><name name-style="western"><surname>Smith</surname><given-names>SL</given-names> </name><name name-style="western"><surname>Choueiti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Pieper</surname><given-names>K</given-names> </name><name name-style="western"><surname>Gillig</surname><given-names>T</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>C</given-names> </name></person-group><article-title>Inequality in 700 popular films: examining portrayals of gender, race, and LGBT status from 2007 to 2014</article-title><year>2015</year><publisher-name>USC Annenberg School for Communication and Journalism</publisher-name></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lindner</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Lindquist</surname><given-names>M</given-names> </name><name name-style="western"><surname>Arnold</surname><given-names>J</given-names> </name></person-group><article-title>Million dollar maybe? The effect of female presence in movies on Box Office returns</article-title><source>Sociol Inq</source><year>2015</year><month>08</month><volume>85</volume><issue>3</issue><fpage>407</fpage><lpage>428</lpage><pub-id pub-id-type="doi">10.1111/soin.12081</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="web"><source>Cinemorgue Wiki</source><access-date>2024-01-24</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://cinemorgue.fandom.com/wiki">https://cinemorgue.fandom.com/wiki</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Lindsay</surname><given-names>M</given-names> </name></person-group><article-title>Cinemorgue parsing</article-title><source>Kaggle</source><access-date>2024-01-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.kaggle.com/code/michaellindsay/cinemorgue-parsing/notebook">https://www.kaggle.com/code/michaellindsay/cinemorgue-parsing/notebook</ext-link></comment></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Michael</surname><given-names>J</given-names> </name></person-group><article-title>Gender-guesser 0.4.0: pip install gender-guesser</article-title><source>Python Package Index</source><access-date>2024-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://pypi.org/project/gender-guesser/">https://pypi.org/project/gender-guesser/</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="web"><article-title>CDC WONDER</article-title><source>Centers for Disease Control</source><access-date>2024-07-09</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://wonder.cdc.gov">https://wonder.cdc.gov</ext-link></comment></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Franke</surname><given-names>TM</given-names> </name><name name-style="western"><surname>Ho</surname><given-names>T</given-names> </name><name name-style="western"><surname>Christie</surname><given-names>CA</given-names> </name></person-group><article-title>The chi-square test: often used and more often misinterpreted</article-title><source>Am J Eval</source><year>2012</year><volume>33</volume><fpage>448</fpage><lpage>458</lpage><pub-id pub-id-type="doi">10.1177/1098214011426594</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McHugh</surname><given-names>ML</given-names> </name></person-group><article-title>The chi-square test of independence</article-title><source>Biochem Med (Zagreb)</source><year>2013</year><volume>23</volume><issue>2</issue><fpage>143</fpage><lpage>149</lpage><pub-id pub-id-type="doi">10.11613/bm.2013.018</pub-id><pub-id pub-id-type="medline">23894860</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wasserstein</surname><given-names>RL</given-names> </name><name name-style="western"><surname>Lazar</surname><given-names>NA</given-names> </name></person-group><article-title>The ASA statement on p-values: context, process, and purpose</article-title><source>Am Stat</source><year>2016</year><month>04</month><day>2</day><volume>70</volume><issue>2</issue><fpage>129</fpage><lpage>133</lpage><pub-id pub-id-type="doi">10.1080/00031305.2016.1154108</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wasserstein</surname><given-names>RL</given-names> </name></person-group><article-title>Moving to a world beyond &#x201C;p &#x003C; 0.05&#x201D;</article-title><source>Am Stat</source><year>2019</year><volume>73</volume><fpage>1</fpage><lpage>19</lpage><pub-id pub-id-type="doi">10.1080/00031305.2019.1583913</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Greenland</surname><given-names>S</given-names> </name><name name-style="western"><surname>Senn</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Rothman</surname><given-names>KJ</given-names> </name><etal/></person-group><article-title>Statistical tests, P values, confidence intervals, and power: a guide to misinterpretations</article-title><source>Eur J Epidemiol</source><year>2016</year><month>04</month><volume>31</volume><issue>4</issue><fpage>337</fpage><lpage>350</lpage><pub-id pub-id-type="doi">10.1007/s10654-016-0149-3</pub-id><pub-id pub-id-type="medline">27209009</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dhawan</surname><given-names>S</given-names> </name><name name-style="western"><surname>Bakir</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jones</surname><given-names>E</given-names> </name><name name-style="western"><surname>Kilpatrick</surname><given-names>S</given-names> </name><name name-style="western"><surname>Merz</surname><given-names>CNB</given-names> </name></person-group><article-title>Sex and gender medicine in physician clinical training: results of a large, single-center survey</article-title><source>Biol Sex Differ</source><year>2016</year><volume>7</volume><issue>Suppl 1</issue><fpage>37</fpage><pub-id pub-id-type="doi">10.1186/s13293-016-0096-4</pub-id><pub-id pub-id-type="medline">27785341</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hughto</surname><given-names>JMW</given-names> </name><name name-style="western"><surname>Pletta</surname><given-names>D</given-names> </name><name name-style="western"><surname>Gordon</surname><given-names>L</given-names> </name><name name-style="western"><surname>Cahill</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mimiaga</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Reisner</surname><given-names>SL</given-names> </name></person-group><article-title>Negative transgender-related media messages are associated with adverse mental health outcomes in a multistate study of transgender adults</article-title><source>LGBT Health</source><year>2021</year><month>01</month><volume>8</volume><issue>1</issue><fpage>32</fpage><lpage>41</lpage><pub-id pub-id-type="doi">10.1089/lgbt.2020.0279</pub-id><pub-id pub-id-type="medline">33170060</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Suarez</surname><given-names>NA</given-names> </name><name name-style="western"><surname>Trujillo</surname><given-names>L</given-names> </name><name name-style="western"><surname>McKinnon</surname><given-names>II</given-names> </name><etal/></person-group><article-title>Disparities in school connectedness, unstable housing, experiences of violence, mental health, and suicidal thoughts and behaviors among transgender and cisgender high school students - Youth Risk Behavior Survey, United States, 2023</article-title><source>MMWR Suppl</source><year>2024</year><month>10</month><day>10</day><volume>73</volume><issue>4</issue><fpage>50</fpage><lpage>58</lpage><pub-id pub-id-type="doi">10.15585/mmwr.su7304a6</pub-id><pub-id pub-id-type="medline">39378210</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lenart-Gansiniec</surname><given-names>R</given-names> </name><name name-style="western"><surname>Czakon</surname><given-names>W</given-names> </name><name name-style="western"><surname>Su&#x0142;kowski</surname><given-names>&#x0141;</given-names> </name><name name-style="western"><surname>Pocek</surname><given-names>J</given-names> </name></person-group><article-title>Understanding crowdsourcing in science</article-title><source>Rev Manag Sci</source><year>2023</year><month>11</month><volume>17</volume><issue>8</issue><fpage>2797</fpage><lpage>2830</lpage><pub-id pub-id-type="doi">10.1007/s11846-022-00602-z</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mulligan</surname><given-names>K</given-names> </name><name name-style="western"><surname>Habel</surname><given-names>P</given-names> </name></person-group><article-title>The implications of fictional media for political beliefs</article-title><source>American Politics Research</source><year>2013</year><month>01</month><volume>41</volume><issue>1</issue><fpage>122</fpage><lpage>146</lpage><pub-id pub-id-type="doi">10.1177/1532673X12453758</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shojaie</surname><given-names>A</given-names> </name><name name-style="western"><surname>Fox</surname><given-names>EB</given-names> </name></person-group><article-title>Granger causality: a review and recent advances</article-title><source>Annu Rev Stat Appl</source><year>2022</year><month>03</month><volume>9</volume><issue>1</issue><fpage>289</fpage><lpage>319</lpage><pub-id pub-id-type="doi">10.1146/annurev-statistics-040120-010930</pub-id><pub-id pub-id-type="medline">37840549</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Otto</surname><given-names>E</given-names> </name><name name-style="western"><surname>Culakova</surname><given-names>E</given-names> </name><name name-style="western"><surname>Meng</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Overview of Sankey flow diagrams: focusing on symptom trajectories in older adults with advanced cancer</article-title><source>J Geriatr Oncol</source><year>2022</year><month>06</month><volume>13</volume><issue>5</issue><fpage>742</fpage><lpage>746</lpage><pub-id pub-id-type="doi">10.1016/j.jgo.2021.12.017</pub-id><pub-id pub-id-type="medline">35000890</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="web"><article-title>Film deaths: misrepresentation of mortality</article-title><source>Computational Story Lab</source><access-date>2025-05-29</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://storylab.w3.uvm.edu/deaths-in-films/">https://storylab.w3.uvm.edu/deaths-in-films/</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>All film counts and percentages for causes of mortality in the Cinemorgue database.</p><media xlink:href="formative_v9i1e70853_app1.docx" xlink:title="DOCX File, 24 KB"/></supplementary-material></app-group></back></article>