<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JFR</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Form Res</journal-id>
      <journal-title>JMIR Formative Research</journal-title>
      <issn pub-type="epub">2561-326X</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v6i9e33606</article-id>
      <article-id pub-id-type="pmid">36103223</article-id>
      <article-id pub-id-type="doi">10.2196/33606</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Personalized Energy Expenditure Estimation: Visual Sensing Approach With Deep Learning</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Mavragani</surname>
            <given-names>Amaryllis</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Liu</surname>
            <given-names>Gengbo</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Lim</surname>
            <given-names>Gilbert</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Perrett</surname>
            <given-names>Toby</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>University of Bristol</institution>
            <addr-line>Digital Health, First Floor</addr-line>
            <addr-line>1 Cathedral Square</addr-line>
            <addr-line>Bristol, BS1 5DD</addr-line>
            <country>United Kingdom</country>
            <phone>44 117 45 50375</phone>
            <email>toby.perrett@bristol.ac.uk</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-1676-3729</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Masullo</surname>
            <given-names>Alessandro</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6510-835X</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Damen</surname>
            <given-names>Dima</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8804-6238</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Burghardt</surname>
            <given-names>Tilo</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-8506-012X</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Craddock</surname>
            <given-names>Ian</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6552-8541</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Mirmehdi</surname>
            <given-names>Majid</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6478-1403</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>University of Bristol</institution>
        <addr-line>Bristol</addr-line>
        <country>United Kingdom</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Toby Perrett <email>toby.perrett@bristol.ac.uk</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>9</month>
        <year>2022</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>14</day>
        <month>9</month>
        <year>2022</year>
      </pub-date>
      <volume>6</volume>
      <issue>9</issue>
      <elocation-id>e33606</elocation-id>
      <history>
        <date date-type="received">
          <day>15</day>
          <month>9</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>19</day>
          <month>1</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>15</day>
          <month>3</month>
          <year>2022</year>
        </date>
        <date date-type="accepted">
          <day>25</day>
          <month>3</month>
          <year>2022</year>
        </date>
      </history>
      <copyright-statement>©Toby Perrett, Alessandro Masullo, Dima Damen, Tilo Burghardt, Ian Craddock, Majid Mirmehdi. Originally published in JMIR Formative Research (https://formative.jmir.org), 14.09.2022.</copyright-statement>
      <copyright-year>2022</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Formative Research, is properly cited. The complete bibliographic information, a link to the original publication on https://formative.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://formative.jmir.org/2022/9/e33606" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Calorimetry is both expensive and obtrusive but provides the only way to accurately measure energy expenditure in daily living activities of any specific person, as different people can use different amounts of energy despite performing the same actions in the same manner. Deep learning video analysis techniques have traditionally required a lot of data to train; however, recent advances in few-shot learning, where only a few training examples are necessary, have made developing personalized models without a calorimeter a possibility.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>The primary aim of this study is to determine which activities are most well suited to calibrate a vision-based personalized deep learning calorie estimation system for daily living activities.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The SPHERE (Sensor Platform for Healthcare in a Residential Environment) Calorie data set is used, which features 10 participants performing 11 daily living activities totaling 4.5 hours of footage. Calorimeter and video data are available for all recordings. A deep learning method is used to regress calorie predictions from video.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Models are personalized with 32 seconds from all 11 actions in the data set, and mean square error (MSE) is taken against a calorimeter ground truth. The best single action for calibration is <italic>wipe</italic> (1.40 MSE). The best pair of actions are <italic>sweep</italic> and <italic>sit</italic> (1.09 MSE). This compares favorably to using a whole 30-minute sequence containing 11 actions to calibrate (1.06 MSE).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>A vision-based deep learning energy expenditure estimation system for a wide range of daily living activities can be calibrated to a specific person with footage and calorimeter data from 32 seconds of sweeping and 32 seconds of sitting.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>energy expenditure</kwd>
        <kwd>calories</kwd>
        <kwd>calorimetry</kwd>
        <kwd>deep learning</kwd>
        <kwd>computer vision</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>The ability to measure energy expenditure is important in a wide variety of settings. Examples range from sports training [<xref ref-type="bibr" rid="ref1">1</xref>] to diabetes and cardiovascular disease monitoring [<xref ref-type="bibr" rid="ref2">2</xref>]. Of particular interest is obesity management, where the amount of activity found in sedentary people at work and in the home can make a large difference to their overall fitness [<xref ref-type="bibr" rid="ref3">3</xref>], especially when energy expenditure that is not due to exercise is taken into account [<xref ref-type="bibr" rid="ref4">4</xref>]. The most accurate ways to measure person-specific energy expenditure are to use a sealed chamber [<xref ref-type="bibr" rid="ref5">5</xref>] or indirect calorimetry [<xref ref-type="bibr" rid="ref6">6</xref>]. However, other than the upfront costs and time with such equipment, they are also intrusive and cumbersome when used for a significant length of time, and they require expert installation. Further, they are unsuitable for long-term deployment in homes (eg, for health monitoring applications), whether for large-scale studies or for individual cases.</p>
        <p>In the absence of such accurate measurements, clinicians have used metabolic equivalent task (MET) tables [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>] as an approximation, where each action has an associated energy expenditure value. This can be a time-consuming process, especially for a long sequence containing multiple activities, as each activity must be manually assigned start and end times. However, most importantly, METs are highly inaccurate compared to calorimetry. Hence, other approaches have sought to bridge the accuracy gap, while also reducing the burden on clinicians and annotators. For example, wearables have been explored as a cheaper, less intrusive, and more portable alternative [<xref ref-type="bibr" rid="ref9">9</xref>-<xref ref-type="bibr" rid="ref16">16</xref>] with improved results over METs. Large-scale home monitoring systems [<xref ref-type="bibr" rid="ref17">17</xref>-<xref ref-type="bibr" rid="ref19">19</xref>] have started to provide enough data to investigate computer vision approaches [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>], which are cheap, much less intrusive, and more accurate. This provides the opportunity to extend the monitoring of energy consumption from stationary work environments [<xref ref-type="bibr" rid="ref23">23</xref>-<xref ref-type="bibr" rid="ref25">25</xref>], where variation between different people cannot be accurately captured by self-reporting.</p>
        <p>The main problem with noncalorimeter-based approaches is that they still offer a <italic>general model</italic> only. That is, they will provide the same energy expenditure estimation for 2 individuals carrying out an action in a similar way, even though they may be using different amounts of energy.</p>
        <p>Our aim is to estimate energy expenditure from observations of a person’s physical movement. To this end, we train a deep learning model using footage of participants wearing calorimeters. Traditionally, deep learning methods have required a vast amount of data to personalize [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. However, we exploit recent advances that can adapt general models to specific tasks [<xref ref-type="bibr" rid="ref28">28</xref>-<xref ref-type="bibr" rid="ref32">32</xref>] and determine which small set of actions is best suited to personalizing a general model. This will reduce the amount of calorimeter time per participant necessary for model personalization and will demonstrate that vision-based deep learning models are suitable for use in real-world settings. This is the first time in the literature a personalized vision-based energy expenditure estimation training regime has been addressed. On a more fundamental level, determining which actions are most suitable for fine-tuning a deep neural network can also give an indication about which types of activity are necessary to indicate a person’s calorific profile. The approach introduced in this paper will be of practical use in many fields that monitor energy expenditure, such as sports training [<xref ref-type="bibr" rid="ref1">1</xref>], nutrition [<xref ref-type="bibr" rid="ref33">33</xref>], obesity management [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>], and so on.</p>
      </sec>
      <sec>
        <title>Materials</title>
        <p>For this study, we used the SPHERE (Sensor Platform for Healthcare in a Residential Environment) Calorie data set [<xref ref-type="bibr" rid="ref36">36</xref>]. We briefly recap the key properties here before explaining our neural network approach to provide personalized energy expenditure estimations.</p>
      </sec>
      <sec>
        <title>Data Collection</title>
        <p>A total of 10 participants performed a variety of daily living activities while using a K4b2 (COSMED) calorimeter. The activities consisted of the following: <italic>stand</italic>, <italic>sit</italic>, <italic>walk</italic>, <italic>wipe</italic>, <italic>vacuum</italic>, <italic>sweep</italic>, <italic>lie</italic>, <italic>exercise</italic>, <italic>stretch</italic>, <italic>clean</italic>, and <italic>read</italic>. The participants are filmed using an off-the-shelf RGB-D (Red, Green, Blue plus Depth) sensor, and the video footage is pseudonymized by extracting silhouettes [<xref ref-type="bibr" rid="ref37">37</xref>]. In total, 4.5 hours of footage at 30 frames per second and calorimeter data are available. To obtain a ground truth label for each video frame, calorimeter data are interpolated between each breath reading.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Ethics Approval</title>
        <p>No ethics approval was required for this study, as we only used publicly available anonymized data for the purpose it was designed for.</p>
      </sec>
      <sec>
        <title>Overview</title>
        <p>In this section, we will use our recently developed deep learning method [<xref ref-type="bibr" rid="ref30">30</xref>] and provide a brief overview. Deep learning models consist of a neural network architecture, which processes a data stream (to give the energy expenditure estimation in our case) with an associated training regime to adapt a randomly initialized model to the desired task—often referred to as a learned model.</p>
      </sec>
      <sec>
        <title>Architecture</title>
        <p>Deep neural network video architectures typically consist of 2 subnetworks, which are as follows: (1) a spatial subnetwork to extract useful features from each video frame—this part is necessary as the type of action currently being performed and the participant's body position can be an indicator of how much energy they are consuming. This is the convolutional neural network (<xref rid="figure1" ref-type="fig">Figure 1</xref>). Specifically, ResNet-18 [<xref ref-type="bibr" rid="ref38">38</xref>] with pretrained ImageNet [<xref ref-type="bibr" rid="ref39">39</xref>] weights is used; and (2) a temporal subnetwork to combine features extracted from each frame and to use this information to make an estimation—this part is necessary because just using 1 video frame is insufficient for energy consumption estimation; how fast participants move as well as their previous behavior and actions can have a great effect and must therefore be considered. For this stage, we deploy a temporal convolutional network [<xref ref-type="bibr" rid="ref40">40</xref>] (<xref rid="figure1" ref-type="fig">Figure 1</xref>).</p>
        <p>These 2 subnetworks are trained jointly (in this paper, we refer to this combined architecture as the “network”), so they can learn to specialize in short- or long-term observations effectively. Previous works have shown that around 30 seconds of video footage is required to accurately regress calorie values [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref36">36</xref>] as previous activity affects the current calorimeter reading. Thus, we take advantage of an architecture that uses the spatial subnetwork to observe at 1 frame per second and a temporal subnetwork to combine 30 seconds’ worth of spatial subnetwork features.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Neural network architecture for processing silhouette video streams, consisting of a convolutional neural network (CNN) for extracting frame features and a temporal convolutional network (TCN) for combining frame features over a period of 30 seconds. To achieve an initialization that can be quickly adapted to unseen participants, the main training objective is to minimize the calorie loss while maximizing the person loss. Seq: sequence.</p>
          </caption>
          <graphic xlink:href="formative_v6i9e33606_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Training</title>
        <p>Given an architecture to process the video data, along with silhouette videos and calorimeter readings, a training regime is required to learn from examples in a training set. As a large amount of data is usually required to train a neural network [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>], such networks are often “pretrained” on a related large data set, then “fine-tuned” on the data set being used. However, in the case of learning a personalized model, the data requirements are still too large to be used for conventional fine-tuning. Thus, we use our recently developed few-shot (otherwise known as “meta-learning” or “learning to learn”) technique [<xref ref-type="bibr" rid="ref30">30</xref>], which aims to learn a model that can be fine-tuned with a very small amount of data.</p>
        <p>Instead of optimizing the estimation of the current network, the training process optimizes the estimation of the network after it has been fine-tuned to a random participant from the training set, while an adversarial component aims to make the initialization agnostic to the participants in the training set. <xref rid="figure2" ref-type="fig">Figure 2</xref> provides an illustration of this process. Specifically, it shows that first, a small “task” is constructed from the training set, containing a small amount of silhouette video and associated calorimeter readings. Subsequently, 2 copies of the network initialization (ie, primary weights) are taken, which are named the task specialization and adversarial weights. The task specialization network is fine-tuned for a small number of iterations and becomes well suited to the current task. The adversarial weights are combined with an adversarial classifier, which are trained to predict which participant is used for this specific task. However, during this part, the gradients between the adversarial classifier and adversarial weights are negated. This means that as the adversarial classifier becomes better at classifying the person, the adversarial weights lose the ability to classify the person (ie, they become person agnostic). The task specialization and adversarial weights are finally merged back into the primary set of weights, and the process repeats with a different task. This process results in a set of primary weights that are agnostic to the participants in the training set yet are well suited to fine-tuning to unseen participants (<xref rid="figure2" ref-type="fig">Figure 2</xref>). For evaluation on an unseen participant, the primary set of weights are fine-tuned using a small amount of data from the unseen participant, and the adversarial component is not required because we want the evaluation network to be personalized to the evaluation participant.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Visualization of our data pipeline used to train and fine-tune a neural network, which is then used to provide personalized energy expenditure estimations from video.</p>
          </caption>
          <graphic xlink:href="formative_v6i9e33606_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Overview</title>
        <p>In this section, we outline our experiments and their results. Our aim is to find a network fine-tuning procedure that requires the minimum amount of data. In practice, this means less participant, clinician, and calorimeter time is required to personalize an energy expenditure model.</p>
      </sec>
      <sec>
        <title>Experimental Setup</title>
        <p>A leave-one-out cross validation is used. In other words, 9 participants are used to train the model, and the 10th is used for evaluation. This process is repeated for each participant. To provide context to our results, we compare them against the following baselines: (1) MET value, which is calculated using expert-labeled action start and end times; (2) no fine-tuning, which is a general model baseline as it can only make estimations with information learned from participants not being evaluated on; (3) fine-tune on one whole sequence of the participant the model is being personalized to—here, much more data are available to fine-tune than for the rest of our experiments, so this represents an upper bound for performance. The average length of a sequence is 30 minutes; (4) comparison with the work that introduces the meta-learning method used in this paper [<xref ref-type="bibr" rid="ref30">30</xref>], but only fine-tuned on the start of a sequence that contains frames without action labels; and (5) fine-tune using data from all 11 actions (32 seconds per action). This shows that standard training or fine-tuning fails with small amounts of data, even if fine-tuned with examples from all actions.</p>
        <p>Mean square error (MSE) of the neural network estimation against the ground truth calorimeter reading is used as the evaluation metric. Note that an error is calculated for every video frame (but the model will have seen the previous 30 seconds of video to make this prediction).</p>
        <p>There are 2 long (20-30 minutes) sequences per participant. For all experiments, the network is fine-tuned using data from sequence 1 and evaluated on sequence 2 and vice versa. This ensures that no data for evaluation have been seen during training or fine-tuning.</p>
      </sec>
      <sec>
        <title>Single-Action Personalization</title>
        <p>To fine-tune to the participant being used for evaluation, 60 video clips are used. As we are assessing how well the model personalizes using a single action, these 60 clips are taken from a 32-second block of video where the fine-tuning action first appears. Each clip contains 30 uniformly sampled frames from 30 seconds of video (ie, sampling 1 frame every second). Given 32 seconds of video at 30 frames per second, there are 32×30=960 frames. The first video clip uses frames 1, 31, …, 901. The second video clip uses frames 2, 32, …, 902, and so on.</p>
        <p>The first row of <xref ref-type="table" rid="table1">Table 1</xref> shows the results of fine-tuning on each action compared against the baselines listed above. We can see that 32 seconds of <italic>wipe</italic> is best for learning a personalized calorific profile. However, it is still short of the upper bound on performance. The model fine-tuned on a whole video sequence has an MSE of 1.06 compared to 1.40 for <italic>wipe</italic>.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Mean square error averaged across all participants.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="180"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="90"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Actions</td>
                <td colspan="2">Stand</td>
                <td colspan="2">Sit</td>
                <td colspan="2">Walk</td>
                <td colspan="2">Wipe</td>
                <td colspan="2">Vacuum</td>
                <td colspan="2">Sweep</td>
                <td colspan="2">Lie</td>
                <td colspan="2">Exercise</td>
                <td colspan="2">Stretch</td>
                <td colspan="2">Clean</td>
                <td>Read</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Single action</td>
                <td colspan="2">2.32</td>
                <td colspan="2">2.20</td>
                <td colspan="2">2.80</td>
                <td colspan="2">1.40<sup>a</sup></td>
                <td colspan="2">1.94</td>
                <td colspan="2">2.15</td>
                <td colspan="2">2.43</td>
                <td colspan="2">6.77</td>
                <td colspan="2">17.85</td>
                <td colspan="2">3.27</td>
                <td>2.47</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Action pairs</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Stand</td>
                <td colspan="2">2.55</td>
                <td colspan="2">—<sup>b</sup></td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sit</td>
                <td colspan="2">2.65</td>
                <td colspan="2">2.09</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Walk</td>
                <td colspan="2">2.87</td>
                <td colspan="2">2.57</td>
                <td colspan="2">2.72</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Wipe</td>
                <td colspan="2">1.52</td>
                <td colspan="2">1.50</td>
                <td colspan="2">1.72</td>
                <td colspan="2">1.55</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vacuum</td>
                <td colspan="2">1.40</td>
                <td colspan="2">1.77</td>
                <td colspan="2">1.74</td>
                <td colspan="2">1.34</td>
                <td colspan="2">2.01</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sweep</td>
                <td colspan="2">1.61</td>
                <td colspan="2">1.09<sup>c</sup></td>
                <td colspan="2">1.59</td>
                <td colspan="2">1.36</td>
                <td colspan="2">1.60</td>
                <td colspan="2">2.55</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lie</td>
                <td colspan="2">1.56</td>
                <td colspan="2">1.24</td>
                <td colspan="2">2.39</td>
                <td colspan="2">1.38</td>
                <td colspan="2">2.12</td>
                <td colspan="2">2.60</td>
                <td colspan="2">2.34</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Exercise</td>
                <td colspan="2">2.42</td>
                <td colspan="2">1.87</td>
                <td colspan="2">2.82</td>
                <td colspan="2">3.18</td>
                <td colspan="2">2.89</td>
                <td colspan="2">2.62</td>
                <td colspan="2">3.50</td>
                <td colspan="2">5.72</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Stretch</td>
                <td colspan="2">17.70</td>
                <td colspan="2">3.01</td>
                <td colspan="2">4.47</td>
                <td colspan="2">6.34</td>
                <td colspan="2">4.88</td>
                <td colspan="2">4.83</td>
                <td colspan="2">11.79</td>
                <td colspan="2">7.63</td>
                <td colspan="2">12.65</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clean</td>
                <td colspan="2">1.45</td>
                <td colspan="2">1.59</td>
                <td colspan="2">1.71</td>
                <td colspan="2">1.52</td>
                <td colspan="2">2.46</td>
                <td colspan="2">2.03</td>
                <td colspan="2">2.08</td>
                <td colspan="2">5.28</td>
                <td colspan="2">8.06</td>
                <td colspan="2">3.42</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Read</td>
                <td colspan="2">1.98</td>
                <td colspan="2">4.98</td>
                <td colspan="2">2.47</td>
                <td colspan="2">1.40</td>
                <td colspan="2">2.16</td>
                <td colspan="2">2.24</td>
                <td colspan="2">2.44</td>
                <td colspan="2">3.43</td>
                <td colspan="2">3.02</td>
                <td colspan="2">2.42</td>
                <td colspan="2">2.35</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Baselines</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MET<sup>d</sup></td>
                <td colspan="2">2.87</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Before train only</td>
                <td colspan="2">2.17</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>All actions (whole sequence)</td>
                <td colspan="2">1.06<sup>e</sup></td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>All actions (32s/action)</td>
                <td colspan="2">3.30</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sequence start [<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                <td colspan="2">1.74</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
                <td colspan="2">—</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>Best single action.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>Not applicable.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>Best action pair.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>MET: metabolic equivalent task.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>Best baseline.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Multiple Action Personalization</title>
        <p>With the hypothesis that a broader range of actions provides a better calorific profiling of a person, we deploy multiple actions to fine-tune. This is motivated by the example in <xref rid="figure3" ref-type="fig">Figure 3</xref> and the associated single-action personalization results, where fine-tuning on a whole sequence outperforms models fine-tuned on any single action. For the following experiments, we compare every pair of actions. For each action, the same amount of footage is available to fine-tune as there was in the previous experiments (ie, 32 seconds). <xref ref-type="table" rid="table1">Table 1</xref> also shows the results of all 2-action combinations averaged per participant. To verify that any improvement is not just due to an increase in fine-tuning data (ie, 64 seconds from 2 actions compared to 32 seconds from 1), we include single-action results with the larger 64 seconds of fine-tuning data.</p>
        <p>The best performing pair (<italic>sweep</italic> and <italic>sit</italic>) has an MSE of 1.09, which outperforms the best single action (<italic>wipe</italic>, MSE 1.40). It is also very close to the whole sequence baseline, despite using much less data (64 seconds compared to 30 minutes).</p>
        <p>An example of multiple-action fine-tuning is given in <xref rid="figure4" ref-type="fig">Figure 4</xref>, for which the whole sequence model performs the worst. The best single (<italic>wipe</italic>) and pair (<italic>sweep</italic> and <italic>sit</italic>) fine-tuned models are shown alongside models fine-tuned on the whole sequence and with all actions (32 seconds per action).</p>
        <p>Finally, <xref ref-type="table" rid="table2">Table 2</xref> details the baselines, single-action results, and selected double-action results for each person individually.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Example energy expenditure estimations from silhouettes (recorded at 30 frames per second) using single-action fine-tuning. The top example shows a success case in which a model fine-tuned using only 32 seconds of wipe outperforms the whole sequence baseline; it also shows that stretch is not a good action to use. The bottom example shows a failure case, where the models fine-tuned on a single action do not adapt to the period of high energy expenditure toward the end of a sequence. Seq: sequence.</p>
          </caption>
          <graphic xlink:href="formative_v6i9e33606_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>An example sequence of silhouettes and energy expenditure estimations. Here, the best pair of actions for calibration across all participants is compared against the best single action, a whole video sequence to calibrate, and shorter footage from every action. Seq: sequence.</p>
          </caption>
          <graphic xlink:href="formative_v6i9e33606_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Mean square error of baselines and single- and selected double-action fine-tuned models. The results are shown for each participant (“Pn”) individually along with the average over all participants. A blank entry indicates the action was not in the video sequence used for fine-tuning.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="230"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="60"/>
            <col width="0"/>
            <col width="60"/>
            <col width="0"/>
            <col width="60"/>
            <col width="0"/>
            <col width="60"/>
            <col width="0"/>
            <col width="60"/>
            <col width="0"/>
            <col width="60"/>
            <col width="0"/>
            <col width="70"/>
            <col width="0"/>
            <col width="0"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Actions</td>
                <td colspan="21">Participants</td>
                <td>Average</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <break/>
                </td>
                <td colspan="2">P1</td>
                <td colspan="2">P2</td>
                <td colspan="2">P3</td>
                <td colspan="2">P4</td>
                <td colspan="2">P5</td>
                <td colspan="2">P6</td>
                <td colspan="2">P7</td>
                <td colspan="2">P8</td>
                <td colspan="2">P9</td>
                <td colspan="2">P10</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">
                  <bold>Baselines</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>MET<sup>a</sup></td>
                <td colspan="2">2.19</td>
                <td colspan="2">2.56</td>
                <td colspan="2">1.76</td>
                <td colspan="2">0.22</td>
                <td colspan="2">2.52</td>
                <td colspan="2">3.96</td>
                <td colspan="2">8.81</td>
                <td colspan="2">1.72</td>
                <td colspan="2">1.84</td>
                <td colspan="2">3.14</td>
                <td colspan="3">2.87</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Before train only</td>
                <td colspan="2">1.38</td>
                <td colspan="2">0.82</td>
                <td colspan="2">0.87</td>
                <td colspan="2">0.69</td>
                <td colspan="2">1.46</td>
                <td colspan="2">3.55</td>
                <td colspan="2">7.41</td>
                <td colspan="2">0.71</td>
                <td colspan="2">1.43</td>
                <td colspan="2">3.34</td>
                <td colspan="3">2.17</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>All (whole sequence)</td>
                <td colspan="2">0.60</td>
                <td colspan="2">0.54</td>
                <td colspan="2">0.62</td>
                <td colspan="2">0.14</td>
                <td colspan="2">1.54</td>
                <td colspan="2">1.54</td>
                <td colspan="2">1.75</td>
                <td colspan="2">0.28</td>
                <td colspan="2">0.55</td>
                <td colspan="2">2.02</td>
                <td colspan="3">1.06<sup>b</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>All (32s/action)</td>
                <td colspan="2">0.85</td>
                <td colspan="2">0.41</td>
                <td colspan="2">0.74</td>
                <td colspan="2">0.09</td>
                <td colspan="2">1.11</td>
                <td colspan="2">2.53</td>
                <td colspan="2">22.79</td>
                <td colspan="2">0.79</td>
                <td colspan="2">0.63</td>
                <td colspan="2">3.10</td>
                <td colspan="3">3.30</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sequence start [<xref ref-type="bibr" rid="ref30">30</xref>]</td>
                <td colspan="2">0.29</td>
                <td colspan="2">0.58</td>
                <td colspan="2">0.54</td>
                <td colspan="2">0.29</td>
                <td colspan="2">1.25</td>
                <td colspan="2">2.30</td>
                <td colspan="2">3.24</td>
                <td colspan="2">3.50</td>
                <td colspan="2">0.65</td>
                <td colspan="2">4.73</td>
                <td colspan="3">1.74</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Single action</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Stand</td>
                <td colspan="2">0.53</td>
                <td colspan="2">0.67</td>
                <td colspan="2">0.60</td>
                <td colspan="2">0.50</td>
                <td colspan="2">1.10</td>
                <td colspan="2">5.04</td>
                <td colspan="2">4.26</td>
                <td colspan="2">2.20</td>
                <td colspan="2">0.59</td>
                <td colspan="2">7.66</td>
                <td colspan="3">2.32</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sit</td>
                <td colspan="2">0.49</td>
                <td colspan="2">0.92</td>
                <td colspan="2">0.42</td>
                <td colspan="2">0.21</td>
                <td colspan="2">1.13</td>
                <td colspan="2">3.02</td>
                <td colspan="2">3.35</td>
                <td colspan="2">3.12</td>
                <td colspan="2">0.42</td>
                <td colspan="2">8.96</td>
                <td colspan="3">2.20</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Walk</td>
                <td colspan="2">0.80</td>
                <td colspan="2">0.53</td>
                <td colspan="2">0.47</td>
                <td colspan="2">0.29</td>
                <td colspan="2">2.07</td>
                <td colspan="2">7.78</td>
                <td colspan="2">4.32</td>
                <td colspan="2">2.28</td>
                <td colspan="2">0.47</td>
                <td colspan="2">8.97</td>
                <td colspan="3">2.80</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Wipe</td>
                <td colspan="2">0.29</td>
                <td colspan="2">1.36</td>
                <td colspan="2">0.45</td>
                <td colspan="2">0.36</td>
                <td colspan="2">0.73</td>
                <td colspan="2">3.37</td>
                <td colspan="2">2.95</td>
                <td colspan="2">1.80</td>
                <td colspan="2">0.48</td>
                <td colspan="2">2.17</td>
                <td colspan="3">1.40<sup>c</sup></td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Vacuum</td>
                <td colspan="2">0.79</td>
                <td colspan="2">0.63</td>
                <td colspan="2">0.54</td>
                <td colspan="2">0.60</td>
                <td colspan="2">1.67</td>
                <td colspan="2">2.95</td>
                <td colspan="2">5.18</td>
                <td colspan="2">1.89</td>
                <td colspan="2">0.85</td>
                <td colspan="2">4.29</td>
                <td colspan="3">1.94</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Sweep</td>
                <td colspan="2">1.01</td>
                <td colspan="2">0.57</td>
                <td colspan="2">0.81</td>
                <td colspan="2">0.47</td>
                <td colspan="2">0.62</td>
                <td colspan="2">2.85</td>
                <td colspan="2">9.24</td>
                <td colspan="2">3.29</td>
                <td colspan="2">0.39</td>
                <td colspan="2">2.31</td>
                <td colspan="3">2.15</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Lie</td>
                <td colspan="2">1.52</td>
                <td colspan="2">0.70</td>
                <td colspan="2">1.14</td>
                <td colspan="2">1.29</td>
                <td colspan="2">0.92</td>
                <td colspan="2">3.04</td>
                <td colspan="2">10.59</td>
                <td colspan="2">1.53</td>
                <td colspan="2">1.35</td>
                <td colspan="2">2.22</td>
                <td colspan="3">2.43</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Exercise</td>
                <td colspan="2">1.56</td>
                <td colspan="2">0.76</td>
                <td colspan="2">—<sup>d</sup></td>
                <td colspan="2">2.96</td>
                <td colspan="2">0.59</td>
                <td colspan="2">5.74</td>
                <td colspan="2">7.59</td>
                <td colspan="2">7.47</td>
                <td colspan="2">0.80</td>
                <td colspan="2">33.41</td>
                <td colspan="3">6.77</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Stretch</td>
                <td colspan="2">5.93</td>
                <td colspan="2">46.52</td>
                <td colspan="2">0.48</td>
                <td colspan="2">5.82</td>
                <td colspan="2">5.16</td>
                <td colspan="2">21.19</td>
                <td colspan="2">30.64</td>
                <td colspan="2">13.86</td>
                <td colspan="2">30.81</td>
                <td colspan="2">18.05</td>
                <td colspan="3">17.85</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Clean</td>
                <td colspan="2">1.17</td>
                <td colspan="2">2.15</td>
                <td colspan="2">0.94</td>
                <td colspan="2">0.32</td>
                <td colspan="2">1.04</td>
                <td colspan="2">5.93</td>
                <td colspan="2">8.94</td>
                <td colspan="2">2.17</td>
                <td colspan="2">4.65</td>
                <td colspan="2">5.35</td>
                <td colspan="3">3.27</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Read</td>
                <td colspan="2">2.05</td>
                <td colspan="2">1.35</td>
                <td colspan="2">0.84</td>
                <td colspan="2">0.56</td>
                <td colspan="2">0.81</td>
                <td colspan="2">2.53</td>
                <td colspan="2">7.50</td>
                <td colspan="2">1.92</td>
                <td colspan="2">2.22</td>
                <td colspan="2">4.90</td>
                <td colspan="3">2.47</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Action pairs</bold>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td rowspan="2">
                  <break/>
                </td>
                <td>Sweep/sit</td>
                <td colspan="2">0.96</td>
                <td colspan="2">0.67</td>
                <td colspan="2">0.47</td>
                <td colspan="2">0.13</td>
                <td colspan="2">0.90</td>
                <td colspan="2">2.51</td>
                <td colspan="2">1.02</td>
                <td colspan="2">0.99</td>
                <td colspan="2">0.47</td>
                <td colspan="2">2.75</td>
                <td colspan="3">1.09<sup>e</sup></td>
              </tr>
              <tr valign="top">
                <td>Lie/sit</td>
                <td colspan="2">0.61</td>
                <td colspan="2">0.53</td>
                <td colspan="2">0.43</td>
                <td colspan="2">0.45</td>
                <td colspan="2">0.82</td>
                <td colspan="2">2.69</td>
                <td colspan="2">3.00</td>
                <td colspan="2">1.07</td>
                <td colspan="2">0.60</td>
                <td colspan="2">2.24</td>
                <td colspan="3">1.24</td>
              </tr>
              <tr valign="top">
                <td rowspan="2">
                  <break/>
                </td>
                <td>Vacuum/stand</td>
                <td colspan="2">0.87</td>
                <td colspan="2">0.57</td>
                <td colspan="2">0.38</td>
                <td colspan="2">0.14</td>
                <td colspan="2">1.53</td>
                <td colspan="2">3.39</td>
                <td colspan="2">1.73</td>
                <td colspan="2">0.78</td>
                <td colspan="2">0.61</td>
                <td colspan="2">4.04</td>
                <td colspan="3">1.40</td>
              </tr>
              <tr valign="top">
                <td>Vacuum/wipe</td>
                <td colspan="2">0.48</td>
                <td colspan="2">0.64</td>
                <td colspan="2">0.64</td>
                <td colspan="2">0.19</td>
                <td colspan="2">1.21</td>
                <td colspan="2">3.25</td>
                <td colspan="2">1.59</td>
                <td colspan="2">1.63</td>
                <td colspan="2">0.60</td>
                <td colspan="2">3.15</td>
                <td colspan="3">1.34</td>
              </tr>
              <tr valign="top">
                <td rowspan="2">
                  <break/>
                </td>
                <td>Sweep/wipe</td>
                <td colspan="2">0.60</td>
                <td colspan="2">0.59</td>
                <td colspan="2">0.67</td>
                <td colspan="2">0.16</td>
                <td colspan="2">1.01</td>
                <td colspan="2">2.52</td>
                <td colspan="2">4.16</td>
                <td colspan="2">1.02</td>
                <td colspan="2">0.54</td>
                <td colspan="2">2.35</td>
                <td colspan="3">1.36</td>
              </tr>
              <tr valign="top">
                <td>Wipe/wipe</td>
                <td colspan="2">0.57</td>
                <td colspan="2">0.95</td>
                <td colspan="2">0.48</td>
                <td colspan="2">0.11</td>
                <td colspan="2">1.07</td>
                <td colspan="2">3.88</td>
                <td colspan="2">3.43</td>
                <td colspan="2">1.98</td>
                <td colspan="2">0.56</td>
                <td colspan="2">2.42</td>
                <td colspan="3">1.55</td>
              </tr>
              <tr valign="top">
                <td rowspan="2">
                  <break/>
                </td>
                <td>Stretch/exercise</td>
                <td colspan="2">2.83</td>
                <td colspan="2">2.19</td>
                <td colspan="2">—</td>
                <td colspan="2">4.18</td>
                <td colspan="2">3.58</td>
                <td colspan="2">8.74</td>
                <td colspan="2">14.63</td>
                <td colspan="2">8.93</td>
                <td colspan="2">0.93</td>
                <td colspan="2">22.70</td>
                <td colspan="3">7.63</td>
              </tr>
              <tr valign="top">
                <td>Clean/stretch</td>
                <td colspan="2">5.01</td>
                <td colspan="2">5.39</td>
                <td colspan="2">0.57</td>
                <td colspan="2">2.20</td>
                <td colspan="2">2.79</td>
                <td colspan="2">11.90</td>
                <td colspan="2">21.57</td>
                <td colspan="2">7.26</td>
                <td colspan="2">17.12</td>
                <td colspan="2">6.80</td>
                <td colspan="3">8.06</td>
              </tr>
              <tr valign="top">
                <td rowspan="2">
                  <break/>
                </td>
                <td>Stretch/lie</td>
                <td colspan="2">1.78</td>
                <td colspan="2">9.14</td>
                <td colspan="2">0.61</td>
                <td colspan="2">1.19</td>
                <td colspan="2">3.70</td>
                <td colspan="2">2.98</td>
                <td colspan="2">77.20</td>
                <td colspan="2">3.46</td>
                <td colspan="2">9.64</td>
                <td colspan="2">8.23</td>
                <td colspan="3">11.79</td>
              </tr>
              <tr valign="top">
                <td>Stretch/stand</td>
                <td colspan="2">1.72</td>
                <td colspan="2">2.63</td>
                <td colspan="2">0.56</td>
                <td colspan="2">1.72</td>
                <td colspan="2">1.96</td>
                <td colspan="2">8.08</td>
                <td colspan="2">146.70</td>
                <td colspan="2">5.08</td>
                <td colspan="2">3.49</td>
                <td colspan="2">5.01</td>
                <td colspan="3">17.70</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>MET: metabolic equivalent task.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Best baseline.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>Best single action.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>Blank entries indicate the action was not in the video sequence used for fine-tuning.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>Best action pair.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Single or Pair Difference</title>
        <p>The results presented above raise several points for discussion. Perhaps the most important is why the best single action to fine-tune with (<italic>wipe</italic>) is not part of the best pair to fine-tune with (<italic>sweep</italic> and <italic>sit</italic>). Given a distribution of calorimeter or silhouette sequences (which contain a wide variety of actions and calorific profiles), we would expect fine-tuning with 1 action to cover the middle of this distribution. If 2 actions are available, then each can be representative of more extreme parts of the energy expenditure or silhouette distribution while still adequately covering the middle of the distribution; 2 actions outperforming 1 corresponds to this intuition.</p>
      </sec>
      <sec>
        <title>Action Variation</title>
        <p>Another interesting observation is that there is a large amount of variation when fine-tuning using different actions. For example, fine-tuning using <italic>stretch</italic> is much worse than any other single action (17.85 MSE compared to the baseline 1.06 and second worst 6.77). One possible reason is that a participant stretching produces very different silhouettes compared to any of the other actions they perform. If a model is fine-tuned using these silhouettes, it has been conditioned to very different data compared to the other actions and thus gives bad estimations. A similar effect can be seen with <italic>exercise</italic>, which has less extreme but different silhouettes (6.77 MSE). This reasoning also applies to specific actions outperforming models fine-tuned on the sequence start. The sequence start may not provide enough information about a participant’s calorific profile for the fine-tuned model to work well across a wide variety of actions.</p>
      </sec>
      <sec>
        <title>Participant Variation</title>
        <p>There is also a difference in how all methods perform on specific participants. In particular, all models struggle on P10, with even the model fine-tuned on a whole sequence giving an MSE of 2.02. This is unlikely to be caused by visual differences (in the way that models fine-tuned on <italic>stretch</italic> are) as all actions perform poorly. Rather, it is most likely due to P10 having a calorific profile that is very dissimilar to those found in all the other participants and could possibly be remedied by collecting data from more participants to use during the training of the initialization.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>In this paper, we showed that a personalized calorie expenditure model that is more accurate than other existing techniques (bar intrusive calorimetry devices) is possible using a vision-based deep learning technique. The method can be personalized and can perform indefinitely in clinical and home environments after just 64 seconds of calorimeter calibration.</p>
        <p>Our method uses a state-of-the-art deep learning technique, which learns an initialization from a data set containing calorimeter readings of footage from multiple participants. The initialization can then be adapted quickly to a participant unseen in the training set with footage and calorimeter readings of them <italic>sweeping</italic> for 32 seconds and <italic>sitting</italic> for 32 seconds. This personalized model outperforms the general models that have been used in the past.</p>
        <p>The method outlined in this paper provides some benefits. It is suitable for long-term continuous monitoring of energy expenditure in daily-living scenarios and environments as it is noninvasive and does not require any change to participant behavior. It requires very little expensive clinician and calorimeter time to personalize, and it only needs a relatively cheap RGB-D sensor. Further, it does not require any human annotation of actions or activities after recording has finished.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">MET</term>
          <def>
            <p>metabolic equivalent task</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">MSE</term>
          <def>
            <p>mean square error</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">RGB-D</term>
          <def>
            <p>Red, Green, Blue plus Depth</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">SPHERE</term>
          <def>
            <p>Sensor Platform for Healthcare in a Residential Environment</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This work was performed under the SPHERE (Sensor Platform for Healthcare in a Residential Environment) Next Steps Project funded by the UK Engineering and Physical Sciences Research Council (EPSRC), Grant EP/R005273/1.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vogt</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Heinrich</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Schumacher</surname>
              <given-names>YO</given-names>
            </name>
            <name name-style="western">
              <surname>Grosshauser</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>König</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Berg</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Schmid</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Energy intake and energy expenditure of elite cyclists during preseason training</article-title>
          <source>Int J Sports Med</source>
          <year>2005</year>
          <month>10</month>
          <volume>26</volume>
          <issue>8</issue>
          <fpage>701</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1055/s-2004-830438</pub-id>
          <pub-id pub-id-type="medline">16158378</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Zderic</surname>
              <given-names>TW</given-names>
            </name>
          </person-group>
          <article-title>Role of low energy expenditure and sitting in obesity, metabolic syndrome, type 2 diabetes, and cardiovascular disease</article-title>
          <source>Diabetes</source>
          <year>2007</year>
          <month>11</month>
          <volume>56</volume>
          <issue>11</issue>
          <fpage>2655</fpage>
          <lpage>67</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://diabetes.diabetesjournals.org/content/56/11/2655.short"/>
          </comment>
          <pub-id pub-id-type="doi">10.2337/db07-0882</pub-id>
          <pub-id pub-id-type="medline">17827399</pub-id>
          <pub-id pub-id-type="pii">db07-0882</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Epstein</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Paluch</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Consalvi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Riordan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Scholl</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Effects of manipulating sedentary behavior on physical activity and food intake</article-title>
          <source>J Pediatr</source>
          <year>2002</year>
          <month>03</month>
          <volume>140</volume>
          <issue>3</issue>
          <fpage>334</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1067/mpd.2002.122395</pub-id>
          <pub-id pub-id-type="medline">11953732</pub-id>
          <pub-id pub-id-type="pii">S0022-3476(02)98040-6</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Villablanca</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Alegria</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Mookadam</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Wright</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Nonexercise activity thermogenesis in obesity management</article-title>
          <source>Mayo Clin Proc</source>
          <year>2015</year>
          <month>04</month>
          <volume>90</volume>
          <issue>4</issue>
          <fpage>509</fpage>
          <lpage>19</lpage>
          <pub-id pub-id-type="doi">10.1016/j.mayocp.2015.02.001</pub-id>
          <pub-id pub-id-type="medline">25841254</pub-id>
          <pub-id pub-id-type="pii">S0025-6196(15)00123-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ravussin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Lillioja</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>TE</given-names>
            </name>
            <name name-style="western">
              <surname>Christin</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bogardus</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Determinants of 24-hour energy expenditure in man. Methods and results using a respiratory chamber</article-title>
          <source>J Clin Invest</source>
          <year>1986</year>
          <month>12</month>
          <day>1</day>
          <volume>78</volume>
          <issue>6</issue>
          <fpage>1568</fpage>
          <lpage>1578</lpage>
          <pub-id pub-id-type="doi">10.1172/jci112749</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferrannini</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>The theoretical bases of indirect calorimetry: A review</article-title>
          <source>Metabolism</source>
          <year>1988</year>
          <month>03</month>
          <volume>37</volume>
          <issue>3</issue>
          <fpage>287</fpage>
          <lpage>301</lpage>
          <pub-id pub-id-type="doi">10.1016/0026-0495(88)90110-2</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Byrne</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Hills</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Hunter</surname>
              <given-names>GR</given-names>
            </name>
            <name name-style="western">
              <surname>Weinsier</surname>
              <given-names>RL</given-names>
            </name>
            <name name-style="western">
              <surname>Schutz</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Metabolic equivalent: one size does not fit all</article-title>
          <source>J Appl Physiol (1985)</source>
          <year>2005</year>
          <month>09</month>
          <volume>99</volume>
          <issue>3</issue>
          <fpage>1112</fpage>
          <lpage>9</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.physiology.org/doi/10.1152/japplphysiol.00023.2004?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1152/japplphysiol.00023.2004</pub-id>
          <pub-id pub-id-type="medline">15831804</pub-id>
          <pub-id pub-id-type="pii">00023.2004</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ainsworth</surname>
              <given-names>BE</given-names>
            </name>
            <name name-style="western">
              <surname>Haskell</surname>
              <given-names>WL</given-names>
            </name>
            <name name-style="western">
              <surname>Whitt</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Irwin</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Swartz</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Strath</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>O'Brien</surname>
              <given-names>WL</given-names>
            </name>
            <name name-style="western">
              <surname>Bassett</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Schmitz</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Emplaincourt</surname>
              <given-names>PO</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobs</surname>
              <given-names>DR</given-names>
            </name>
            <name name-style="western">
              <surname>Leon</surname>
              <given-names>AS</given-names>
            </name>
          </person-group>
          <article-title>Compendium of physical activities: an update of activity codes and MET intensities</article-title>
          <source>Med Sci Sports Exerc</source>
          <year>2000</year>
          <month>09</month>
          <volume>32</volume>
          <issue>9 Suppl</issue>
          <fpage>S498</fpage>
          <lpage>504</lpage>
          <pub-id pub-id-type="doi">10.1097/00005768-200009001-00009</pub-id>
          <pub-id pub-id-type="medline">10993420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berntsen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Hageberg</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aandstad</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mowinckel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Anderssen</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Carlsen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Andersen</surname>
              <given-names>LB</given-names>
            </name>
          </person-group>
          <article-title>Validity of physical activity monitors in adults participating in free-living activities</article-title>
          <source>Br J Sports Med</source>
          <year>2010</year>
          <month>07</month>
          <day>15</day>
          <volume>44</volume>
          <issue>9</issue>
          <fpage>657</fpage>
          <lpage>64</lpage>
          <pub-id pub-id-type="doi">10.1136/bjsm.2008.048868</pub-id>
          <pub-id pub-id-type="medline">18628358</pub-id>
          <pub-id pub-id-type="pii">bjsm.2008.048868</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Driscoll</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Turicchi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Beaulieu</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Matu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Deighton</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Stubbs</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>How well do activity monitors estimate energy expenditure? A systematic review and meta-analysis of the validity of current technologies</article-title>
          <source>Br J Sports Med</source>
          <year>2020</year>
          <month>03</month>
          <day>07</day>
          <volume>54</volume>
          <issue>6</issue>
          <fpage>332</fpage>
          <lpage>340</lpage>
          <pub-id pub-id-type="doi">10.1136/bjsports-2018-099643</pub-id>
          <pub-id pub-id-type="medline">30194221</pub-id>
          <pub-id pub-id-type="pii">bjsports-2018-099643</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Conger</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>SN</given-names>
            </name>
            <name name-style="western">
              <surname>Bassett</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Predicting energy expenditure through hand rim propulsion power output in individuals who use wheelchairs</article-title>
          <source>Br J Sports Med</source>
          <year>2014</year>
          <month>07</month>
          <day>13</day>
          <volume>48</volume>
          <issue>13</issue>
          <fpage>1048</fpage>
          <lpage>53</lpage>
          <pub-id pub-id-type="doi">10.1136/bjsports-2014-093540</pub-id>
          <pub-id pub-id-type="medline">24825852</pub-id>
          <pub-id pub-id-type="pii">bjsports-2014-093540</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rosenberger</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Buman</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Haskell</surname>
              <given-names>WL</given-names>
            </name>
            <name name-style="western">
              <surname>McConnell</surname>
              <given-names>MV</given-names>
            </name>
            <name name-style="western">
              <surname>Carstensen</surname>
              <given-names>LL</given-names>
            </name>
          </person-group>
          <article-title>Twenty-four hours of sleep, sedentary behavior, and physical activity with nine wearable devices</article-title>
          <source>Med Sci Sports Exerc</source>
          <year>2016</year>
          <month>03</month>
          <volume>48</volume>
          <issue>3</issue>
          <fpage>457</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26484953"/>
          </comment>
          <pub-id pub-id-type="doi">10.1249/MSS.0000000000000778</pub-id>
          <pub-id pub-id-type="medline">26484953</pub-id>
          <pub-id pub-id-type="pmcid">PMC4760880</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kuffel</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Crouter</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Haas</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Frongillo</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Bassett</surname>
              <given-names>DR</given-names>
            </name>
          </person-group>
          <article-title>Validity of estimating minute-by-minute energy expenditure of continuous walking bouts by accelerometry</article-title>
          <source>Int J Behav Nutr Phys Act</source>
          <year>2011</year>
          <month>08</month>
          <day>24</day>
          <volume>8</volume>
          <issue>1</issue>
          <fpage>92</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ijbnpa.biomedcentral.com/articles/10.1186/1479-5868-8-92"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1479-5868-8-92</pub-id>
          <pub-id pub-id-type="medline">21864359</pub-id>
          <pub-id pub-id-type="pii">1479-5868-8-92</pub-id>
          <pub-id pub-id-type="pmcid">PMC3170241</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Driscoll</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Turicchi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Horgan</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Stubbs</surname>
              <given-names>JR</given-names>
            </name>
          </person-group>
          <article-title>Improving energy expenditure estimates from wearable devices: A machine learning approach</article-title>
          <source>J Sports Sci</source>
          <year>2020</year>
          <month>07</month>
          <day>06</day>
          <volume>38</volume>
          <issue>13</issue>
          <fpage>1496</fpage>
          <lpage>1505</lpage>
          <pub-id pub-id-type="doi">10.1080/02640414.2020.1746088</pub-id>
          <pub-id pub-id-type="medline">32252598</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Driscoll</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Turicchi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duarte</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Horgan</surname>
              <given-names>GW</given-names>
            </name>
            <name name-style="western">
              <surname>Finlayson</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Stubbs</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>Comparison of the validity and generalizability of machine learning algorithms for the prediction of energy expenditure: validation study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2021</year>
          <month>08</month>
          <day>04</day>
          <volume>9</volume>
          <issue>8</issue>
          <fpage>e23938</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2021/8/e23938/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/23938</pub-id>
          <pub-id pub-id-type="medline">34346890</pub-id>
          <pub-id pub-id-type="pii">v9i8e23938</pub-id>
          <pub-id pub-id-type="pmcid">PMC8374660</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilgen-Ammann</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Schweizer</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wyss</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Accuracy of the multisensory wristwatch polar vantage's estimation of energy expenditure in various activities: instrument validation study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2019</year>
          <month>10</month>
          <day>02</day>
          <volume>7</volume>
          <issue>10</issue>
          <fpage>e14534</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2019/10/e14534/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14534</pub-id>
          <pub-id pub-id-type="medline">31579020</pub-id>
          <pub-id pub-id-type="pii">v7i10e14534</pub-id>
          <pub-id pub-id-type="pmcid">PMC6777286</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Elsts</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Burghardt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Byrne</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Camplani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Damen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Fafoutis</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Hannuna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Harwin</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Holmes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Janko</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Ponce Lopez</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Masullo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mirmehdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Oikonomou</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Piechocki</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sherratt</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tonkin</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Twomey</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Vafeas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Woznowski</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Craddock</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>A guide to the SPHERE 100 homes study dataset</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <access-date>2022-07-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/1805.11907">http://arxiv.org/abs/1805.11907</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Koperski</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Minciullo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Garattoni</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bremond</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Francesca</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Toyota Smarthome: Real-World Activities of Daily Living</article-title>
          <year>2019</year>
          <conf-name>International Conference on Computer Vision (ICCV)</conf-name>
          <conf-date>October 27, 2019 - November 02, 2019</conf-date>
          <conf-loc>Seoul, South Korea</conf-loc>
          <pub-id pub-id-type="doi">10.1109/ICCV.2019.00092</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Salatino</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gower</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ghrissi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tapus</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Wieczorowska-Tobis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Suwalska</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barattini</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Rosso</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Munaro</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bellotto</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>van den Heuvel</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The EnrichMe Project</article-title>
          <source>Computers Helping People with Special Needs. ICCHP 2016. Lecture Notes in Computer Science</source>
          <year>2016</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>326</fpage>
          <lpage>334</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Burghardt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mirmehdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Damen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Camplani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hannuna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Paiement</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Craddock</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Energy expenditure estimation using visual and inertial sensors</article-title>
          <source>IET Computer Vision</source>
          <year>2017</year>
          <month>10</month>
          <day>27</day>
          <volume>12</volume>
          <issue>1</issue>
          <fpage>36</fpage>
          <lpage>47</lpage>
          <pub-id pub-id-type="doi">10.1049/iet-cvi.2017.0112</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Masullo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Burghardt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Damen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hannuna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ponce-López</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Mirmehdi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>CaloriNet: From Silhouettes to Calorie Estimation in Private Environments</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <access-date>2022-07-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1806.08152">https://arxiv.org/abs/1806.08152</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yeung</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Alahi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fei-Fei</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Jointly Learning Energy Expenditures and Activities Using Egocentric Multimodal Signals</article-title>
          <year>2017</year>
          <conf-name>Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>
          <conf-date>July 21-26, 2017</conf-date>
          <conf-loc>Honolulu, HI, USA</conf-loc>
          <fpage>6817</fpage>
          <lpage>6826</lpage>
          <pub-id pub-id-type="doi">10.1109/cvpr.2017.721</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>The energy expenditure of using a "walk-and-work" desk for office workers with obesity</article-title>
          <source>Br J Sports Med</source>
          <year>2007</year>
          <month>09</month>
          <day>01</day>
          <volume>41</volume>
          <issue>9</issue>
          <fpage>558</fpage>
          <lpage>61</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17504789"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bjsm.2006.032755</pub-id>
          <pub-id pub-id-type="medline">17504789</pub-id>
          <pub-id pub-id-type="pii">bjsm.2006.032755</pub-id>
          <pub-id pub-id-type="pmcid">PMC2465387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McAlpine</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Manohar</surname>
              <given-names>CU</given-names>
            </name>
            <name name-style="western">
              <surname>McCrady</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Hensrud</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>An office-place stepping device to promote workplace physical activity</article-title>
          <source>Br J Sports Med</source>
          <year>2007</year>
          <month>12</month>
          <day>18</day>
          <volume>41</volume>
          <issue>12</issue>
          <fpage>903</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/17513333"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bjsm.2006.034900</pub-id>
          <pub-id pub-id-type="medline">17513333</pub-id>
          <pub-id pub-id-type="pii">bjsm.2006.034900</pub-id>
          <pub-id pub-id-type="pmcid">PMC2658993</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Park</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Predicting energy expenditure during gradient walking with a foot monitoring device: model-based approach</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2019</year>
          <month>10</month>
          <day>23</day>
          <volume>7</volume>
          <issue>10</issue>
          <fpage>e12335</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2019/10/e12335/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12335</pub-id>
          <pub-id pub-id-type="medline">31647467</pub-id>
          <pub-id pub-id-type="pii">v7i10e12335</pub-id>
          <pub-id pub-id-type="pmcid">PMC6913720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krizhevsky</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sutskever</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Hinton</surname>
              <given-names>GE</given-names>
            </name>
          </person-group>
          <article-title>ImageNet classification with deep convolutional neural networks</article-title>
          <source>Commun. ACM</source>
          <year>2017</year>
          <month>05</month>
          <day>24</day>
          <volume>60</volume>
          <issue>6</issue>
          <fpage>84</fpage>
          <lpage>90</lpage>
          <pub-id pub-id-type="doi">10.1145/3065386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Carreira</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zisserman</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Quo Vadis, Action Recognition? A New Model and the Kinetics Dataset</article-title>
          <year>2017</year>
          <conf-name>Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>
          <conf-date>July 21-26, 2017</conf-date>
          <conf-loc>Honolulu, HI, USA</conf-loc>
          <fpage>4724</fpage>
          <lpage>4733</lpage>
          <pub-id pub-id-type="doi">10.1109/cvpr.2017.502</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Finn</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Abbeel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Levine</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Model-agnostic meta-learning for fast adaptation of deep networks</article-title>
          <source>arXiv</source>
          <year>2017</year>
          <access-date>2022-07-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1703.03400?context=cs">https://arxiv.org/abs/1703.03400?context=cs</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Snell</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Swersky</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zemel</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Prototypical Networks for Few-Shot Learning</article-title>
          <source>University of Toronto</source>
          <year>2017</year>
          <access-date>2022-07-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cs.toronto.edu/~zemel/documents/prototypical_networks_nips_2017.pdf">https://www.cs.toronto.edu/~zemel/documents/prototypical_networks_nips_2017.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perrett</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Masullo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Burghardt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mirmehdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Damen</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Meta-learning with context-agnostic initialisations</article-title>
          <source>Asian Conference on Computer Vision</source>
          <year>2021</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>70</fpage>
          <lpage>86</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ji</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Niebles</surname>
              <given-names>JC</given-names>
            </name>
          </person-group>
          <article-title>Few-shot video classification via temporal alignment</article-title>
          <source>Conference on Computer Vision and Pattern Recognition (CVPR)</source>
          <year>2020</year>
          <fpage>10615</fpage>
          <lpage>10624</lpage>
          <pub-id pub-id-type="doi">10.1109/cvpr42600.2020.01063</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perrett</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Masullo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Burghardt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mirmehdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Damen</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Temporal-Relational CrossTransformers for Few-Shot Action Recognition</article-title>
          <source>arXiv</source>
          <year>2021</year>
          <access-date>2022-07-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://arxiv.org/abs/2101.06184">http://arxiv.org/abs/2101.06184</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Blundell</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>NA</given-names>
            </name>
          </person-group>
          <article-title>Individual variability in compensatory eating following acute exercise in overweight and obese women</article-title>
          <source>Br J Sports Med</source>
          <year>2014</year>
          <month>10</month>
          <day>10</day>
          <volume>48</volume>
          <issue>20</issue>
          <fpage>1472</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1136/bjsports-2012-091721</pub-id>
          <pub-id pub-id-type="medline">23666018</pub-id>
          <pub-id pub-id-type="pii">bjsports-2012-091721</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ehrsam</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hoerler-Koerner</surname>
              <given-names>U</given-names>
            </name>
            <name name-style="western">
              <surname>Stoffel</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Melges</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Ainsworth</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Exercise prescription for the overweight and the obese: how to quantify and yet keep it simple</article-title>
          <source>Br J Sports Med</source>
          <year>2009</year>
          <month>12</month>
          <day>16</day>
          <volume>43</volume>
          <issue>12</issue>
          <fpage>951</fpage>
          <lpage>3</lpage>
          <pub-id pub-id-type="doi">10.1136/bjsm.2008.055657</pub-id>
          <pub-id pub-id-type="medline">19293164</pub-id>
          <pub-id pub-id-type="pii">bjsm.2008.055657</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Woo</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Garrow</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Pi-Sunyer</surname>
              <given-names>FX</given-names>
            </name>
          </person-group>
          <article-title>Effect of exercise on spontaneous calorie intake in obesity</article-title>
          <source>Am J Clin Nutr</source>
          <year>1982</year>
          <month>09</month>
          <volume>36</volume>
          <issue>3</issue>
          <fpage>470</fpage>
          <lpage>7</lpage>
          <pub-id pub-id-type="doi">10.1093/ajcn/36.3.470</pub-id>
          <pub-id pub-id-type="medline">7113952</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tao</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Burghardt</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mirmehdi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Damen</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cooper</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hannuna</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Camplani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Paiement</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Craddock</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Calorie counter: RGB-depth visual estimation of energy expenditure at home</article-title>
          <source>Computer Vision – ACCV 2016 Workshops</source>
          <year>2016</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>239</fpage>
          <lpage>251</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Hidalgo</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Simon</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>OpenPose: realtime multi-person 2D pose estimation using part affinity fields</article-title>
          <source>IEEE Trans. Pattern Anal. Mach. Intell</source>
          <year>2021</year>
          <month>1</month>
          <day>1</day>
          <volume>43</volume>
          <issue>1</issue>
          <fpage>172</fpage>
          <lpage>186</lpage>
          <pub-id pub-id-type="doi">10.1109/tpami.2019.2929257</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ren</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Deep Residual Learning for Image Recognition</article-title>
          <year>2016</year>
          <conf-name>Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>
          <conf-date>June 27-30, 2016</conf-date>
          <conf-loc>Las Vegas, NV, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/cvpr.2016.90</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dong</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Socher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fei-Fei</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>ImageNet: A large-scale hierarchical image database</article-title>
          <year>2009</year>
          <conf-name>Conference on Computer Vision and Pattern Recognition (CVPR)</conf-name>
          <conf-date>June 20-25, 2009</conf-date>
          <conf-loc>Miami, FL, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/cvpr.2009.5206848</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kolter</surname>
              <given-names>JZ</given-names>
            </name>
            <name name-style="western">
              <surname>Koltun</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>An Empirical Evaluation of Generic Convolutional and Recurrent Networks for Sequence Modeling</article-title>
          <source>arXiv</source>
          <year>2018</year>
          <access-date>2022-07-05</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1803.01271">https://arxiv.org/abs/1803.01271</ext-link>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
