<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMU</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Mhealth Uhealth</journal-id>
      <journal-title>JMIR mHealth and uHealth</journal-title>
      <issn pub-type="epub">2291-5222</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v9i1e21926</article-id>
      <article-id pub-id-type="pmid">33507156</article-id>
      <article-id pub-id-type="doi">10.2196/21926</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Deep Learning–Based Multimodal Data Fusion: Case Study in Food Intake Episodes Detection Using Wearable Sensors</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Buis</surname>
            <given-names>Lorraine</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Diou</surname>
            <given-names>Christos</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Goyal</surname>
            <given-names>Dileep</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Bahador</surname>
            <given-names>Nooshin</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Faculty of Information Technology and Electrical Engineering</institution>
            <institution>University of Oulu</institution>
            <addr-line>Pentti Kaiteran katu 1</addr-line>
            <addr-line>Oulu, FIN-90570</addr-line>
            <country>Finland</country>
            <phone>358 417246274</phone>
            <email>nooshin.bahador@oulu.fi</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4992-7275</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Ferreira</surname>
            <given-names>Denzil</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-2195-0449</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Tamminen</surname>
            <given-names>Satu</given-names>
          </name>
          <degrees>DSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-5215-6889</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Kortelainen</surname>
            <given-names>Jukka</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-2585-2376</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Faculty of Information Technology and Electrical Engineering</institution>
        <institution>University of Oulu</institution>
        <addr-line>Oulu</addr-line>
        <country>Finland</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Nooshin Bahador <email>nooshin.bahador@oulu.fi</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>1</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>28</day>
        <month>1</month>
        <year>2021</year>
      </pub-date>
      <volume>9</volume>
      <issue>1</issue>
      <elocation-id>e21926</elocation-id>
      <history>
        <date date-type="received">
          <day>29</day>
          <month>6</month>
          <year>2020</year>
        </date>
        <date date-type="rev-request">
          <day>1</day>
          <month>10</month>
          <year>2020</year>
        </date>
        <date date-type="rev-recd">
          <day>10</day>
          <month>11</month>
          <year>2020</year>
        </date>
        <date date-type="accepted">
          <day>18</day>
          <month>12</month>
          <year>2020</year>
        </date>
      </history>
      <copyright-statement>©Nooshin Bahador, Denzil Ferreira, Satu Tamminen, Jukka Kortelainen. Originally published in JMIR mHealth and uHealth (http://mhealth.jmir.org), 28.01.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR mHealth and uHealth, is properly cited. The complete bibliographic information, a link to the original publication on http://mhealth.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="http://mhealth.jmir.org/2021/1/e21926/" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Multimodal wearable technologies have brought forward wide possibilities in human activity recognition, and more specifically personalized monitoring of eating habits. The emerging challenge now is the selection of most discriminative information from high-dimensional data collected from multiple sources. The available fusion algorithms with their complex structure are poorly adopted to the computationally constrained environment which requires integrating information directly at the source. As a result, more simple low-level fusion methods are needed.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>In the absence of a data combining process, the cost of directly applying high-dimensional raw data to a deep classifier would be computationally expensive with regard to the response time, energy consumption, and memory requirement. Taking this into account, we aimed to develop a data fusion technique in a computationally efficient way to achieve a more comprehensive insight of human activity dynamics in a lower dimension. The major objective was considering statistical dependency of multisensory data and exploring intermodality correlation patterns for different activities.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>In this technique, the information in time (regardless of the number of sources) is transformed into a 2D space that facilitates classification of eating episodes from others. This is based on a hypothesis that data captured by various sensors are statistically associated with each other and the covariance matrix of all these signals has a unique distribution correlated with each activity which can be encoded on a contour representation. These representations are then used as input of a deep model to learn specific patterns associated with specific activity.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>In order to show the generalizability of the proposed fusion algorithm, 2 different scenarios were taken into account. These scenarios were different in terms of temporal segment size, type of activity, wearable device, subjects, and deep learning architecture. The first scenario used a data set in which a single participant performed a limited number of activities while wearing the Empatica E4 wristband. In the second scenario, a data set related to the activities of daily living was used where 10 different participants wore inertial measurement units while performing a more complex set of activities. The precision metric obtained from leave-one-subject-out cross-validation for the second scenario reached 0.803. The impact of missing data on performance degradation was also evaluated.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>To conclude, the proposed fusion technique provides the possibility of embedding joint variability information over different modalities in just a single 2D representation which results in obtaining a more global view of different aspects of daily human activities at hand, and yet preserving the desired performance level in activity recognition.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>deep learning</kwd>
        <kwd>image processing</kwd>
        <kwd>data fusion</kwd>
        <kwd>covariance distribution</kwd>
        <kwd>food intake episode</kwd>
        <kwd>wearable sensors</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>It is a proven fact that chronic diseases including obesity, diabetes, and metabolic disorders are highly correlated with eating behavior and regarding the importance of this issue, application of wearable sensors for capturing eating-related activities has been widely studied in the literature [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref6">6</xref>]. These studies can be categorized into 3 groups, including food intake detection, food type classification, and food content estimation. Among these groups, food intake detection has been considered as the first phase in food intake monitoring, and studies around it mainly focused on detecting chewing activity (acoustic-based assessment) [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref10">10</xref>] or hand gestures movement (motion-based assessment) [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>] during eating episodes. The majority of the proposed methods rely on single sensing approaches, for example, using electromyography sensor, accelerometer sensor, or microphone [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. However, it is believed that precisely discriminating eating episodes from other confounding activities requires processing multiple parameters from several sources. For this reason, multimodal assessment is a common target of interest today. Taking as an example, using data from both accelerometer and gyroscope sensors proposed in [<xref ref-type="bibr" rid="ref18">18</xref>] reached an accuracy of 75% in detecting eating activity. These kinds of sensors quantify specific features of hand-to-mouth gestures as well as jaw motion associated with dietary intake. Later on, adding images of food into data captured by accelerometer and gyroscope was suggested for eating episodes detection [<xref ref-type="bibr" rid="ref19">19</xref>]. Analysis of these meal images can also extract information of food content and estimate dietary energy intake. Data taken by GPS were also added as input parameters to correctly predict eating activity [<xref ref-type="bibr" rid="ref20">20</xref>]. Audio signals of chewing sound was a further option added to a data set of both motion data and meal images which improve the accuracy of eating periods detection up to 85% [<xref ref-type="bibr" rid="ref21">21</xref>]. Therefore, according to the aforementioned studies, it is valuable to develop algorithms that can take advantage of multiple data sources for monitoring applications rather than focusing on a single sensor. The sources of different modalities will provide richer information in comparison to a single source.</p>
      <p>However, although using different modalities provides further opportunities to explore more complementary information, the growing number of different modalities has brought new challenges due to increase in the volume and complexity of the data. For dealing with these high-dimensional data sets and lowering the computational time, some studies implement feature selection process including forward features selection [<xref ref-type="bibr" rid="ref22">22</xref>], random forest [<xref ref-type="bibr" rid="ref23">23</xref>], and principal component analysis [<xref ref-type="bibr" rid="ref24">24</xref>] to reduce the data size and select important parameters/features. For combining the information captured by different sensors, the classification score fusion has been introduced in literature as an option. Papapanagiotou et al [<xref ref-type="bibr" rid="ref25">25</xref>] fused support vector machine scores from both photoplethysmography and audio signals. Regarding discriminating eating episodes from other activities, researchers applied different classification tools from support vector machine [<xref ref-type="bibr" rid="ref26">26</xref>] to artificial neural network [<xref ref-type="bibr" rid="ref27">27</xref>]. They also found that appropriate epoch size ranges from 10 to 30 seconds [<xref ref-type="bibr" rid="ref28">28</xref>]. However, recent advances in machine learning methods have increasingly captured the attention of many research groups for distinguishing food intake intervals from others based on deep learning techniques. Convolutional neural network has been used for automatically detecting intake gestures from raw video frames [<xref ref-type="bibr" rid="ref29">29</xref>]. Convolutional neural network was also proposed by Ciocca et al [<xref ref-type="bibr" rid="ref30">30</xref>] for image-based food recognition.</p>
      <p>The aforementioned studies focused on data represented by features set and its corresponding fusion as well as decision fusion of classifiers. What remains to be addressed is investigating the sensor fusion for quantitatively integrating heterogeneous sources of information. Taking this into account, this study aimed to combine data derived from disparate sensors such that the resulting information has lower dimension and yet maintains the important aspects of original data.</p>
      <p>To the best of our knowledge, there is no research focused on sensor fusion for personalized activity identification using different data sets collected by wearable devices. The proposed fusion here is based on a hypothesis that data captured by multiple sources are statistically correlated with each other and their 2D covariance representation has a unique distribution associated with the type of activity.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Implementation of Sensor Fusion Algorithm</title>
        <p>The proposed algorithm automatically transformed data from different sensors in time into a single 2D color representation that provides fast effective support for discriminating eating episodes from others. The idea of this method was on the hypothesis that data driven by different sensors have correlation with each other and a covariance matrix of all these measurements has a unique distribution associated with each type of activity which can be visualized as a contour plot. With 2D covariance contour as input data sets, deep model–learned specific patterns in 2D correlation representation related to specific activity.</p>
        <p>The following is a summary of the steps followed in the proposed method to detect eating episodes:</p>
        <sec>
          <title>Step 1</title>
          <p>Forming the observation matrix derived from all sensors; the corresponding covariance matrix can then be formed in 2 ways. The first way is to calculate pairwise covariance between each sample across all signals. The second way is to calculate pairwise covariance between each signal across all samples. The algorithm steps based on the second way are as follows:</p>
          <p>The pairwise covariance calculation between each column combination:</p>
          <disp-formula>C<sub>ij</sub> = cov(H(:, i), H(:, j)) <bold>(1)</bold></disp-formula>
          <p>where H is observation matrix.</p>
          <p>The covariance coefficient of 2 columns of i and j can be calculated as follows:</p>
          <p>
            <disp-formula>cov(S<sub>i</sub>, S<sub>j</sub>)=1/(n–1)Σ<sup>m</sup><sub>k=1</sub>(S<sub>ik</sub>–µ<sub>i</sub>)(S<sub>jk</sub>–µ<sub>j</sub>) <bold>(2)</bold>
          </disp-formula>
          </p>
          <p>
            <disp-formula>S<sub>i</sub> = M(:, i), S<sub>j</sub> = M(:, j)
          </disp-formula>
          </p>
          <p>where μ<sub>i</sub> is the mean of S<sub>i</sub>, μ<sub>j</sub> is the mean of S<sub>j</sub>, and m is the number of samples within the window.</p>
        </sec>
        <sec>
          <title>Step 2</title>
          <p>Obtaining the covariance coefficient matrix of all columns according to the following equation:</p>
          <p>
            <disp-formula>
              <graphic xlink:href="mhealth_v9i1e21926_fig13.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
            </disp-formula>
          </p>
          <p>where n is the number of observations.</p>
        </sec>
        <sec>
          <title>Step 3</title>
          <p>Creating a filled contour plot containing the isolines of obtained matrix C so that given a value for covariance, lines are drawn for connecting the (x, y) coordinates where that covariance value occurs. The areas between the lines were then filled in solid color associated with the corresponding covariance value.</p>
        </sec>
        <sec>
          <title>Step 4</title>
          <p>Feeding contour plot to the deep network to classify the sequences related to each activity. Two different scenarios were considered for this study. These scenarios were different in terms of covariance matrix calculation, temporal segment size, type of activity, wearable device, subjects, and deep learning architecture. In the first scenario, calculating pairwise covariance between each sample across all signals was considered. In the second scenario, calculating pairwise covariance between each signal across all samples was taken into consideration.</p>
        </sec>
      </sec>
      <sec>
        <title>First Scenario for Evaluation of Algorithm</title>
        <p>In the first scenario, data were recorded from a single participant wearing the Empatica E4 wristband on the right hand for 3 days. The data set includes the following data: (1) ACC—data from 3-axis accelerometer sensor in the range [–2g, 2g] (sampled at 32 Hz); (2) BVP—data from photoplethysmograph (sampled at 64 Hz); (3) EDA—data from the electrodermal activity sensor in microsiemens (sampled at 4 Hz); (4) IBI—interbeat intervals, which represent the time interval between individual beats of the heart (intermittent output with 1/64-second resolution); (5) TEMP—data from temperature sensor expressed in the °C scale (sampled at 4 Hz); and (6) HR—These data contain the average heart rate values, computed in spans of 10 seconds.</p>
        <p>The window length for this scenario was selected to be 500 samples. This analysis was performed on 2954 500-sample segments after making all signals in the same size with sample frequency of 64 Hz. Segments were picked so that 1000 of them contained sleeping intervals, and 1000 of them captured during working with computer and others were during eating episodes.</p>
        <p>The deep learning architecture used in this scenario was a deep residual network. The proposed deep learning architecture for image-to-label classification is presented in <xref rid="figure1" ref-type="fig">Figure 1</xref> and consisted of a deep residual network with 3 2D convolution layers, followed by batch normalization, ReLU, max pooling, and fully connected layers. The 2D convolutional layer applied sliding convolutional filters to the input contour image. The output of this network is a categorical response, and therefore a softmax and classification layers were also added as last layers. There is also a shortcut to jump over some layers.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Deep learning network architecture.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p><xref ref-type="table" rid="table1">Table 1</xref> provides detailed information about the proposed network layers. This information includes the sizes of layer activations. The training parameters of the deep learning model are given in <xref ref-type="table" rid="table2">Table 2</xref>. The mini-batch size and the maximum number of epochs were set to 100 and 10, respectively. Fivefold cross-validation was also used to check the performance of the model.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Detailed information about the layers of proposed network.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="100"/>
            <col width="450"/>
            <col width="450"/>
            <thead>
              <tr valign="top">
                <td>Number</td>
                <td>Layer type</td>
                <td>Activations</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>1</td>
                <td>Image input</td>
                <td>300 × 300 × 3</td>
              </tr>
              <tr valign="top">
                <td>2</td>
                <td>Convolution</td>
                <td>300 × 300 × 32</td>
              </tr>
              <tr valign="top">
                <td>3</td>
                <td>Batch normalization</td>
                <td>300 × 300 × 32</td>
              </tr>
              <tr valign="top">
                <td>4</td>
                <td>ReLU</td>
                <td>300 × 300 × 32</td>
              </tr>
              <tr valign="top">
                <td>5</td>
                <td>Convolution</td>
                <td>150 × 150 × 64</td>
              </tr>
              <tr valign="top">
                <td>6</td>
                <td>Batch normalization</td>
                <td>150 × 150 × 64</td>
              </tr>
              <tr valign="top">
                <td>7</td>
                <td>ReLU</td>
                <td>150 × 150 × 64</td>
              </tr>
              <tr valign="top">
                <td>8</td>
                <td>Convolution</td>
                <td>150 × 150 × 128</td>
              </tr>
              <tr valign="top">
                <td>9</td>
                <td>Batch normalization</td>
                <td>150 × 150 × 128</td>
              </tr>
              <tr valign="top">
                <td>10</td>
                <td>ReLU</td>
                <td>150 × 150 × 128</td>
              </tr>
              <tr valign="top">
                <td>11</td>
                <td>Convolution</td>
                <td>150 × 150 × 128</td>
              </tr>
              <tr valign="top">
                <td>12</td>
                <td>Addition</td>
                <td>150 × 150 × 128</td>
              </tr>
              <tr valign="top">
                <td>13</td>
                <td>Max pooling</td>
                <td>75 × 75 × 128</td>
              </tr>
              <tr valign="top">
                <td>14</td>
                <td>Fully connected</td>
                <td>1 × 1 × 500</td>
              </tr>
              <tr valign="top">
                <td>15</td>
                <td>Fully connected</td>
                <td>1 × 1 × 10</td>
              </tr>
              <tr valign="top">
                <td>16</td>
                <td>Fully connected</td>
                <td>1 × 1 × 3</td>
              </tr>
              <tr valign="top">
                <td>17</td>
                <td>Softmax</td>
                <td>1 × 1 × 3</td>
              </tr>
              <tr valign="top">
                <td>18</td>
                <td>Classification output</td>
                <td>—<sup>a</sup></td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>—: Not available</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>The model training parameters.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Parameter</td>
                <td>Value</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Initial learn rate</td>
                <td>0.001</td>
              </tr>
              <tr valign="top">
                <td>Learn rate drop factor</td>
                <td>0.1</td>
              </tr>
              <tr valign="top">
                <td>Learn rate drop period</td>
                <td>2</td>
              </tr>
              <tr valign="top">
                <td>Mini batch size</td>
                <td>100</td>
              </tr>
              <tr valign="top">
                <td>Max epochs</td>
                <td>10</td>
              </tr>
              <tr valign="top">
                <td>Learn rate schedule</td>
                <td>Piecewise</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Second Scenario for Evaluation of Algorithm</title>
        <p>In the second scenario, an open data set associated with the activities of daily living was considered. The data set was collected from 10 healthy participants, performing 186 activities of daily living while wearing 9-axis inertial measurement units on both left and right arms [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>The considered activities can be grouped into 4 separate categories: (1) mobility, including walking, sitting down and standing up, and opening and closing the door; (2) eating, including pouring water and drinking from glass; (3) personal hygiene, including brushing teeth; and (4) housework, including cleaning the table [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>The recorded data include quaternions (with resolution of 0.0001), accelerations along the x, y, and z axes (with resolution of 0.1 mG), and angular velocity along the x, y, and z axes (with resolution of 0.01 degrees per second) [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>Data annotation for all the experiments was manually performed based on videos recorded by an RGB camera [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
        <p>The window length for this scenario was selected to be 50 samples. This analysis was performed on 4478 50-sample segments. Segments were picked so that 1132 segments contained walking episodes, 20 segments contained sitting down episodes, 16 segments contained standing up episodes, 366 segments contained opening the door episodes, 400 segments contained closing the door episodes, 1208 segments contained pouring water and drinking from glass episodes, 704 segments contained brushing teeth episodes, and 632 segments contained cleaning the table episodes.</p>
        <p>As training from the scratch on relatively small-scale data sets is susceptible to overfitting, a pretrained model for extracting deep features was suggested in this scenario. The deep learning architecture used in this section was the InceptionResNetV2 pretrained model. This pretrained classification network has already learned on more than 1 million images. As this network was trained on extremely large data sets, it is capable of being served as a generic model. Therefore, this section used layer activation of the pretrained InceptionResNetV2 architecture as features to train a support vector machine for classifying different activities. The parallel computing platform of Tesla P100 PCIe 16 GB was used for implementing this deep structure. The depth, size, and number of parameters in the pretrained InceptionResNetV2 network were 164, 209 MB, and 55.9 M, respectively. Leave-one-subject-out cross-validation was considered for performance evaluation of classification.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Applying the Proposed Algorithm on the First Scenario</title>
        <p>Signals captured from different sensors during eating, sleeping, and working with computer are plotted in <xref rid="figure2" ref-type="fig">Figure 2</xref>. This figure illustrates how characteristics of data coming from different sources vary a lot. <xref rid="figure3" ref-type="fig">Figure 3</xref> shows how the values in the eating-related data captured by different sensors are spread out in their boxplots, and how their distributions differ from each other. As these signals cannot be described by the same distribution, they are said to be heterogeneous. This heterogeneity brings up the issue of how to integrate the information from such diverse modalities. This spread in the range of scales across the various modalities causes a simple approach to be not enough for reliable activity detection and a therefore a more sophisticated technique is required.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Time series amplitude of each modality captured during 1 episode of 3 different activities of eating, sleeping, and working with computer (the number of samples per second is 64).</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Distribution of data captured by different sensors for a portion of eating episode.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p><xref rid="figure4" ref-type="fig">Figure 4</xref> shows the preprocessing steps performed on the raw data to prepare input data for a 2D deep residual network. As shown in <xref rid="figure5" ref-type="fig">Figure 5</xref>, covariance coefficients between channels were first derived and presented in the form of contour map. The obtained image was fed to a deep network as input image.</p>
        <p><xref rid="figure5" ref-type="fig">Figure 5</xref> shows examples of covariance coefficients contour generated from different modalities. The horizontal and vertical axes represent the sample number. The value of correlation coefficients is represented by the color, with dark colors corresponding to low values and bright colors corresponding to high values. As seen in figures, there is a visible difference in the color patterns of correlation coefficients contour for different activities.</p>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Generating covariance coefficients contour for a 500-sample eating episode (pairwise covariance was calculated between each sample across all signals).</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Examples of covariance coefficients contour for different activities. (A) Eating; (B) Working with computer; (C) Sleeping.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>The performance metrics variations including epoch number, iteration number, time elapsed, mini-batch accuracy, validation accuracy, and loss function value for the validation data are plotted in <xref rid="figure6" ref-type="fig">Figure 6</xref>. The number of epochs was chosen to be 10 over 200 iterations. The training and testing proportions, being considered as 70% and 30%, respectively, were randomly assigned from each label. The training data were also shuffled before every epoch. Learning rate was reduced over epochs and its speed was updated by decreasing the learning rate, and multiplying it by a fractional learn rate drop factor over a specific number of epochs. According to <xref rid="figure6" ref-type="fig">Figure 6</xref>, the small validation loss allows to conclude that this method has generalization capability.</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Deep learning model performance over observations in the mini-batch.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>Convergence of average accuracy and loss function during training and validation for 10 epochs was plotted in <xref rid="figure7" ref-type="fig">Figures 7</xref> and <xref rid="figure8" ref-type="fig">8</xref>. The result of the covariance-based model has rapidly converged to a stable value with no sign of overfitting.</p>
        <p>Confusion matrix in <xref rid="figure9" ref-type="fig">Figure 9</xref> shows the results obtained from validation data sets of covariance coefficients contour.</p>
        <fig id="figure7" position="float">
          <label>Figure 7</label>
          <caption>
            <p>Accuracy variation in each epoch of deep residual network with input images of covariance coefficients contour.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure8" position="float">
          <label>Figure 8</label>
          <caption>
            <p>Loss function variation in each epoch of deep residual network with input images of covariance coefficients contour.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure9" position="float">
          <label>Figure 9</label>
          <caption>
            <p>Confusion matrix for the validation set of deep residual network with input images of covariance coefficients contour.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Applying the Proposed Algorithm on the Second Scenario</title>
        <p><xref rid="figure10" ref-type="fig">Figure 10</xref> shows an example of covariance map generated from different modalities in the second scenario.</p>
        <p>The visualization of performance of the fusion method applied on the second scenario is plotted in <xref rid="figure11" ref-type="fig">Figure 11</xref> and shows how the algorithm is confusing 2 classes.</p>
        <p>The elapsed time for the training process of the model was 39.2714 seconds. The latency for making decision on the new input was 0.1459 seconds. Various statistics calculated from the confusion matrix for a comprehensive study are listed in <xref ref-type="table" rid="table3">Table 3</xref>. Based on classification results, it is possible to find how well classification of different activities was done by taking advantage of the proposed sensor fusion.</p>
        <fig id="figure10" position="float">
          <label>Figure 10</label>
          <caption>
            <p>Covariance map for a 50-sample walking episode (pairwise covariance was calculated between each signal across all samples was taken into consideration).</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig10.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure11" position="float">
          <label>Figure 11</label>
          <caption>
            <p>The results of applying pretrained deep learning architecture on the fused data.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig11.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Comprehensive study of pretrained deep learning classifier’s performance.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Metrics of classifier’s performance</td>
                <td>Values</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Accuracy</td>
                <td>0.95083</td>
              </tr>
              <tr valign="top">
                <td>Precision (positive predictive value)</td>
                <td>0.80335</td>
              </tr>
              <tr valign="top">
                <td>False discovery rate</td>
                <td>0.19664</td>
              </tr>
              <tr valign="top">
                <td>False omission rate</td>
                <td>0.02809</td>
              </tr>
              <tr valign="top">
                <td>Negative predictive value</td>
                <td>0.97190</td>
              </tr>
              <tr valign="top">
                <td>Prevalence</td>
                <td>0.12500</td>
              </tr>
              <tr valign="top">
                <td>Recall (hit rate, sensitivity, true positive rate)</td>
                <td>0.80335</td>
              </tr>
              <tr valign="top">
                <td>False-positive rate (fall-out)</td>
                <td>0.02809</td>
              </tr>
              <tr valign="top">
                <td>Positive likelihood ratio</td>
                <td>28.5965</td>
              </tr>
              <tr valign="top">
                <td>False-negative rate (miss rate)</td>
                <td>0.19664</td>
              </tr>
              <tr valign="top">
                <td>True-negative rate (specificity)</td>
                <td>0.97190</td>
              </tr>
              <tr valign="top">
                <td>Negative likelihood ratio</td>
                <td>0.20233</td>
              </tr>
              <tr valign="top">
                <td>Diagnostic odds ratio</td>
                <td>141.334</td>
              </tr>
              <tr valign="top">
                <td>Informedness</td>
                <td>0.77525</td>
              </tr>
              <tr valign="top">
                <td>Markedness</td>
                <td>0.77525</td>
              </tr>
              <tr valign="top">
                <td>F-score</td>
                <td>0.80335</td>
              </tr>
              <tr valign="top">
                <td>G-measure</td>
                <td>0.80335</td>
              </tr>
              <tr valign="top">
                <td>Matthews correlation coefficient</td>
                <td>0.77525</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Comparison With Similar Studies</title>
        <p>Data captured by different sensors in order to detect eating intervals have been explored by many studies. These studies focused on analyzing several types of data captured by different sensors from accelerometers and gyroscopes to respiratory inductance plethysmography and oral cavity. However, as seen in <xref ref-type="table" rid="table3">Table 3</xref>, the number of modalities involved in detecting food intake intervals has been up to 2. Therefore, this study investigated whether eating event detection by simultaneous processing of 8 different modalities (eg, 3-axis accelerometer sensor, photoplethysmography, electrodermal activity sensor, interbeat intervals, temperature sensor and heart rate) is feasible. The obtained results showed an overall validation accuracy comparable to the approaches proposed earlier in the literature (<xref ref-type="table" rid="table4">Table 4</xref>). Furthermore, the proposed data fusion framework in this research provided a simple way of integrating multiple data sources applicable for deep learning methods in human activity monitoring, while previous studies focused on applying raw data. When it comes to cloud computing as well as big data for the purpose of human activity monitoring using wearable sensor-based technologies, the cost of directly applying high-dimensional raw data to a deep classifier would be computationally expensive.</p>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Comparison of previous studies on food intake episodes detection.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="70"/>
            <col width="330"/>
            <col width="500"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td>Study</td>
                <td>Modalities</td>
                <td>Method</td>
                <td>Accuracy, %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref32">32</xref>]</td>
                <td>Acoustic signal</td>
                <td>Correlation matching</td>
                <td>85</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref33">33</xref>]</td>
                <td>Food image and speech recording</td>
                <td>Support vector machine classification</td>
                <td>90.6</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref34">34</xref>]</td>
                <td>Electroglottograph</td>
                <td>Artificial neural network</td>
                <td>86.6</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref35">35</xref>]</td>
                <td>Piezoelectricity</td>
                <td>Time and amplitude thresholding</td>
                <td>86</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref36">36</xref>]</td>
                <td>Accelerometer and gyroscope</td>
                <td>Decision tree classifier</td>
                <td>85.5</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref37">37</xref>]</td>
                <td>Chewing sound</td>
                <td>(1) Deep Boltzmann and (2) Machine with deep neural network classifier</td>
                <td>77</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref38">38</xref>]</td>
                <td>Piezoelectricity</td>
                <td>Convolutional neural network</td>
                <td>91.9</td>
              </tr>
              <tr valign="top">
                <td>[<xref ref-type="bibr" rid="ref39">39</xref>]</td>
                <td>Acceleration and orientation velocity</td>
                <td>Convolutional-recurrent neural network</td>
                <td>82.5-96.4</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Investigating the Effect of Missing Values</title>
        <p>The proposed data fusion technique also has the challenge of data imperfection, which could be overcome by using data imputation methods. Missing samples can affect the contour representation of covariance matrix to a great extent which makes it necessary to be recovered using missing value filling methods.</p>
        <p><xref rid="figure12" ref-type="fig">Figure 12</xref> demonstrates how the moving median method (as a sample of interpolation methods) can recover the contour representation suffered from the missing data. The moving median was done over a window of length 20. However, there is still a huge gap for addressing the issue of data inconsistencies, which will let the gates open for future studies.</p>
        <p><xref ref-type="table" rid="table5">Table 5</xref> shows the impact of missing data without using any imputation on performance degradation in the second scenario.</p>
        <fig id="figure12" position="float">
          <label>Figure 12</label>
          <caption>
            <p>Contour representation (A and C) before and (B and D) after applying moving median for missing data.</p>
          </caption>
          <graphic xlink:href="mhealth_v9i1e21926_fig12.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Impact of missing data on performance degradation.</p>
          </caption>
          <table border="1" rules="groups" cellpadding="5" frame="hsides" width="1000" cellspacing="0">
            <col width="400"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td rowspan="2">Metrics of classifier’s performance</td>
                <td colspan="6">Missing value percentage</td>
              </tr>
              <tr valign="top">
                <td>0</td>
                <td>1.11</td>
                <td>2.22</td>
                <td>8.33</td>
                <td>15.5</td>
                <td>25</td>
              </tr>
              <tr valign="top">
                <td/>
                <td/>
                <td/>
                <td/>
                <td/>
                <td/>
                <td/>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Accuracy</td>
                <td>0.95083</td>
                <td>0.91400</td>
                <td>0.89591</td>
                <td>0.89533</td>
                <td>0.88501</td>
                <td>0.88326</td>
              </tr>
              <tr valign="top">
                <td>Precision (positive predictive value)</td>
                <td>0.80335</td>
                <td>0.65603</td>
                <td>0.58365</td>
                <td>0.58132</td>
                <td>0.54007</td>
                <td>0.53307</td>
              </tr>
              <tr valign="top">
                <td>False discovery rate</td>
                <td>0.19664</td>
                <td>0.34396</td>
                <td>0.41634</td>
                <td>0.41867</td>
                <td>0.45992</td>
                <td>0.46692</td>
              </tr>
              <tr valign="top">
                <td>False omission rate</td>
                <td>0.02809</td>
                <td>0.04913</td>
                <td>0.05947</td>
                <td>0.05981</td>
                <td>0.06570</td>
                <td>0.06670</td>
              </tr>
              <tr valign="top">
                <td>Negative predictive value</td>
                <td>0.97190</td>
                <td>0.95086</td>
                <td>0.94052</td>
                <td>0.94018</td>
                <td>0.93429</td>
                <td>0.93329</td>
              </tr>
              <tr valign="top">
                <td>Prevalence</td>
                <td>0.12500</td>
                <td>0.12500</td>
                <td>0.12500</td>
                <td>0.12500</td>
                <td>0.12500</td>
                <td>0.12500</td>
              </tr>
              <tr valign="top">
                <td>Recall (hit rate, sensitivity, true-positive rate)</td>
                <td>0.80335</td>
                <td>0.65603</td>
                <td>0.58365</td>
                <td>0.58132</td>
                <td>0.54007</td>
                <td>0.53307</td>
              </tr>
              <tr valign="top">
                <td>False positive rate (fall-out)</td>
                <td>0.02809</td>
                <td>0.04913</td>
                <td>0.05947</td>
                <td>0.05981</td>
                <td>0.06570</td>
                <td>0.06670</td>
              </tr>
              <tr valign="top">
                <td>Positive likelihood ratio</td>
                <td>28.5965</td>
                <td>13.3506</td>
                <td>9.81308</td>
                <td>9.71933</td>
                <td>8.21996</td>
                <td>7.99166</td>
              </tr>
              <tr valign="top">
                <td>False-negative rate (miss rate)</td>
                <td>0.19664</td>
                <td>0.34396</td>
                <td>0.41634</td>
                <td>0.41867</td>
                <td>0.45992</td>
                <td>0.46692</td>
              </tr>
              <tr valign="top">
                <td>True-negative rate (specificity)</td>
                <td>0.97190</td>
                <td>0.95086</td>
                <td>0.94052</td>
                <td>0.94018</td>
                <td>0.93429</td>
                <td>0.93329</td>
              </tr>
              <tr valign="top">
                <td>Negative likelihood ratio</td>
                <td>0.20233</td>
                <td>0.36174</td>
                <td>0.44267</td>
                <td>0.44531</td>
                <td>0.49226</td>
                <td>0.50029</td>
              </tr>
              <tr valign="top">
                <td>Diagnostic odds ratio</td>
                <td>141.334</td>
                <td>36.9063</td>
                <td>22.1678</td>
                <td>21.8259</td>
                <td>16.6982</td>
                <td>15.9738</td>
              </tr>
              <tr valign="top">
                <td>Informedness</td>
                <td>0.77525</td>
                <td>0.60689</td>
                <td>0.52418</td>
                <td>0.52151</td>
                <td>0.47437</td>
                <td>0.46637</td>
              </tr>
              <tr valign="top">
                <td>Markedness</td>
                <td>0.77525</td>
                <td>0.60689</td>
                <td>0.52418</td>
                <td>0.52151</td>
                <td>0.47437</td>
                <td>0.46637</td>
              </tr>
              <tr valign="top">
                <td><italic>F</italic>-score</td>
                <td>0.80335</td>
                <td>0.65603</td>
                <td>0.58365</td>
                <td>0.58132</td>
                <td>0.54007</td>
                <td>0.53307</td>
              </tr>
              <tr valign="top">
                <td>G-measure</td>
                <td>0.80335</td>
                <td>0.65603</td>
                <td>0.58365</td>
                <td>0.58132</td>
                <td>0.54007</td>
                <td>0.53307</td>
              </tr>
              <tr valign="top">
                <td>Matthews correlation coefficient</td>
                <td>0.77525</td>
                <td>0.60689</td>
                <td>0.52418</td>
                <td>0.52151</td>
                <td>0.47437</td>
                <td>0.46637</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Recent advances in biosensor technologies [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref41">41</xref>] and consumer electronics have led to precise physiological monitoring and more specifically accurate activity recognition. Activity recognition based on wearable device is one of the most rapidly growing research areas in personalization of analyses. Physical characteristics, health state, lifestyle, moving style, and gender are parameters that can be highly personalized. Therefore, in order to consider generalization of prediction or classification models, the data should be labeled personally, and the focus of research should be more on personalized analysis [<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref43">43</xref>]. One way to personalize data is automatic identification of human activities and consequently labeling data based on different activities.</p>
        <p>Regarding human activity recognition, we are facing upcoming transition from analyzing single modality to processing data collected from multiple sources with enormous diversity in terms of information, size, and behavior. This increases the complexity of classification problems and requires low-level data fusion to simultaneously integrate significant information in all modalities, and yet compressing the data directly at the source. This fusion process is important in a sense that reduction of communication load to other device or to the cloud requires local extraction of information from raw data stream in the sensor level. Therefore, fused raw data in a compressed form are super important in terms of minimizing the amount of data needed to be stored or needed to be sent. It is also important in saving battery power and reducing transmission time.</p>
        <p>Regarding the importance of implementing a low-level fusion method with simple structure, this study presented a general framework for implementing efficient fusion based on covariance map. The promising classification results reached precision of 80.3% and showed that global 2D covariance representation can reliably quantify the difference between activities, as it provides a simple abstract representation of correlation over modalities.</p>
        <p>For performance assessment of the proposed algorithm, the method was implemented on 2 separate scenarios. These scenarios were different regarding the temporal segment size, type of activity, wearable device, subjects, and deep learning architecture. The obtained results showed the ability of the proposed fusion technique to generalize to other data sets with different modalities, participants, and tasks.</p>
      </sec>
      <sec>
        <title>Limitations in Existing Literature</title>
        <p>There are many ways of integrating modalities for activity recognition task [<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref57">57</xref>], with the 3 major groups being sensor-level [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>], feature-level [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref57">57</xref>], and decision-level [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref56">56</xref>] fusion. Fusion at the decision level is the most frequently used method which takes advantage of training machine learning and deep learning models for each modality. When it comes to merging scores of these networks for the purpose of data fusion, the practical applications are limited by their complex process which lead to more computationally heavy processing and make them inapplicable for implementing on low-power systems. Therefore, such techniques cannot be considered as low-level data fusion.</p>
        <p>There are only a few methods for low-level data fusion, with 2 focused on using Bayesian network for sensor-level fusion [<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref50">50</xref>]. These Bayesian networks usually involve a time-consuming process of hyperparameter tuning. Correctly implementing hyperparameter optimization is usually complex and computationally expensive. A small change in the values of hyperparameters can highly affect the performance of model. In this sense, it could be said that the low-level fusion methods with simple structure can outperform sophisticated ones.</p>
      </sec>
      <sec>
        <title>Strengths of the Proposed Method</title>
        <p>Unlike complex fusion techniques based on evolutionary computation [<xref ref-type="bibr" rid="ref48">48</xref>], machine learning approaches [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref51">51</xref>,<xref ref-type="bibr" rid="ref53">53</xref>,<xref ref-type="bibr" rid="ref54">54</xref>], Bayesian models [<xref ref-type="bibr" rid="ref44">44</xref>,<xref ref-type="bibr" rid="ref45">45</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref55">55</xref>], Kalman filtering [<xref ref-type="bibr" rid="ref49">49</xref>], and neural networks [<xref ref-type="bibr" rid="ref46">46</xref>], the proposed fusion method had very simple implementing procedure, and yet capable of revealing the common trends and similarities among recorded modalities. It was also free of the number and type of sensors used for collecting data. This could be an important benefit as there is high diversity in sensor technology deployed for activity recognition and the choice of sensors vary a lot from one case to another. The sensors used in activity recognition studies include vibration and contact sensor [<xref ref-type="bibr" rid="ref44">44</xref>], tap sensor [<xref ref-type="bibr" rid="ref45">45</xref>], motion sensor [<xref ref-type="bibr" rid="ref46">46</xref>], ventilation sensor [<xref ref-type="bibr" rid="ref47">47</xref>], heart rate sensor [<xref ref-type="bibr" rid="ref48">48</xref>], magnetometer sensor [<xref ref-type="bibr" rid="ref49">49</xref>], temperature sensor [<xref ref-type="bibr" rid="ref50">50</xref>], electrocardiogram sensor [<xref ref-type="bibr" rid="ref51">51</xref>], accelerometer sensor [<xref ref-type="bibr" rid="ref52">52</xref>], and gyroscope [<xref ref-type="bibr" rid="ref54">54</xref>]. Furthermore, this method is universal in a sense that it can cover a wide spectrum of problems including tracking activity of daily living, elderly monitoring, fall detection, smart home, ambient assisted living, behavior analysis, among others. It could help in decreasing the final cost of the monitoring framework by deploying fusion in the first step of classification process (applying fusion algorithm in the final step needs independently analyzing data for every single component and combining the final results which make the implementation computationally expensive). Providing the possibility of visually representing the correlation among modalities and reducing dimension by embedding the sensory data in just a single 2D representation can be considered as other strengths of the studied technique.</p>
      </sec>
      <sec>
        <title>Future Work</title>
        <p>A limitation to this research is that both tested scenarios were performed on healthy volunteers, which may be far from the cases including actual patients who suffer from movement disability or major health problem. This could be included in future work.</p>
        <p>Future research direction will also include implementing the fusion algorithms for the scenarios in which one or more modalities are missing. The applicability of the findings will be also tested for other problems rather than activity recognition.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <ack>
      <p>This work was supported by a grant (No. 308935) from the Academy of Finland and Infotech, and Orion Research Foundation sr, Oulu, Finland.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van den Boer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van der Lee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Papapanagiotou</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Diou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Delopoulos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Mars</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>The SPLENDID Eating Detection Sensor: Development and Feasibility Study</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2018</year>
          <month>09</month>
          <day>04</day>
          <volume>6</volume>
          <issue>9</issue>
          <fpage>e170</fpage>
          <pub-id pub-id-type="doi">10.2196/mhealth.9781</pub-id>
          <pub-id pub-id-type="medline">30181111</pub-id>
          <pub-id pub-id-type="pii">v6i9e170</pub-id>
          <pub-id pub-id-type="pmcid">PMC6231803</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Selamat</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>SHM</given-names>
            </name>
          </person-group>
          <article-title>Automatic Food Intake Monitoring Based on Chewing Activity: A Survey</article-title>
          <source>IEEE Access</source>
          <year>2020</year>
          <volume>8</volume>
          <fpage>48846</fpage>
          <lpage>48869</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2020.2978260</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bell</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Alam</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Alshurafa</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Thomaz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Mondol</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>de la Haye</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Stankovic</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Lach</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Spruijt-Metz</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Automatic, wearable-based, in-field eating detection approaches for public health research: a scoping review</article-title>
          <source>NPJ Digit Med</source>
          <year>2020</year>
          <month>3</month>
          <day>13</day>
          <volume>3</volume>
          <issue>1</issue>
          <fpage>38</fpage>
          <pub-id pub-id-type="doi">10.1038/s41746-020-0246-2</pub-id>
          <pub-id pub-id-type="medline">32195373</pub-id>
          <pub-id pub-id-type="pii">246</pub-id>
          <pub-id pub-id-type="pmcid">PMC7069988</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chun</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Bhattacharya</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Thomaz</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Detecting Eating Episodes by Tracking Jawbone Movements with a Non-Contact Wearable Sensor</article-title>
          <source>Proc. ACM Interact. Mob. Wearable Ubiquitous Technol</source>
          <year>2018</year>
          <month>03</month>
          <day>26</day>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>21</lpage>
          <pub-id pub-id-type="doi">10.1145/3191736</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
          </person-group>
          <article-title>Your Glasses Know Your Diet: Dietary Monitoring Using Electromyography Sensors</article-title>
          <source>IEEE Internet Things J</source>
          <year>2017</year>
          <month>6</month>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>705</fpage>
          <lpage>712</lpage>
          <pub-id pub-id-type="doi">10.1109/jiot.2017.2656151</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Prioleau</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ghovanloo</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Unobtrusive and Wearable Systems for Automatic Dietary Monitoring</article-title>
          <source>IEEE Trans. Biomed. Eng</source>
          <year>2017</year>
          <month>9</month>
          <volume>64</volume>
          <issue>9</issue>
          <fpage>2075</fpage>
          <lpage>2089</lpage>
          <pub-id pub-id-type="doi">10.1109/tbme.2016.2631246</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pasler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fischer</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Food Intake Monitoring: Automated Chew Event Detection in Chewing Sounds</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2014</year>
          <month>1</month>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>278</fpage>
          <lpage>289</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2013.2268663</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Amft</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>A wearable earpad sensor for chewing monitoring</article-title>
          <year>2010</year>
          <month>11</month>
          <day>1</day>
          <conf-name>SENSORS, 2010 IEEE</conf-name>
          <conf-date>November 1-4, 2010</conf-date>
          <conf-loc>Waikoloa, HI</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <pub-id pub-id-type="doi">10.1109/jsen.2011.2172411</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farooq</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Sazonov</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Segmentation and Characterization of Chewing Bouts by Monitoring Temporalis Muscle Using Smart Glasses With Piezoelectric Sensor</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2017</year>
          <month>11</month>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>1495</fpage>
          <lpage>1503</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2016.2640142</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Amft</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Monitoring Chewing and Eating in Free-Living Using Smart Eyeglasses</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2018</year>
          <month>1</month>
          <volume>22</volume>
          <issue>1</issue>
          <fpage>23</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2017.2698523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fan</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Lach</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Eating gestures detection by tracking finger motion</article-title>
          <year>2016</year>
          <conf-name>2016 IEEE Wireless Health (WH)</conf-name>
          <conf-date>October 25-27, 2016</conf-date>
          <conf-loc>Bethesda, MD</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>1</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1109/WH.2016.7764549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Parate</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ganesan</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Rehg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Kumar</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Detecting eating and smoking behaviors using smartwatches</article-title>
          <source>Mobile Health</source>
          <year>2017</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>175</fpage>
          <lpage>201</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heydarian</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Adam</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Burrows</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Collins</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rollo</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>Assessing Eating Behaviour Using Upper Limb Mounted Motion Sensors: A Systematic Review</article-title>
          <source>Nutrients</source>
          <year>2019</year>
          <month>05</month>
          <day>24</day>
          <volume>11</volume>
          <issue>5</issue>
          <fpage>1168</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=nu11051168"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/nu11051168</pub-id>
          <pub-id pub-id-type="medline">31137677</pub-id>
          <pub-id pub-id-type="pii">nu11051168</pub-id>
          <pub-id pub-id-type="pmcid">PMC6566929</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Amft</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Free-living eating event spotting using EMG-monitoring eyeglasses</article-title>
          <year>2018</year>
          <conf-name>2018 IEEE EMBS International Conference on Biomedical &#38; Health Informatics (BHI)</conf-name>
          <conf-date>March 4-7, 2018</conf-date>
          <conf-loc>Las Vegas, NV</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>128</fpage>
          <lpage>132</lpage>
          <pub-id pub-id-type="doi">10.1109/bhi.2018.8333386</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Assisting food journaling with automatic eating detection, in Proceedings of the 2016 CHI Conference Extended Abstracts on Human Factors in Computing Systems, 3255?3262, 2016</article-title>
          <year>2016</year>
          <conf-name>CHI EA '16: Proceedings of the 2016 CHI Conference Extended Abstracts on Human Factors in Computing Systems</conf-name>
          <conf-date>May 2016</conf-date>
          <conf-loc>San Jose, CA</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>3255</fpage>
          <lpage>3262</lpage>
          <pub-id pub-id-type="doi">10.1145/2851581.2892426</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thomaz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Essa</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Abowd</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>A Practical Approach for Recognizing Eating Moments with Wrist-Mounted Inertial Sensing</article-title>
          <source>Proc ACM Int Conf Ubiquitous Comput</source>
          <year>2015</year>
          <month>09</month>
          <volume>2015</volume>
          <fpage>1029</fpage>
          <lpage>1040</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29520397"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2750858.2807545</pub-id>
          <pub-id pub-id-type="medline">29520397</pub-id>
          <pub-id pub-id-type="pmcid">PMC5839104</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Schiboni</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Wasner</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Amft</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>A Privacy-Preserving Wearable Camera Setup for Dietary Event Spotting in Free-Living</article-title>
          <year>2018</year>
          <month>03</month>
          <day>19</day>
          <conf-name>2018 IEEE International Conference on Pervasive Computing and Communications Workshops (PerCom Workshops)</conf-name>
          <conf-date>March 19-23, 2018</conf-date>
          <conf-loc>Athens, Greece</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <pub-id pub-id-type="doi">10.1109/percomw.2018.8480222</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jasper</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Muth</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Hoover</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Automatic Detection of Periods of Eating Using Wrist Motion Tracking</article-title>
          <year>2016</year>
          <month>06</month>
          <day>27</day>
          <conf-name>2016 IEEE First International Conference on Connected Health: Applications, Systems and Engineering Technologies (CHASE)</conf-name>
          <conf-date>June 27-29, 2016</conf-date>
          <conf-loc>Washington, DC, USA</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>A</fpage>
          <pub-id pub-id-type="doi">10.1109/chase.2016.15</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Subbaraju</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Misra</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Balan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Annapurna: Building a Real-World Smartwatch-Based Automated Food Journal</article-title>
          <year>2018</year>
          <month>06</month>
          <day>12</day>
          <conf-name>2018 IEEE 19th International Symposium on</conf-name>
          <conf-date>June 12-15, 2018</conf-date>
          <conf-loc>Chania, Greece</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <pub-id pub-id-type="doi">10.1109/wowmom.2018.8449755</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Navarathna</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Bequette</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Wearable Device Based Activity Recognition and Prediction for Improved Feedforward Control</article-title>
          <year>2018</year>
          <month>06</month>
          <day>27</day>
          <conf-name>2018 Annual American Control Conference (ACC)</conf-name>
          <conf-date>June 27-29, 2018</conf-date>
          <conf-loc>Milwaukee, WI</conf-loc>
          <pub-id pub-id-type="doi">10.23919/acc.2018.8430775</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mirtchouk</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lustig</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ching</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Zheng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kleinberg</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Recognizing Eating from Body-Worn Sensors</article-title>
          <source>Proc. ACM Interact. Mob. Wearable Ubiquitous Technol</source>
          <year>2017</year>
          <month>09</month>
          <day>11</day>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>20</lpage>
          <pub-id pub-id-type="doi">10.1145/3131894</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sazonov</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Fontana</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>A Sensor System for Automatic Detection of Food Intake Through Non-Invasive Monitoring of Chewing</article-title>
          <source>IEEE Sensors J</source>
          <year>2012</year>
          <month>05</month>
          <volume>12</volume>
          <issue>5</issue>
          <fpage>1340</fpage>
          <lpage>1348</lpage>
          <pub-id pub-id-type="doi">10.1109/jsen.2011.2172411</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lopez-Meyer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schuckers</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Makeyev</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Sazonov</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Detection of periods of food intake using Support Vector Machines</article-title>
          <year>2010</year>
          <month>08</month>
          <day>31</day>
          <conf-name>2010 Annual International Conference of the IEEE Engineering in Medicine and Biology</conf-name>
          <conf-date>August 31 to September 4, 2010</conf-date>
          <conf-loc>Buenos Aires, Argentina</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <pub-id pub-id-type="doi">10.1109/chase.2016.14</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bedri</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Verlekar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thomaz</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Avva</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Starner</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Detecting Mastication: A Wearable Approach</article-title>
          <year>2015</year>
          <month>11</month>
          <day>13</day>
          <conf-name>Proceedings of the 2015 ACM on International Conference on Multimodal Interaction</conf-name>
          <conf-date>November 13, 2015</conf-date>
          <conf-loc>Seattle, WA</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>ACM</publisher-name>
          <fpage>247</fpage>
          <pub-id pub-id-type="doi">10.1145/2818346.2820767</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Papapanagiotou</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Diou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>van den Boer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Mars</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Delopoulos</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A Novel Chewing Detection System Based on PPG, Audio, and Accelerometry</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2017</year>
          <month>5</month>
          <volume>21</volume>
          <issue>3</issue>
          <fpage>607</fpage>
          <lpage>618</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2016.2625271</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chung</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Yoo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Bang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A glasses-type wearable device for monitoring the patterns of food intake and facial activity</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>01</month>
          <day>30</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>41690</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/srep41690"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep41690</pub-id>
          <pub-id pub-id-type="medline">28134303</pub-id>
          <pub-id pub-id-type="pii">srep41690</pub-id>
          <pub-id pub-id-type="pmcid">PMC5278398</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farooq</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fontana</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>A Comparative Study of Food Intake Detection Using Artificial Neural Network and Support Vector Machine</article-title>
          <year>2013</year>
          <month>12</month>
          <day>04</day>
          <conf-name>12th International Conference on Machine Learning and Applications</conf-name>
          <conf-date>December 4-7, 2013</conf-date>
          <conf-loc>Miami, FL</conf-loc>
          <pub-id pub-id-type="doi">10.1109/icmla.2013.33</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bedri</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Haynes</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kosaraju</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Grover</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Prioleau</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Beh</surname>
              <given-names>MY</given-names>
            </name>
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Starner</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Abowd</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>EarBit: Using Wearable Sensors to Detect Eating Episodes in Unconstrained Environments</article-title>
          <source>Proc ACM Interact Mob Wearable Ubiquitous Technol</source>
          <year>2017</year>
          <month>09</month>
          <day>11</day>
          <volume>1</volume>
          <issue>3</issue>
          <fpage>1</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30135957"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3130902</pub-id>
          <pub-id pub-id-type="medline">30135957</pub-id>
          <pub-id pub-id-type="pmcid">PMC6101257</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rouast</surname>
              <given-names>PV</given-names>
            </name>
            <name name-style="western">
              <surname>Adam</surname>
              <given-names>MTP</given-names>
            </name>
          </person-group>
          <article-title>Learning Deep Representations for Video-Based Intake Gesture Detection</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2020</year>
          <month>6</month>
          <volume>24</volume>
          <issue>6</issue>
          <fpage>1727</fpage>
          <lpage>1737</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2019.2942845</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ciocca</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Napoletano</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schettini</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Battiato</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Farinella</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Leo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gallo</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Learning CNN-based Features for Retrieval of Food Images</article-title>
          <source>New Trends in Image Analysis and Processing – ICIAP 2017</source>
          <year>2017</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>426</fpage>
          <lpage>434</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ruzzon</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Carfì</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ishikawa</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Mastrogiovanni</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Murakami</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A multi-sensory dataset for the activities of daily living</article-title>
          <source>Data Brief</source>
          <year>2020</year>
          <month>10</month>
          <volume>32</volume>
          <fpage>106122</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2352-3409(20)31016-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.dib.2020.106122</pub-id>
          <pub-id pub-id-type="medline">32904359</pub-id>
          <pub-id pub-id-type="pii">S2352-3409(20)31016-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC7452700</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Olubanjo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ghovanloo</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Detecting food intake acoustic events in noisy recordings using template matching</article-title>
          <year>2016</year>
          <month>02</month>
          <day>24</day>
          <conf-name>2016 IEEE-EMBS International Conference on Biomedical and Health Informatics (BHI)</conf-name>
          <conf-date>February 24-27, 2016</conf-date>
          <conf-loc>Las Vegas, NV</conf-loc>
          <pub-id pub-id-type="doi">10.1109/bhi.2016.7455916</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Puri</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Divakaran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sawhney</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Recognition and volume estimation of food intake using a mobile device</article-title>
          <year>2009</year>
          <month>12</month>
          <day>07</day>
          <conf-name>2009 Workshop on Applications of Computer Vision (WACV)</conf-name>
          <conf-date>December 7-8, 2009</conf-date>
          <conf-loc>Snowbird, UT</conf-loc>
          <pub-id pub-id-type="doi">10.1109/wacv.2009.5403087</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Farooq</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fontana</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Sazonov</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>A novel approach for food intake detection using electroglottography</article-title>
          <source>Physiol Meas</source>
          <year>2014</year>
          <month>05</month>
          <day>26</day>
          <volume>35</volume>
          <issue>5</issue>
          <fpage>739</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24671094"/>
          </comment>
          <pub-id pub-id-type="doi">10.1088/0967-3334/35/5/739</pub-id>
          <pub-id pub-id-type="medline">24671094</pub-id>
          <pub-id pub-id-type="pmcid">PMC4036630</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Subbaraju</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Misra</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Balan</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>The case for smartwatch-based diet monitoring</article-title>
          <year>2015</year>
          <month>03</month>
          <day>23</day>
          <conf-name>2015 IEEE International Conference on Pervasive Computing and Communication Workshops (PerCom Workshops)</conf-name>
          <conf-date>March 23-27, 2015</conf-date>
          <conf-loc>St. Louis, MO</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>585</fpage>
          <lpage>590</lpage>
          <pub-id pub-id-type="doi">10.1109/percomw.2015.7134103</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Cao</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>iHear foodating detection using commodity Bluetooth headsets</article-title>
          <year>2016</year>
          <conf-name>2016 IEEE First International Conference on Connected Health: Applications, Systems and Engineering Technologies (CHASE)</conf-name>
          <conf-date>June 27-29, 2016</conf-date>
          <conf-loc>Washington, DC</conf-loc>
          <publisher-loc>New York, NY</publisher-loc>
          <publisher-name>IEEE</publisher-name>
          <fpage>172</fpage>
          <pub-id pub-id-type="doi">10.1109/CHASE.2016.14</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Salakhutdinov</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Pereira</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Burges</surname>
              <given-names>CJC</given-names>
            </name>
            <name name-style="western">
              <surname>Bottou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Weinberger</surname>
              <given-names>KQ</given-names>
            </name>
          </person-group>
          <article-title>Multimodal learning with deep Boltzmann machines</article-title>
          <source>NIPS'12: Proceedings of the 25th International Conference on Neural Information Processing Systems (Volume 2)</source>
          <year>2012</year>
          <month>12</month>
          <publisher-loc>Red Hook, NY</publisher-loc>
          <publisher-name>Curran Associates Inc</publisher-name>
          <fpage>2222</fpage>
          <lpage>2230</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Maheshwari</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Memon</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Jabbar</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Javed</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A CNN Based Automated Activity and Food Recognition Using Wearable Sensor for Preventive Healthcare</article-title>
          <source>Electronics</source>
          <year>2019</year>
          <month>11</month>
          <day>29</day>
          <volume>8</volume>
          <issue>12</issue>
          <fpage>1425</fpage>
          <pub-id pub-id-type="doi">10.3390/electronics8121425</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kyritsis</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Diou</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Delopoulos</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A Data Driven End-to-End Approach for In-the-Wild Monitoring of Eating Behavior Using Smartwatches</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2021</year>
          <month>1</month>
          <volume>25</volume>
          <issue>1</issue>
          <fpage>22</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2020.2984907</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Asgari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fabritius</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Tunable Mid-Infrared Graphene Plasmonic Cross-Shaped Resonator for Demultiplexing Application</article-title>
          <source>Applied Sciences</source>
          <year>2020</year>
          <month>02</month>
          <day>10</day>
          <volume>10</volume>
          <issue>3</issue>
          <fpage>1193</fpage>
          <pub-id pub-id-type="doi">10.3390/app10031193</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Asgari</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Granpayeh</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Fabritius</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Controllable terahertz cross-shaped three-dimensional graphene intrinsically chiral metastructure and its biosensing application</article-title>
          <source>Optics Communications</source>
          <year>2020</year>
          <month>11</month>
          <volume>474</volume>
          <fpage>126080</fpage>
          <pub-id pub-id-type="doi">10.1016/j.optcom.2020.126080</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Habre</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Deng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Urman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Morrison</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gilliland</surname>
              <given-names>FD</given-names>
            </name>
            <name name-style="western">
              <surname>Ambite</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Stripelis</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chiang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bui</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>King</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hosseini</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Vliet</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Sarrafzadeh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Eckel</surname>
              <given-names>SP</given-names>
            </name>
          </person-group>
          <article-title>Applying Multivariate Segmentation Methods to Human Activity Recognition From Wearable Sensors' Data</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2019</year>
          <month>02</month>
          <day>07</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>e11201</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2019/2/e11201/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/11201</pub-id>
          <pub-id pub-id-type="medline">30730297</pub-id>
          <pub-id pub-id-type="pii">v7i2e11201</pub-id>
          <pub-id pub-id-type="pmcid">PMC6386646</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferrari</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Micucci</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Mobilio</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Napoletano</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>On the Personalization of Classification Models for Human Activity Recognition</article-title>
          <source>IEEE Access</source>
          <year>2020</year>
          <volume>8</volume>
          <fpage>32066</fpage>
          <lpage>32079</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2020.2973425</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>C-H</given-names>
            </name>
            <name name-style="western">
              <surname>Fu</surname>
              <given-names>L-C</given-names>
            </name>
          </person-group>
          <article-title>Robust Location-Aware Activity Recognition Using Wireless Sensor Network in an Attentive Home</article-title>
          <source>IEEE Trans. Automat. Sci. Eng</source>
          <year>2009</year>
          <month>10</month>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>598</fpage>
          <lpage>609</lpage>
          <pub-id pub-id-type="doi">10.1109/tase.2009.2021981</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liao</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Nugent</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Using the Dempster–Shafer Theory of Evidence With a Revised Lattice Structure for Activity Recognition</article-title>
          <source>IEEE Trans. Inform. Technol. Biomed</source>
          <year>2011</year>
          <month>01</month>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>74</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1109/titb.2010.2091684</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Sheng</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Wearable Sensor-Based Hand Gesture and Daily Activity Recognition for Robot-Assisted Living</article-title>
          <source>IEEE Trans. Syst., Man, Cybern. A</source>
          <year>2011</year>
          <month>05</month>
          <volume>41</volume>
          <issue>3</issue>
          <fpage>569</fpage>
          <lpage>573</lpage>
          <pub-id pub-id-type="doi">10.1109/tsmca.2010.2093883</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>RX</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Staudenmayer</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Freedson</surname>
              <given-names>PS</given-names>
            </name>
          </person-group>
          <article-title>Multisensor Data Fusion for Physical Activity Assessment</article-title>
          <source>IEEE Trans. Biomed. Eng</source>
          <year>2012</year>
          <month>03</month>
          <volume>59</volume>
          <issue>3</issue>
          <fpage>687</fpage>
          <lpage>696</lpage>
          <pub-id pub-id-type="doi">10.1109/tbme.2011.2178070</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chernbumroong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Cang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Genetic Algorithm-Based Classifiers Fusion for Multisensor Activity Recognition of Elderly People</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2015</year>
          <month>1</month>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>282</fpage>
          <lpage>289</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2014.2313473</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Motion Measurement Using Inertial Sensors, Ultrasonic Sensors, and Magnetometers With Extended Kalman Filter for Data Fusion</article-title>
          <source>IEEE Sensors J</source>
          <year>2012</year>
          <month>05</month>
          <volume>12</volume>
          <issue>5</issue>
          <fpage>943</fpage>
          <lpage>953</lpage>
          <pub-id pub-id-type="doi">10.1109/jsen.2011.2166066</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>De Paola</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ferraro</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gaglio</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Re</surname>
              <given-names>GL</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>SK</given-names>
            </name>
          </person-group>
          <article-title>An Adaptive Bayesian System for Context-Aware Data Fusion in Smart Environments</article-title>
          <source>IEEE Trans Mobile Comput</source>
          <year>2017</year>
          <month>6</month>
          <day>1</day>
          <volume>16</volume>
          <issue>6</issue>
          <fpage>1502</fpage>
          <lpage>1515</lpage>
          <pub-id pub-id-type="doi">10.1109/tmc.2016.2599158</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Peng</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Hierarchical Complex Activity Representation and Recognition Using Topic Model and Classifier Level Fusion</article-title>
          <source>IEEE Trans Biomed Eng</source>
          <year>2017</year>
          <month>6</month>
          <volume>64</volume>
          <issue>6</issue>
          <fpage>1369</fpage>
          <lpage>1379</lpage>
          <pub-id pub-id-type="doi">10.1109/tbme.2016.2604856</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chowdhury</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Tjondronegoro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Chandran</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Trost</surname>
              <given-names>SG</given-names>
            </name>
          </person-group>
          <article-title>Physical Activity Recognition Using Posterior-Adapted Class-Based Fusion of Multiaccelerometer Data</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2018</year>
          <month>5</month>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>678</fpage>
          <lpage>685</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2017.2705036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kanhangad</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Human Activity Classification in Smartphones Using Accelerometer and Gyroscope Sensors</article-title>
          <source>IEEE Sensors J</source>
          <year>2018</year>
          <month>2</month>
          <day>1</day>
          <volume>18</volume>
          <issue>3</issue>
          <fpage>1169</fpage>
          <lpage>1177</lpage>
          <pub-id pub-id-type="doi">10.1109/jsen.2017.2782492</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Cang</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>A Data Fusion-Based Hybrid Sensory System for Older People’s Daily Activity and Daily Routine Recognition</article-title>
          <source>IEEE Sensors J</source>
          <year>2018</year>
          <month>8</month>
          <day>15</day>
          <volume>18</volume>
          <issue>16</issue>
          <fpage>6874</fpage>
          <lpage>6888</lpage>
          <pub-id pub-id-type="doi">10.1109/jsen.2018.2833745</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Acharya</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mongan</surname>
              <given-names>WM</given-names>
            </name>
            <name name-style="western">
              <surname>Rasheed</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Anday</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dion</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fontecchio</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kurzweg</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dandekar</surname>
              <given-names>KR</given-names>
            </name>
          </person-group>
          <article-title>Ensemble Learning Approach via Kalman Filtering for a Passive Wearable Respiratory Monitor</article-title>
          <source>IEEE J. Biomed. Health Inform</source>
          <year>2019</year>
          <month>5</month>
          <volume>23</volume>
          <issue>3</issue>
          <fpage>1022</fpage>
          <lpage>1031</lpage>
          <pub-id pub-id-type="doi">10.1109/jbhi.2018.2857924</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>An</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A Multisensor Multiclassifier Hierarchical Fusion Model Based on Entropy Weight for Human Activity Recognition Using Wearable Inertial Sensors</article-title>
          <source>IEEE Trans. Human-Mach. Syst</source>
          <year>2019</year>
          <month>2</month>
          <volume>49</volume>
          <issue>1</issue>
          <fpage>105</fpage>
          <lpage>111</lpage>
          <pub-id pub-id-type="doi">10.1109/thms.2018.2884717</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Muaaz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chelli</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelgawwad</surname>
              <given-names>AA</given-names>
            </name>
            <name name-style="western">
              <surname>Mallofre</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Patzold</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>WiWeHAR: Multimodal Human Activity Recognition Using Wi-Fi and Wearable Sensing Modalities</article-title>
          <source>IEEE Access</source>
          <year>2020</year>
          <volume>8</volume>
          <fpage>164453</fpage>
          <lpage>164470</lpage>
          <pub-id pub-id-type="doi">10.1109/access.2020.3022287</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
