<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Mhealth Uhealth</journal-id><journal-id journal-id-type="publisher-id">mhealth</journal-id><journal-id journal-id-type="index">13</journal-id><journal-title>JMIR mHealth and uHealth</journal-title><abbrev-journal-title>JMIR Mhealth Uhealth</abbrev-journal-title><issn pub-type="epub">2291-5222</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v14i1e81123</article-id><article-id pub-id-type="doi">10.2196/81123</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Determining a Likely Mechanism of Missingness in Repeated Measures Sleep Data From Wearable Fitness Trackers: Longitudinal Analysis</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Mobley</surname><given-names>Kate</given-names></name><degrees>BS, MS, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gittner</surname><given-names>Kevin B</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Nielsen</surname><given-names>Karen</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Matheny</surname><given-names>Lauren M</given-names></name><degrees>MPH, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Taasoobshirazi</surname><given-names>Gita</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Natuhamya</surname><given-names>Charles</given-names></name><degrees>MS</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Swahn</surname><given-names>Monica H</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib></contrib-group><aff id="aff1"><institution>School of Data Science and Analytics, College of Computing and Software Engineering, Kennesaw State University</institution><addr-line>680 Arntson Drive Atrium J333, MD 9104</addr-line><addr-line>Marietta</addr-line><addr-line>GA</addr-line><country>United States</country></aff><aff id="aff2"><institution>Department of Health Promotion and Physical Education, Wellstar College of Health and Human Services, Kennesaw State University</institution><addr-line>Kennesaw</addr-line><addr-line>GA</addr-line><country>United States</country></aff><aff id="aff3"><institution>Department of Population Health Sciences, School of Public Health, Georgia State University</institution><addr-line>Atlanta</addr-line><addr-line>GA</addr-line><country>United States</country></aff><aff id="aff4"><institution>Uganda Youth Development Link</institution><addr-line>Kampala</addr-line><country>Uganda</country></aff><aff id="aff5"><institution>School of Public Health, Virginia Commonwealth University</institution><addr-line>Richmond</addr-line><addr-line>VA</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Badicu</surname><given-names>Georgian</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Martinko</surname><given-names>Antonio</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Mauriello</surname><given-names>Matthew Louis</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Kate Mobley, BS, MS, PhD, School of Data Science and Analytics, College of Computing and Software Engineering, Kennesaw State University, 680 Arntson Drive Atrium J333, MD 9104, Marietta, GA, 30060, United States, 1-470-578-2865; <email>mobley.kate@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>31</day><month>3</month><year>2026</year></pub-date><volume>14</volume><elocation-id>e81123</elocation-id><history><date date-type="received"><day>22</day><month>07</month><year>2025</year></date><date date-type="rev-recd"><day>25</day><month>01</month><year>2026</year></date><date date-type="accepted"><day>09</day><month>02</month><year>2026</year></date></history><copyright-statement>&#x00A9; Kate Mobley, Kevin B Gittner, Karen Nielsen, Lauren M Matheny, Gita Taasoobshirazi, Charles Natuhamya, Monica H Swahn. Originally published in JMIR mHealth and uHealth (<ext-link ext-link-type="uri" xlink:href="https://mhealth.jmir.org">https://mhealth.jmir.org</ext-link>), 31.3.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR mHealth and uHealth, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://mhealth.jmir.org/">https://mhealth.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://mhealth.jmir.org/2026/1/e81123"/><abstract><sec><title>Background</title><p>Wearable fitness trackers have become a valuable tool in public health research due to their ability to collect large-scale, individual-level data at a low cost. Because of this, wearables have the potential to mitigate the urgent need for health research in low-resource settings. However, their use has been largely limited to high-income settings, and a major challenge remains: high rates of missing data. This problem may be exacerbated in low-resource environments where logistical and operational barriers further complicate data collection. Wearable sleep data collected in an urban informal settlement in Uganda during The Onward Project on Well-being and Adversity project revealed substantial challenges related to missingness in low-resource research settings.</p></sec><sec><title>Objective</title><p>The study aimed to characterize the patterns and frequency of missing data and to demonstrate the use of analytical methods to determine the underlying missingness mechanism.</p></sec><sec sec-type="methods"><title>Methods</title><p>For this study, 300 women in slum communities in Kampala were equipped with Garmin smartwatches that collected data over 5 days. The nature of missingness was assessed through four methods: pattern analysis, the Little test, a random forest classification model, and a logistic regression classification model. Pattern analysis is an established method of identifying missing data patterns, while the Little test is used specifically to identify missing completely at random data. Random forest and logistic regression models are more recent methods proposed to identify the mechanism of missingness; both were used to examine agreement between the 2 methods and to ensure a thorough examination of missingness patterns.</p></sec><sec sec-type="results"><title>Results</title><p>Approximately 30% of nighttime data were missing. Three patterns were identified that occurred in over 10% of participants&#x2019; data: no data missing, fifth night of data missing, and all nights of data missing. Pattern analysis and the Little test (<italic>P</italic>&#x003C;.001) indicated that the data were not missing completely at random. Both the random forest (area under the curve=0.7) and logistic regression models suggested that the data were missing at random (MAR).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Evidence of missingness in this dataset was consistent with MAR. Potential causes of missingness include device removal, battery failure, and technical malfunctions. These findings have important implications for both wearable device users and future research. Understanding the mechanisms behind missingness can inform strategies to improve data quality, particularly in low-resource settings, and allow researchers to manage missingness using appropriate strategies designed to handle MAR data without introducing bias into the results.</p></sec></abstract><kwd-group><kwd>global health</kwd><kwd>wearable electronic devices</kwd><kwd>sleep</kwd><kwd>missing data</kwd><kwd>informal settlements</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Wearable Fitness Trackers in Health Research</title><p>Originally intended for personal health and fitness tracking, wearable fitness trackers have gained traction in research due to their ability to collect large-scale, real-world data from participants in natural settings [<xref ref-type="bibr" rid="ref1">1</xref>]. According to Fitabase, a platform monitoring research applications of Fitbit devices, over 1300 studies incorporated Fitbit devices between 2012 and 2025 [<xref ref-type="bibr" rid="ref2">2</xref>] and that number increases when factoring in the studies that have used other fitness trackers. Wearable fitness trackers provide real-time data collection, including physical activity, heart rate metrics, biometric and health indicators, location, behavior, and sleep. These data are critical for identifying risk factors for various health conditions, tracking health outcomes over time, evaluating interventions, and advancing personalized medicine. Wearable device data, when limitations are managed, have the potential to advance understanding of how lifestyle behaviors interact with physical and mental health across diverse populations, supporting more effective, data-driven public health strategies and clinical practices. Despite their growing adoption in research, these technologies remain disproportionately used in high-income countries and among wealthier populations [<xref ref-type="bibr" rid="ref1">1</xref>,<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>].</p></sec><sec id="s1-2"><title>Research in Urban Slum Communities</title><p>Wearable devices hold significant promise for research, particularly in low-resource settings such as urban slums [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. These settings, defined by constraints across finances, health care, infrastructure, knowledge, research capacity, social resources, environmental factors, human resources, and cultural practices [<xref ref-type="bibr" rid="ref6">6</xref>], pose unique challenges for data collection. Furthermore, over 1 billion people, or 24% of the world&#x2019;s urban population, currently live in slums, with this figure rising to 56% in sub-Saharan Africa [<xref ref-type="bibr" rid="ref7">7</xref>]. Wearables offer a practical solution to the need for health research in these settings with large populations and disproportionately high risks of physical and mental health conditions [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref10">10</xref>]. They are cost-effective, scalable, minimally intrusive, and capable of gathering individual-level data for multiple days without reliance on external power or additional technology. These advantages make them especially valuable for research in resource-limited environments [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Understanding missingness in sleep data from wearable fitness trackers can provide important foundational information for this research.</p><p>Understanding the physical and mental health challenges in urban slums and other low-resource settings is a critical public health priority, and sleep serves as a key indicator of overall well-being. Sleep problems, including poor sleep quality and short sleep duration, are common among residents of slum communities and have been linked to mental illness, but this topic is still understudied, especially so in low- and middle-income countries [<xref ref-type="bibr" rid="ref4">4</xref>]. Wearable technology presents a transformative opportunity for such studies, offering cost-effective, minimally intrusive methods to collect longitudinal health data in challenging urban environments. For instance, while poor sleep is a documented issue in slums, existing research has relied primarily on subjective and unreliable self-reports rather than objective sensor-based measurements [<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>However, while missing data is an issue present in all research involving wearable fitness trackers, the difficulties associated with doing research in low-resource settings like urban slums can contribute to higher rates of missing data [<xref ref-type="bibr" rid="ref11">11</xref>]. Residents of urban slums often have unreliable electricity access, are unfamiliar with wearable fitness tracker technologies, and face logistical barriers to implementing these technologies [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Additionally, many wearable fitness trackers are reliant on connection to a smartphone or the internet, and rates of internet access and smartphone usage are low in urban slums [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref14">14</xref>]. Because of these challenges associated with low-resource settings like urban slums, rates of missing data can be higher when wearable fitness trackers are used in these settings. Though wearable studies in slums remain limited and are often clinic-based, there is potential for scalable, real-world data collection using wearable devices [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>]. To realize this potential, understanding critical challenges like missing data must become a priority.</p></sec><sec id="s1-3"><title>Missing Data</title><p>Missing data remains a pervasive challenge in human research, arising from diverse sources. Participant-related factors, such as missed study visits or attrition, and researcher limitations in follow-up capacity are well-documented contributors [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref19">19</xref>]. The growing integration of digital devices and sensors in research has introduced additional technical sources of missingness, including equipment malfunctions, battery failures, and connectivity issues [<xref ref-type="bibr" rid="ref20">20</xref>]. Longitudinal studies, which require sustained data collection across multiple timepoints, face compounded risks of missing data, making this issue particularly acute in such designs [<xref ref-type="bibr" rid="ref21">21</xref>].</p><p>Missing data in wearable device studies typically stems from two primary sources: device-related factors and wearer-related behaviors [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. Technical issues such as battery failure, sensor displacement, software malfunctions, connectivity problems, or synchronization errors frequently contribute to device-related missingness [<xref ref-type="bibr" rid="ref22">22</xref>-<xref ref-type="bibr" rid="ref24">24</xref>]. Wearer-related missingness most commonly results from nonadherence, including device removal or improper wear [<xref ref-type="bibr" rid="ref23">23</xref>]. There has been some study of missing data in wearable data, but very little in low-resource settings where wearables have only been used in a small number of studies outside of clinical settings, where conditions are much more controlled. Researchers in low-resource settings have theorized that a higher prevalence of manual labor in these settings results in exposure to extreme conditions, contributing to both device- and wearer-related challenges, which may contribute to the deterioration of wearable devices and increased missingness [<xref ref-type="bibr" rid="ref5">5</xref>]. Wearables also differ widely in the types of data they collect, and only a few studies have considered missingness in wearable sleep data specifically [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Despite the growing use of wearable devices to collect sleep data, limited research has examined patterns and mechanisms of missingness, particularly in low-resource settings, where contextual challenges may further exacerbate missing data [<xref ref-type="bibr" rid="ref11">11</xref>].</p><p>The prevalence of missing data significantly impacts data quality and poses substantial analytical challenges [<xref ref-type="bibr" rid="ref26">26</xref>]. Effective handling of missing data through methods like imputation becomes crucial for ensuring accurate analyses [<xref ref-type="bibr" rid="ref24">24</xref>]. A comprehensive review of wearable studies in biomedical research confirms that data missingness remains among the most significant obstacles researchers face [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. Few researchers have used wearables in low-resource settings, but among those who have, numerous studies have found data missingness to be a substantial issue, underscoring the need to understand the mechanisms of missingness and to find robust solutions to this persistent issue [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>Missing data can be categorized into three primary mechanisms: missing completely at random (MCAR), missing at random (MAR), and missing not at random (MNAR). When data are MCAR, the probability of missingness is entirely independent of both observed and unobserved data [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. In contrast, MAR occurs when missingness depends only on observed variables, not the missing values themselves [<xref ref-type="bibr" rid="ref30">30</xref>]. The most challenging scenario, MNAR, arises when missingness is related to the unobserved data [<xref ref-type="bibr" rid="ref18">18</xref>,<xref ref-type="bibr" rid="ref31">31</xref>]. Understanding these common classifications of missing data is necessary, as these distinctions depend on whether missingness is related to observed or unobserved information and has important implications for analysis and interpretation [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>].</p></sec><sec id="s1-4"><title>Analytical Methods for Determining the Mechanism of Missingness</title><p>Determining the exact mechanism of missingness is challenging, but several methods can provide evidence for specific patterns. Visualization techniques offer a preliminary approach to identifying missingness patterns through graphical exploration [<xref ref-type="bibr" rid="ref32">32</xref>]. For formal testing, the Little test, a well-established method, assesses whether data are MCAR [<xref ref-type="bibr" rid="ref33">33</xref>]. To explore whether data are MAR, two analytical approaches are commonly used: random forest and logistic regression. Both methods model relationships between observed variables and a binary indicator of missingness. If significant associations exist between observed variables and missingness, this supports the MAR mechanism [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>]. However, in longitudinal studies, where observations within participants are correlated, these methods require modifications to account for dependencies. In addition to contributing to the body of knowledge on missingness in wearable sleep data, this study demonstrates the use of these analytical methods on wearable sleep data, and on repeated measures data, where adjustments are necessary to preserve the dependencies between observations from the same person.</p></sec><sec id="s1-5"><title>Wearable Fitness Trackers in Sleep Research</title><p>Since around 2017, consumer wearable fitness trackers have measured time spent in each sleep stage using a combination of motion detection, heart rate variability, and respiratory rate monitoring [<xref ref-type="bibr" rid="ref36">36</xref>]. While questions remain about the absolute accuracy of sleep-stage classification, the devices&#x2019; ability to detect sleep-wake patterns has significantly improved [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref38">38</xref>]. Importantly, wearable fitness trackers provide more objective sleep data than self-reports, as individuals often cannot accurately recall specific sleep metrics like sleep onset time or nighttime awakenings [<xref ref-type="bibr" rid="ref36">36</xref>]. Although wearable sleep tracking technology still has limitations, it represents a substantial improvement over subjective reporting for research purposes, with accuracy continuing to advance through technological innovations [<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref39">39</xref>].</p><p>Garmin devices like the ones used in this study have been assessed for the validity of their measurements. Existing studies indicate that they provide highly valid step count measurements, though their accuracy for distance, energy expenditure, and heart rate data remains more variable [<xref ref-type="bibr" rid="ref40">40</xref>]. Garmin devices demonstrate reasonable agreement with polysomnography for measuring sleep duration and staging [<xref ref-type="bibr" rid="ref41">41</xref>], and they more accurately identify deep sleep stages than some other wearable fitness trackers [<xref ref-type="bibr" rid="ref42">42</xref>]. Manufacturers release new models frequently, and different models from the same brand can vary. Therefore, the comprehensive evaluation of wearable devices across all models and brands, including validity, reliability, proprietary algorithms, cost differences, and feature variability, remains challenging. Overall, however, modern wearable technologies that combine heart rate and motion tracking demonstrate comparable effectiveness for sleep monitoring, despite some variation in specific metrics across models and brands.</p></sec><sec id="s1-6"><title>Wearable Sleep Data Missingness</title><p>While the problem of missingness in wearables data, including sleep data, has been well documented, only 2 studies were identified that considered how to address this problem in sleep data [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. However, these studies differed substantially from this work. First, both studies used sleep and wakefulness data collected every few seconds for up to 50 days, so that missingness was determined by measuring the length of time during the data collection period that no data was collected (a method typically referred to as measuring data completeness). Additionally, one of these studies used data from individuals with very irregular sleep patterns so that the results may be used by those studying sleep disorders, while the other removed participants who had removed the device at any point, a common cause of missing data [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Neither study used data from low-resource settings where missingness is likely to be even higher than in data from high-income populations.</p></sec><sec id="s1-7"><title>Study Purpose</title><p>The limited research on missing data in wearable sleep data that has been conducted so far uses sleep data that is in a significantly different format from that used in this study. To the authors&#x2019; knowledge, this is the first study to examine missingness in wearable sleep data aggregated by night within a low-resource setting. This innovative approach to analyzing missingness in wearable sleep data is closely aligned with the typical use and analysis of this type of data.</p><p>Wearable fitness trackers offer a promising tool for collecting sleep data in diverse environments, which can allow for further study of sleep and the impact of poor sleep on health. However, missing data remain a significant limitation, and the unique logistical challenges of conducting research in low-resource settings, where sleep and health research is urgently needed, may exacerbate this issue. Addressing the patterns of missingness is essential not only for improving data quality but also for advancing research on sleep&#x2019;s role in health in all settings. This study has two primary objectives: (1) to characterize the patterns and frequency of missing data and (2) to determine the underlying missingness mechanism using analytical techniques appropriate for longitudinal repeated measures data. Enders [<xref ref-type="bibr" rid="ref43">43</xref>] comprehensive work on missing data argues that MAR is the most reasonable assumption for the mechanism of missing data in most cases of research, and this assumption should be adopted unless there is evidence to the contrary. Therefore, this study will focus on evidence that the missingness is MCAR or MAR.</p></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>The TOPOWA Project</title><p>The data for this study were collected through The Onward Project on Wellbeing and Adversity (TOPOWA), a mixed methods investigation examining the social determinants of mental health among women in Kampala, Uganda&#x2019;s urban slums. Details of the study have been reported previously [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. Participant recruitment was conducted across 3 slum communities (Banda, Bwaise, and Makindye) in collaboration with the local community leaders and Uganda Youth Development Link, a nongovernmental organization serving youth in Kampala&#x2019;s informal settlements.</p><p>TOPOWA project used multiple research components, including focus group discussions, Photovoice methodology, and a longitudinal cohort study which includes the collection of sleep data via wearable fitness trackers to study the prevalence of sleep disturbance and its association with mental health in this population.</p></sec><sec id="s2-2"><title>Ethical Considerations</title><p>All study procedures were designed in compliance with the Declaration of Helsinki and received ethical approval from both the Makerere University School of Social Sciences Research Ethics Committee (MAKSSREC MUSSS-2022&#x2010;172) and the Uganda National Council of Science and Technology (SS1560ES).</p><p>Uganda Youth Development Link staff at each study site described the TOPOWA study including risks, benefits, and expectations regarding follow-up assessments to interested participants. Informed consent in writing was obtained from those who agreed to participate in the study. Participants were compensated in the local currency for each component of the study that they participated in, including wearing and returning the wearable device and completing the survey, as well as being provided with food and transportation on the days that they traveled to the research hub to complete assessments. All research assistants involved in participant enrollment and data collection were trained in participant privacy, confidentiality, and safety measures. Data were deidentified before being uploaded to REDCap (Research Electronic Data Capture) for storage and shared with members of the research team for analysis.</p></sec><sec id="s2-3"><title>Data Collection and Processing</title><p>The TOPOWA project enrolled 300 women from Kampala&#x2019;s urban slums, equipping each participant with a Garmin v&#x00ED;voactive 3 device to wear continuously for 5 days and nights. These devices were specifically selected for their field suitability: they operate independently without smartphone connectivity, feature a 5-day battery life, and automatically collect sleep data each night. During data collection, 299 devices were successfully returned, with only 1 unit lost. The v&#x00ED;voactive 3 devices record heart rate, heart rate variability, and movement data, which Garmin&#x2019;s proprietary algorithms analyze to classify sleep into 4 stages (rapid eye movement [REM], deep, light, and awake) plus an &#x201C;unmeasurable&#x201D; category for periods that cannot be classified [<xref ref-type="bibr" rid="ref45">45</xref>]. For each sleep session, the devices generate detailed outputs including the duration (in seconds) spent in each sleep stage and precise timestamps marking the beginning and end of the primary sleep period. Notably, when multiple sleep periods occur within a day, the system prioritizes and reports only the longest continuous sleep bout, overriding shorter naps. This design ensures researchers obtain standardized, comparable metrics for a person&#x2019;s main sleep period, which will be discussed as nightly sleep for simplicity, while maintaining the practicality required for field studies in low-resource settings.</p><p>During the compilation of baseline sleep data, specific criteria were established for identifying missing data. These criteria focused on total sleep duration, treating nights with no sleep information as missing while retaining nights with vague or low-quality data. Notably, the absence of data for a particular sleep stage on nights when other stages were recorded was not classified as missing data. This pattern could indicate either that the participant genuinely did not enter that sleep stage or that the device failed to detect it&#x2014;a distinction that cannot be determined from the available data. Consequently, 0 values for specific stages on otherwise recorded nights were treated as valid observations rather than missing data. No nights with data had a 0 recorded for light sleep, but there were nights that contained 0 for the deep sleep, REM sleep, and awake categories. Less than 2.5% of nights with data had a 0 recorded for multiple sleep stages. Similarly, &#x201C;unmeasurable&#x201D; sleep seconds were considered (periods the device could not classify into any stage) as legitimate data points and included in total sleep duration calculations, rather than being treated as missing values. Zeros were common in the &#x201C;unmeasurable&#x201D; category, indicating that there were no seconds of sleep that the device was unable to classify into one of the other sleep stage categories during those nights. This approach ensured that the analysis reflected the complete sleep architecture as captured by the device while maintaining methodological consistency.</p><p>The presence or absence of heart rate and activity data was also recorded. If heart rate data were present for the prior day, then a 1 was recorded, and if heart rate data were not present for the day before the night in question, then a 0 was recorded. If at least 1 activity was recorded during the 5 days that the participant wore the device, then a 1 was recorded for activity data, and if no activity was recorded over the 5 days, then a 0 was recorded. The presence or absence of heart rate data was used in the statistical analysis to determine the likely mechanism of missingness; however, since activity data was only collected during prolonged periods of physical activity and was therefore much less frequent, they were not included in the statistical models. While the Garmin sleep stage classification algorithm uses concurrently collected heart rate data, the missing data definition used in this study allowed for inclusion of nights with unclassified stages&#x2014;therefore, the presence of heart rate data was not perfectly correlated with missingness.</p></sec><sec id="s2-4"><title>Statistical Analysis</title><p>The analysis of missing data followed a systematic approach. First, a pattern analysis was conducted using the <italic>naniar</italic> (version 1.1.0; Nicholas Tierney and Dianne Cook) package in R to visually examine the structure of missingness in the dataset [<xref ref-type="bibr" rid="ref46">46</xref>]. Next, the Little test, a likelihood ratio-based test that compares the expected means for each variable across different missingness patterns [<xref ref-type="bibr" rid="ref33">33</xref>], was applied to evaluate whether the data were MCAR. For the Little test, the data were converted to wide format, and the 5 sleep category variables (deep, light, REM, awake, and unmeasurable) were included as well as the variables for marital status, household size, education level, and employment status. This test was conducted first because the MCAR criteria are more restrictive than the MAR criteria.</p><p>Following this initial assessment, 2 distinct classification methods, a random forest model and a generalized estimating equations (GEE) model with a logit link function, were used to explore whether the missingness pattern was consistent with MAR. For both models, a binary dependent variable indicating whether data were present or missing for each night was created. Both models incorporated six predictor variables: (1) night sequence number (1-5), (2) household size, (3) education level, (4) employment status (binary), (5) marital status (binary), and (6) presence of heart rate data for the day before the night of sleep (binary). These covariates were selected based on established relationships between socioeconomic factors and sleep behaviors in prior research [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. The results from both models were then used to strengthen the conclusions about the nature of the missing data mechanism.</p><p>The dataset included participants with complete missingness across all 5 nights of sleep monitoring, represented by NA (not available) values for all sleep stages. While standard practice might suggest listwise deletion for such cases, these participants were retained in this analysis for three key reasons: (1) they provided complete data for all independent variables (household size, marital status, education level, employment status, and heart rate data availability), (2) this study specifically aimed to develop alternatives to conventional listwise deletion approaches, and (3) missingness, even complete missingness, can be informative when evaluating the mechanism and patterns behind the missingness.</p><p>While the random forest classification and GEE modeling with logit link functions serve similar analytical purposes for MAR assessment, their concurrent application provides methodological robustness, given that (1) each approach has distinct strengths in handling different data characteristics and (2) their use for MAR determination remains relatively novel in the literature, with foundational publications emerging only in the early 2000s [<xref ref-type="bibr" rid="ref34">34</xref>,<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref49">49</xref>]. This dual-method approach strengthened the conclusions by assessing consistency across complementary analytical frameworks.</p></sec><sec id="s2-5"><title>Random Forest Classification Model</title><p>A random forest classification model was used using the <italic>randomForest</italic> R package (version 4.7.1.1; Andy Liaw and Matthew Wiener) to assess whether the data were consistent with MAR, as this approach can effectively capture complex, nonlinear relationships among observed variables [<xref ref-type="bibr" rid="ref35">35</xref>]. Model performance was evaluated using the area under the receiver operating characteristic curve. An area under the curve (AUC) value significantly greater than 0.5 provided evidence for MAR, as this indicates that the missingness pattern was systematically related to the observed variables in the dataset [<xref ref-type="bibr" rid="ref35">35</xref>]. Low AUC values (less than 0.5) indicate that the model performs no better than random guessing and would be expected if the data were MCAR. AUC values above 0.5 can occur if the data are MNAR but are more likely to occur if the data are MAR [<xref ref-type="bibr" rid="ref35">35</xref>].</p><p>A critical consideration in the analysis was that standard random forest classification assumes independence between observations, an assumption violated in longitudinal data where multiple measurements come from the same individual. To address this dependency, a cluster-adjusted bootstrap sampling approach [<xref ref-type="bibr" rid="ref50">50</xref>] was implemented, which resampled participants (rather than individual nights) to preserve within-subject correlations. While the use of a random forest model to assess evidence of MAR is not novel, modifying that model to account for dependencies between observations in repeated measures data is not a standard use of the method. For this reason, a second method of modeling patterns between observed variables was used.</p></sec><sec id="s2-6"><title>GEE Model With Logit Link Function</title><p>The second approach implemented for exploring a MAR mechanism was a logistic regression model. This method tests whether observed variables can systematically predict missingness patterns&#x2014;a key criterion for MAR. While several logistic regression-based approaches exist for MAR assessment (including Ridout&#x2019;s method for dropout analysis in longitudinal studies [<xref ref-type="bibr" rid="ref34">34</xref>] and Fairclough&#x2019;s method for missingness prediction), Fairclough&#x2019;s framework [<xref ref-type="bibr" rid="ref34">34</xref>] was adapted for this analysis since its purpose was closely aligned with the goal of this study. Independent variables were entered sequentially into the model to assess their association with missingness. A variable&#x2019;s contribution was evaluated based on the regression coefficient estimates, with statistical significance determined using robust standard errors derived from the GEE, to characterize predictors of missingness. Five total models were created with an additional variable added in each model. This iterative approach using forward selection allowed for assessing how different participant characteristics and study factors influenced the probability of data being missing for a given night.</p><p>While traditional logistic regression assumes independence between observations, this assumption is violated in repeated measures designs where observations from the same participant are inherently correlated [<xref ref-type="bibr" rid="ref51">51</xref>]. To address this dependency, a GEE model with a logit link function was used using the <italic>geepack</italic> package in R (version 1.3.12; S&#x00F8;ren H&#x00F8;jsgaard, Ulrich Halekoh, Jun Yan, and Claus Thorn Ekstr&#x00F8;m), which extends generalized linear models by incorporating specified covariance structures [<xref ref-type="bibr" rid="ref52">52</xref>]. Working correlation structures were assessed for fit, including the unstructured, exchangeable, and autoregressive (1). The quasi-likelihood under the independence model information criterion was used to assess which working correlation structure was most suitable [<xref ref-type="bibr" rid="ref52">52</xref>]. For this analysis, an exchangeable working correlation structure was selected, which assumes that the correlations between observations from the same participant are equally correlated [<xref ref-type="bibr" rid="ref52">52</xref>]. This selection is appropriate because the data were collected over just 5 consecutive days, so significant correlation decay is not expected in such a short time period. The GEE framework allowed for properly accounting for within-participant correlations while examining how various factors predicted missingness patterns.</p><p>While the GEE model with a logit link function and the random forest model perform similarly in that they both model relationships between observed variables, neither is a standard method of assessing the mechanism of missingness that has been well documented in previous publications, as is the case for the Little test. Literature was identified that supported the validity of these methods, but no prior studies using these methods were identified. For these reasons, both modeling methods were performed so that their results could be compared.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Participant Characteristics</title><p>All women who participated in the TOPOWA project were aged between 18 and 24 years old. All participants had completed some primary school and could read and write, but only 8% (24/300) had completed secondary school. Over half, 62% (186/300), had given birth and 82% (152/186) of those who had given birth lived with her child(ren). Only 15% (45/300) of the women lived in a single generation household, while the remaining 85% (255/300) lived in households with 2 or more generations. Women who had a job represented 32% (97/300) while the remaining 68% (203/300) of the women were unemployed.</p></sec><sec id="s3-2"><title>Missing Data in the TOPOWA Baseline Sleep Data</title><p>Participants wore Garmin devices continuously for 5 days and nights, yielding sleep data from 299 individuals. However, 37 (12%) devices recorded no sleep data across all 5 nights (complete missingness). The dataset exhibited a notable missing data pattern: nights were either fully observed (all sleep stages recorded) or fully missing (no data for any sleep stage). Consequently, missingness proportions were identical across all sleep metrics (deep, light, REM, awake, and unmeasurable seconds), with an overall missing data rate of 30% (455 nights missing out of 1495 total nights). The rate of missingness was similar across the 3 study sites (Banda, Bwaise, and Makindye) with Banda having a slightly higher rate of missingness than Bwaise and Makindye (<xref ref-type="table" rid="table1">Table 1</xref>). The rate of missingness in the sleep data remained consistent as household size increased but increased slightly with each additional child a woman had, so that participants with no children had the lowest rate of missingness (155/570 nights of data, 27%) and participants with 3 children had the highest rate of missingness (18/25 nights of data, 72%) (<xref ref-type="table" rid="table1">Table 1</xref>). The rate of missingness in the sleep data was approximately equal across changes in income, employment status, education level, and marital status. Notably, 58% (173/299) of participants experienced at least 1 night of missing data, demonstrating the pervasiveness of this issue.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Proportion of missing data by study site, night of data collection, and number of children.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Rate and number of nights of data missing</td><td align="left" valign="bottom">Nights of data (n=495) missing from Banda participants, n/N (%)</td><td align="left" valign="bottom">Nights of data (n=500) missing from Bwaise participants, n/N (%)</td><td align="left" valign="bottom">Nights of data (n=500) missing from Makindye participants, n/N (%)</td><td align="left" valign="bottom">Total nights of data (n=1495) missing from all participants, n/N (%)</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="5">Night of data collection</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">22/99 (22)</td><td align="left" valign="top">25/100 (25)</td><td align="left" valign="top">20/100 (20)</td><td align="left" valign="top">67/299 (22)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">32/99 (32)</td><td align="left" valign="top">26/100 (26)</td><td align="left" valign="top">21/100 (21)</td><td align="left" valign="top">79/299 (26)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">32/99 (32)</td><td align="left" valign="top">25/100 (25)</td><td align="left" valign="top">24/100 (24)</td><td align="left" valign="top">81/299 (27)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4</td><td align="left" valign="top">35/99 (35)</td><td align="left" valign="top">21/100 (21)</td><td align="left" valign="top">32/100 (32)</td><td align="left" valign="top">88/299 (29)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>5</td><td align="left" valign="top">49/99 (49)</td><td align="left" valign="top">44/100 (44)</td><td align="left" valign="top">47/100 (47)</td><td align="left" valign="top">140/299 (47)</td></tr><tr><td align="left" valign="top" colspan="5">Number of children</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>0</td><td align="left" valign="top">34/155 (22)</td><td align="left" valign="top">65/155 (42)</td><td align="left" valign="top">56/155 (36)</td><td align="left" valign="top">155/570 (27)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1</td><td align="left" valign="top">89/188 (47)</td><td align="left" valign="top">45/188 (24)</td><td align="left" valign="top">54/188 (29)</td><td align="left" valign="top">188/625 (30)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>2</td><td align="left" valign="top">35/94 (37)</td><td align="left" valign="top">26/94 (28)</td><td align="left" valign="top">33/94 (35)</td><td align="left" valign="top">94/275 (34)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>3</td><td align="left" valign="top">11/18 (61)</td><td align="left" valign="top">7/18 (39)</td><td align="left" valign="top">N/A<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="top">18/25 (72)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>N/A: not available.</p></fn></table-wrap-foot></table-wrap><p>The 37 cases of complete missingness for all 5 nights of sleep data can be categorized into 3 distinct scenarios with varying probable causes, detailed in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Categorization of the 37 cases of complete sleep data missingness.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Status of sleep and heart rate data</td><td align="left" valign="bottom">Number of cases</td></tr></thead><tbody><tr><td align="left" valign="top">No sleep or heart rate data collected</td><td align="left" valign="top">1 device</td></tr><tr><td align="left" valign="top">Partial data collection&#x2014;either heart rate or activity (but not both) data collected for at least 1 day</td><td align="left" valign="top">8 devices</td></tr><tr><td align="left" valign="top">Selective sleep data missingness&#x2014;devices collected both heart rate and activity data for at least 1 day, but no sleep data</td><td align="left" valign="top">28 devices</td></tr></tbody></table></table-wrap></sec><sec id="s3-3"><title>Data Exploration</title><p>The distributions of time spent in each sleep stage and total time asleep were examined to determine if the distributions differed based on the day of the data collection (1-5). For each sleep stage, as well as total time asleep, the distribution was the same both when the 5 nights of data were considered together and when the data were grouped by night. There were no changes in the distribution of sleep times over the course of the 5 days of data collection.</p><p>There were some outliers in the total sleep durations. For 1 participant, less than 1 hour of sleep was recorded in 1 night, and for another participant, just over 12.5 hours of sleep was recorded on 1 night. Because the outlier values present in the data are not outside the realm of possibility, these observations were retained when assessing the missing data mechanism.</p></sec><sec id="s3-4"><title>Missingness Patterns</title><p>The first night of data collection has the least amount of missing data, with 22% (66/300) of nights missing data. The rate of missing data increases for each subsequent night, and the fifth and final night of data collection has 47% (141/300) of data missing (<xref ref-type="table" rid="table1">Table 1</xref>). There were 29 missingness patterns identified in the data (<xref ref-type="fig" rid="figure1">Figure 1</xref>), with no nights missing being the most common (126 cases), followed by missing only the last night of data (48 cases) and then missing all nights of data (37 cases).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Patterns of missingness in the sleep data. Missingness patterns are ordered from most common at the top (no missing nights of data) to the least common (bottom).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="mhealth_v14i1e81123_fig01.png"/></fig></sec><sec id="s3-5"><title>The Little Test</title><p>When running the Little test, the null hypothesis is that the data are MCAR while the alternative hypothesis is that the data are not MCAR and are therefore either MAR or MNAR. The <italic>&#x03C7;</italic><sup>2</sup> statistic was 969 and the degrees of freedom was 587, which resulted in a <italic>P</italic> value for the Little test of <italic>P</italic>&#x003C;.001. Therefore, the null hypothesis is rejected. This suggests that the data were not MCAR.</p></sec><sec id="s3-6"><title>Random Forest Classification Model</title><p>The AUC value of 0.70 for the random forest classification model indicated that the model was generally able to distinguish missingness, which is consistent with data MAR. The sensitivity, a measure of how well true positives (ie, missing data) are predicted, was 0.30 and the specificity, a measure of how well true negatives (ie, data present) are identified, was 0.94. The overall accuracy for the model was 0.75. <xref ref-type="table" rid="table3">Table 3</xref> shows the confusion matrix for the random forest classification model.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Random forest classification model confusion matrix.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Predicted values</td><td align="left" valign="bottom" colspan="2">True values</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">0 (data present)</td><td align="left" valign="bottom">1 (data missing)</td></tr></thead><tbody><tr><td align="left" valign="top">0 (data present)</td><td align="left" valign="top">978</td><td align="left" valign="top">319</td></tr><tr><td align="left" valign="top">1 (data missing)</td><td align="left" valign="top">62</td><td align="left" valign="top">136</td></tr></tbody></table></table-wrap></sec><sec id="s3-7"><title>GEE Model With Logit Link Function</title><p>The results of the GEE model with a logit link function also yielded results that were consistent with a MAR assumption. The independent variables were added to the model in an iterative process to determine the extent to which each of the variables was able to predict missingness. The final model (<xref ref-type="table" rid="table4">Table 4</xref>) contained only 2 predictor variables that were statistically significant, number of night in the 5-night sequence (1-5) and whether the participant had a job. The model had an accuracy of 0.70. The sensitivity was 0.12, while the specificity was 0.96. The confusion matrix for the model is displayed in <xref ref-type="table" rid="table5">Table 5</xref>.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Results of generalized estimating equations model with logit link function.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Parameter estimate</td><td align="left" valign="bottom">SE</td><td align="left" valign="bottom" colspan="2">Odds ratio (95% CI)</td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Intercept</td><td align="left" valign="top">&#x2013;1.8546</td><td align="left" valign="top">0.1850</td><td align="left" valign="top" colspan="2">0.156 (0.109&#x2010;0.225)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Number of night in the 5-night sequence</td><td align="left" valign="top">0.2554</td><td align="left" valign="top">0.0357</td><td align="left" valign="top" colspan="2">1.291 (1.204&#x2010;1.384)</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Job</td><td align="left" valign="top">0.6671</td><td align="left" valign="top">0.2016</td><td align="left" valign="top" colspan="2">1.948 (1.312&#x2010;2.893)</td><td align="left" valign="top">.001</td></tr></tbody></table></table-wrap><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Confusion matrix for the generalized estimating equations model with logit link function.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Predicted values</td><td align="left" valign="bottom" colspan="2">True values</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">0 (data present)</td><td align="left" valign="bottom">1 (data missing)</td></tr></thead><tbody><tr><td align="left" valign="top">0 (data present)</td><td align="left" valign="top">996</td><td align="left" valign="top">402</td></tr><tr><td align="left" valign="top">1 (data missing)</td><td align="left" valign="top">44</td><td align="left" valign="top">53</td></tr></tbody></table></table-wrap></sec><sec id="s3-8"><title>Comparing the Results of the 2 Classification Models</title><p>The random forest model and the logistic regression model agreed in 90% (1346) of cases. <xref ref-type="table" rid="table6">Table 6</xref> contains the confusion matrix showing how often the 2 models agreed and how often they disagreed in their classifications.</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>Confusion matrix comparing the random forest and logistic regression models.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Logistic regression predictions</td><td align="left" valign="bottom" colspan="2">Random forest predictions</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">0 (data present)</td><td align="left" valign="bottom">1 (data missing)</td></tr></thead><tbody><tr><td align="left" valign="top">0 (data present)</td><td align="char" char="." valign="top">1281</td><td align="char" char="." valign="top">117</td></tr><tr><td align="left" valign="top">1 (data missing)</td><td align="char" char="." valign="top">32</td><td align="char" char="." valign="top">65</td></tr></tbody></table></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Results</title><p>Our comprehensive analysis provides evidence that the missing sleep data in the TOPOWA study follows a MAR pattern, thereby permitting the use of imputation and likelihood-based methods that would be inappropriate under an MNAR mechanism. Furthermore, Enders [<xref ref-type="bibr" rid="ref43">43</xref>] recommends adopting MAR as the default assumption in most realistic research scenarios. The findings in this study indicate that missingness was systematically related to observable variables rather than unobserved sleep characteristics [<xref ref-type="bibr" rid="ref21">21</xref>,<xref ref-type="bibr" rid="ref53">53</xref>]. Both the random forest model and the GEE model with a logit link function had high specificity values, indicating that the models identified true negatives well (present data values), but the values for sensitivity were low, indicating that the models performed worse at identifying true positives (missing data values). The classification models more accurately identified when data values were present than when data values were missing. However, previous researchers who have used this method to check for evidence that missing data are MAR have focused on the AUC value and did not report sensitivity and specificity [<xref ref-type="bibr" rid="ref35">35</xref>].</p><p>While additional studies using varying types of data, such as supplementary self-reported sleep data, are necessary to further validate the methodology used in this study, the results suggest that a GEE model with a logit link function and a random forest classification model can be used to identify evidence that missing data are MAR in repeated measures data when modifications are made to account for the dependencies between observations from the same person. This finding has the potential to improve researchers&#x2019; handling of missing data in longitudinal data, common in health research, by providing a way to empirically determine the likely mechanism of missingness prior to analysis and decide how best to handle the missing data based on that mechanism of missingness.</p></sec><sec id="s4-2"><title>Possible Explanations for Missing Data</title><p>Several key observations support the conclusion that the missingness is MAR. First, the temporal pattern of missingness showed a clear progression, with later nights (particularly night 5) having higher rates of missingness than earlier nights. Second, known explanations for missingness&#x2014;including device failure (n=1 likely case), nonadherence (n=3 self-reported cases), or improper device fit&#x2014;would generally qualify as MAR mechanisms. While 37 participants had no sleep data for any of the 5 nights, the available evidence suggests these cases resulted from technical or behavioral factors rather than being related to the missing sleep values themselves.</p><p>Missing data in the baseline sleep dataset likely stemmed from multiple sources, each with distinct implications for analysis. Battery depletion emerged as a primary factor, with some devices failing to maintain charge through all 5 nights, according to reports from the research assistants. This explanation aligns with the observed increase in missingness across successive nights and qualifies as MAR, as battery failure was unrelated to participants&#x2019; sleep patterns. The most common missingness pattern in the data was data missing on the fifth night only, which likely occurred because the battery was depleted before the fifth night. The third most common missingness pattern was data present for the first 3 nights and missing for the fourth and fifth nights, which also likely occurred due to a depleted battery. A subset of cases involved unpredictable device malfunctions (MCAR), where hardware failures caused complete data loss independent of user behavior or sleep characteristics. This was likely the case for the 1 participant for which no heart rate, activity, or sleep data was collected, and may have been the case for the 8 participants for whom either heart rate data or activity data was collected (but not both) and no sleep data was collected. Another possibility is that the missing data in the underlying raw data (heart rate variability and motion data) resulted in insufficient physiological data for sleep algorithm processing. This pattern highlights the technical and behavioral challenges inherent in wearable research, where algorithm-derived outcomes (like sleep duration and stages) depend on sensor data.</p><p>Participant-related issues also contributed: some women reported removing devices due to social discomfort (eg, partner or child concerns) [<xref ref-type="bibr" rid="ref14">14</xref>], while improper fit (eg, loose wrist placement) prevented sensor contact, mimicking nonwear. In the case of the 8 participants for whom no sleep data was collected but either heart rate or activity data was collected, and the 28 participants for which heart rate and activity data was collected but sleep data was not, intermittent device removal (ie, at night) may have been a factor contributing to sleep data missingness. The coexistence of these mechanisms, and the potential for both technical and behavioral reasons for missingness, highlights the complexity of missingness in wearable research and underscores the need for robust analytical approaches to mitigate bias.</p><p>While only 3 women reported removing the device for any period of time during the 5-day data collection period, the missingness patterns in the data from considerably more devices suggested that device removal was a possible factor. The second most common missingness pattern in the data was data missing for all 5 nights, which could indicate the participants removed the device. Notably, the discrepancy between self-reported and probable nonwear suggests possible social desirability bias, as participants received compensation for participation.</p></sec><sec id="s4-3"><title>Limitations</title><p>Several important limitations should be considered when interpreting this study&#x2019;s findings. The presence or absence of other physiological or behavioral metrics that wearable devices can capture (eg, activity levels, heart rate variability) was examined, but only the presence or absence of this data was tracked. Detailed information on heart rate or activity was not analyzed. Low-quality data may also mask data that should have been marked as missing. Some extreme sleep duration values (both small and large) were identified that could represent either genuine biological variation or measurement artifacts. Wearable devices may misclassify wakefulness as sleep during prolonged sedentary periods or conversely interpret restless sleep as wakefulness. While these devices generally provide more objective sleep measurements than self-reports, such classification errors underscore the importance of interpreting extreme values cautiously. Future studies could benefit from incorporating complementary data sources such as self-reported sleep to validate these outlier observations.</p><p>While it is possible that the day of the week may impact missingness, this was not explored in this analysis for 2 reasons. The women in this study were issued Garmin devices for 5-day periods on a rolling basis, meaning that not all women wore the devices over the weekend. The second reason that considering weekday versus weekend missingness is not ideal using this data is that the lifestyle and employment status of these women are very different from those of middle- and working-class populations, as well as Western assumptions of a structured 5-day work week, who typically have consistent and differing routines on weekdays and weekends. Most of these women did not have jobs with regular Monday-Friday hours.</p><p>Lastly, questions regarding the validity and reliability of consumer-grade wearable devices remain and should be further researched, especially because validity can vary between different device models from the same brand using similar technology. As health research using wearable devices continues and expands, the study of the validity of these devices should continue as well, especially as new models and technology that have not been previously studied are released. Additionally, self-reported sleep data has long been used for sleep research and can be a valuable tool when used as complementary data for validating sleep data from wearable technology.</p></sec><sec id="s4-4"><title>Conclusion</title><p>This work demonstrates the process researchers can undertake when assessing missing data assumptions prior to the analysis of wearable data. Taken together, these findings suggest that a MAR mechanism can be assumed for sleep data in the TOPOWA study, with missingness driven primarily by observable technical and behavioral factors rather than unobserved sleep characteristics. This distinction is critical for selecting appropriate imputation strategies and ensuring valid inferences in future analyses. As wearable methods expand in global health research, especially in urban informal settlements, addressing the practical and ethical complexities of data missingness will be essential for advancing equity, rigor, and reproducibility. In addition to considering data collected in a low-resource setting, where research faces additional challenges, this study contributes meaningful information on missingness in wearable sleep data aggregated by night, closely aligning it with the common use and analysis of this type of data.</p></sec></sec></body><back><ack><p>The authors would like to thank their partners at Uganda Youth Development Link staff and research assistants who supported The Onward Project on Well-being and Adversity project.</p></ack><notes><sec><title>Funding</title><p>Research reported in this publication was funded by the National Institute of Mental Health, of the National Institutes of Health, under award number R01MH128930 to Swahn. The content is solely the responsibility of the authors and does not necessarily represent the official views of the National Institutes of Health.</p></sec><sec><title>Data Availability</title><p>The deidentified participant-level sleep data may be obtained by reasonable request to the principal investigator or corresponding author.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: KM (lead), KBG (supporting), KN (supporting), LMM (supporting)</p><p>Data curation: MHS, KM, KN</p><p>Formal analysis: KM</p><p>Funding acquisition: MHS</p><p>Investigation: MHS, KM, KN, KBG</p><p>Methodology: KM (lead), KBG (supporting), KN (supporting), LMM (supporting), GT (supporting)</p><p>Project administration: MHS (lead), KM, KN, CN, KBG</p><p>Resources: MHS</p><p>Supervision: KBG, MHS, KN, LMM, GT</p><p>Writing &#x2013; original draft: KM</p><p>Writing &#x2013; review &#x0026; editing: KM, KBG, KN, LMM, GT, CN, MHS</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AUC</term><def><p>area under the curve</p></def></def-item><def-item><term id="abb2">GEE</term><def><p>generalized estimating equations</p></def></def-item><def-item><term id="abb3">MAR</term><def><p>missing at random</p></def></def-item><def-item><term id="abb4">MCAR</term><def><p>missing completely at random</p></def></def-item><def-item><term id="abb5">MNAR</term><def><p>missing not at random</p></def></def-item><def-item><term id="abb6">REDCap</term><def><p>Research Electronic Data Capture</p></def></def-item><def-item><term id="abb7">REM</term><def><p>rapid eye movement</p></def></def-item><def-item><term id="abb8">TOPOWA</term><def><p>The Onward Project on Well-being and Adversity</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huhn</surname><given-names>S</given-names> </name><name name-style="western"><surname>Axt</surname><given-names>M</given-names> </name><name name-style="western"><surname>Gunga</surname><given-names>HC</given-names> </name><etal/></person-group><article-title>The impact of wearable technologies in health research: scoping review</article-title><source>JMIR Mhealth Uhealth</source><year>2022</year><month>01</month><day>25</day><volume>10</volume><issue>1</issue><fpage>e34384</fpage><pub-id pub-id-type="doi">10.2196/34384</pub-id><pub-id pub-id-type="medline">35076409</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="web"><article-title>Fitbit research library</article-title><source>Fitabase</source><access-date>2025-06-02</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.fitabase.com/research-library/">https://www.fitabase.com/research-library/</ext-link></comment></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Holko</surname><given-names>M</given-names> </name><name name-style="western"><surname>Litwin</surname><given-names>TR</given-names> </name><name name-style="western"><surname>Munoz</surname><given-names>F</given-names> </name><etal/></person-group><article-title>Wearable fitness tracker use in federally qualified health center patients: strategies to improve the health of all of us using digital health devices</article-title><source>NPJ Digit Med</source><year>2022</year><month>04</month><day>25</day><volume>5</volume><issue>1</issue><fpage>53</fpage><pub-id pub-id-type="doi">10.1038/s41746-022-00593-x</pub-id><pub-id pub-id-type="medline">35469045</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nielsen</surname><given-names>K</given-names> </name><name name-style="western"><surname>Mobley</surname><given-names>K</given-names> </name><name name-style="western"><surname>Culbreth</surname><given-names>R</given-names> </name><name name-style="western"><surname>Palmier</surname><given-names>J</given-names> </name><name name-style="western"><surname>Nabulya</surname><given-names>A</given-names> </name><name name-style="western"><surname>Swahn</surname><given-names>MH</given-names> </name></person-group><article-title>Feasibility and acceptability of wearable devices and daily diaries to assess sleep and other health indicators among young women in the slums of Kampala, Uganda</article-title><source>Digit Health</source><year>2024</year><volume>10</volume><fpage>20552076241288754</fpage><pub-id pub-id-type="doi">10.1177/20552076241288754</pub-id><pub-id pub-id-type="medline">39430703</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huhn</surname><given-names>S</given-names> </name><name name-style="western"><surname>Matzke</surname><given-names>I</given-names> </name><name name-style="western"><surname>Koch</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Using wearable devices to generate real-world, individual-level data in rural, low-resource contexts in Burkina Faso, Africa: a case study</article-title><source>Front Public Health</source><year>2022</year><volume>10</volume><fpage>972177</fpage><pub-id pub-id-type="doi">10.3389/fpubh.2022.972177</pub-id><pub-id pub-id-type="medline">36249225</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>van Zyl</surname><given-names>C</given-names> </name><name name-style="western"><surname>Badenhorst</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hanekom</surname><given-names>S</given-names> </name><name name-style="western"><surname>Heine</surname><given-names>M</given-names> </name></person-group><article-title>Unravelling &#x201C;low-resource settings&#x201D;: a systematic scoping review with qualitative content analysis</article-title><source>BMJ Glob Health</source><year>2021</year><month>06</month><volume>6</volume><issue>6</issue><fpage>e005190</fpage><pub-id pub-id-type="doi">10.1136/bmjgh-2021-005190</pub-id><pub-id pub-id-type="medline">34083239</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="web"><article-title>Make cities and human settlements inclusive, safe, resilient and sustainable</article-title><source>United Nations Statistics Division</source><access-date>2025-06-02</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://unstats.un.org/sdgs/report/2021/goal-11/">https://unstats.un.org/sdgs/report/2021/goal-11/</ext-link></comment></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sclar</surname><given-names>ED</given-names> </name><name name-style="western"><surname>Garau</surname><given-names>P</given-names> </name><name name-style="western"><surname>Carolini</surname><given-names>G</given-names> </name></person-group><article-title>The 21st century health challenge of slums and cities</article-title><source>Lancet</source><year>2005</year><volume>365</volume><issue>9462</issue><fpage>901</fpage><lpage>903</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(05)71049-7</pub-id><pub-id pub-id-type="medline">15752535</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nejad</surname><given-names>FN</given-names> </name><name name-style="western"><surname>Ghamari</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Kamal</surname><given-names>SHM</given-names> </name><name name-style="western"><surname>Tabatabaee</surname><given-names>SS</given-names> </name><name name-style="western"><surname>Ganjali</surname><given-names>R</given-names> </name></person-group><article-title>The most important social determinants of slum dwellers&#x2019; health: a scoping review</article-title><source>J Prev Med Public Health</source><year>2021</year><month>07</month><volume>54</volume><issue>4</issue><fpage>265</fpage><lpage>274</lpage><pub-id pub-id-type="doi">10.3961/jpmph.21.073</pub-id><pub-id pub-id-type="medline">34370940</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ompad</surname><given-names>DC</given-names> </name><name name-style="western"><surname>Galea</surname><given-names>S</given-names> </name><name name-style="western"><surname>Caiaffa</surname><given-names>WT</given-names> </name><name name-style="western"><surname>Vlahov</surname><given-names>D</given-names> </name></person-group><article-title>Social determinants of the health of urban populations: methodologic considerations</article-title><source>J Urban Health</source><year>2007</year><month>05</month><volume>84</volume><issue>3 Suppl</issue><fpage>i42</fpage><lpage>53</lpage><pub-id pub-id-type="doi">10.1007/s11524-007-9168-4</pub-id><pub-id pub-id-type="medline">17458704</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ustinov</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Lichstein</surname><given-names>KL</given-names> </name></person-group><article-title>Actigraphy reliability with normal sleepers</article-title><source>Behav Sleep Med</source><year>2013</year><volume>11</volume><issue>5</issue><fpage>313</fpage><lpage>320</lpage><pub-id pub-id-type="doi">10.1080/15402002.2012.688779</pub-id><pub-id pub-id-type="medline">23268697</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gupta</surname><given-names>N</given-names> </name><name name-style="western"><surname>Crowley</surname><given-names>P</given-names> </name><name name-style="western"><surname>Holtermann</surname><given-names>A</given-names> </name><name name-style="western"><surname>Straker</surname><given-names>L</given-names> </name><name name-style="western"><surname>Stamatakis</surname><given-names>E</given-names> </name><name name-style="western"><surname>Ding</surname><given-names>D</given-names> </name></person-group><article-title>Are we ready for wearable-based global physical activity surveillance?</article-title><source>Br J Sports Med</source><year>2024</year><month>03</month><day>21</day><volume>58</volume><issue>7</issue><fpage>356</fpage><lpage>358</lpage><pub-id pub-id-type="doi">10.1136/bjsports-2023-106780</pub-id><pub-id pub-id-type="medline">38336382</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liverani</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ir</surname><given-names>P</given-names> </name><name name-style="western"><surname>Perel</surname><given-names>P</given-names> </name><name name-style="western"><surname>Khan</surname><given-names>M</given-names> </name><name name-style="western"><surname>Balabanova</surname><given-names>D</given-names> </name><name name-style="western"><surname>Wiseman</surname><given-names>V</given-names> </name></person-group><article-title>Assessing the potential of wearable health monitors for health system strengthening in low- and middle-income countries: a prospective study of technology adoption in Cambodia</article-title><source>Health Policy Plan</source><year>2022</year><month>09</month><day>13</day><volume>37</volume><issue>8</issue><fpage>943</fpage><lpage>951</lpage><pub-id pub-id-type="doi">10.1093/heapol/czac019</pub-id><pub-id pub-id-type="medline">35262172</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Swahn</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Gittner</surname><given-names>KB</given-names> </name><name name-style="western"><surname>Lyons</surname><given-names>MJ</given-names> </name><etal/></person-group><article-title>Advancing mHealth research in low-resource settings: young women&#x2019;s insights and implementation challenges with wearable smartwatch devices in Uganda</article-title><source>Sensors (Basel)</source><year>2024</year><month>08</month><day>29</day><volume>24</volume><issue>17</issue><fpage>5591</fpage><pub-id pub-id-type="doi">10.3390/s24175591</pub-id><pub-id pub-id-type="medline">39275502</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Garbern</surname><given-names>S</given-names> </name><name name-style="western"><surname>Mbanjumucyo</surname><given-names>G</given-names> </name><name name-style="western"><surname>Umuhoza</surname><given-names>C</given-names> </name><etal/></person-group><article-title>Feasibility and accuracy of a wearable biosensor device for vital sign monitoring in septic emergency department patients in Rwanda</article-title><source>Prehosp Disaster med</source><year>2019</year><month>05</month><volume>34</volume><issue>s1</issue><fpage>s85</fpage><lpage>s86</lpage><pub-id pub-id-type="doi">10.1017/S1049023X1900178X</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ghomrawi</surname><given-names>HM</given-names> </name><name name-style="western"><surname>Many</surname><given-names>BT</given-names> </name><name name-style="western"><surname>Holl</surname><given-names>JL</given-names> </name><etal/></person-group><article-title>Clinicians&#x2019; perspectives on wearable sensor technology as an alternative bedside monitoring tool in two West African countries</article-title><source>Int J Med Inform</source><year>2023</year><month>07</month><volume>175</volume><fpage>105046</fpage><pub-id pub-id-type="doi">10.1016/j.ijmedinf.2023.105046</pub-id><pub-id pub-id-type="medline">37148867</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Van</surname><given-names>HMT</given-names> </name><name name-style="western"><surname>Hao</surname><given-names>NV</given-names> </name><name name-style="western"><surname>Phan Nguyen Quoc</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Vital sign monitoring using wearable devices in a Vietnamese intensive care unit</article-title><source>BMJ Innov</source><year>2021</year><month>03</month><volume>7</volume><issue>Suppl 1</issue><fpage>s7</fpage><lpage>s11</lpage><pub-id pub-id-type="doi">10.1136/bmjinnov-2021-000707</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cao</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Allore</surname><given-names>H</given-names> </name><name name-style="western"><surname>Vander Wyk</surname><given-names>B</given-names> </name><name name-style="western"><surname>Gutman</surname><given-names>R</given-names> </name></person-group><article-title>Review and evaluation of imputation methods for multivariate longitudinal data with mixed-type incomplete variables</article-title><source>Stat Med</source><year>2022</year><month>12</month><day>30</day><volume>41</volume><issue>30</issue><fpage>5844</fpage><lpage>5876</lpage><pub-id pub-id-type="doi">10.1002/sim.9592</pub-id><pub-id pub-id-type="medline">36220138</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>De</surname><given-names>A</given-names> </name></person-group><article-title>Multiple imputation by fully conditional specification for dealing with missing data in a large epidemiologic study</article-title><source>Int J Stat Med Res</source><year>2015</year><volume>4</volume><issue>3</issue><fpage>287</fpage><lpage>295</lpage><pub-id pub-id-type="doi">10.6000/1929-6029.2015.04.03.7</pub-id><pub-id pub-id-type="medline">27429686</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adhikari</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jiang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Zhan</surname><given-names>J</given-names> </name><etal/></person-group><article-title>A comprehensive survey on imputation of missing data in Internet of Things</article-title><source>ACM Comput Surv</source><year>2023</year><month>07</month><day>31</day><volume>55</volume><issue>7</issue><fpage>1</fpage><lpage>38</lpage><pub-id pub-id-type="doi">10.1145/3533381</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huque</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Carlin</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Simpson</surname><given-names>JA</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>KJ</given-names> </name></person-group><article-title>A comparison of multiple imputation methods for missing data in longitudinal studies</article-title><source>BMC Med Res Methodol</source><year>2018</year><month>12</month><day>12</day><volume>18</volume><issue>1</issue><fpage>168</fpage><pub-id pub-id-type="doi">10.1186/s12874-018-0615-6</pub-id><pub-id pub-id-type="medline">30541455</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Braem</surname><given-names>CIR</given-names> </name><name name-style="western"><surname>Yavuz</surname><given-names>US</given-names> </name><name name-style="western"><surname>Hermens</surname><given-names>HJ</given-names> </name><name name-style="western"><surname>Veltink</surname><given-names>PH</given-names> </name></person-group><article-title>Missing data statistics provide causal insights into data loss in diabetes health monitoring by wearable sensors</article-title><source>Sensors (Basel)</source><year>2024</year><month>02</month><day>27</day><volume>24</volume><issue>5</issue><fpage>1526</fpage><pub-id pub-id-type="doi">10.3390/s24051526</pub-id><pub-id pub-id-type="medline">38475061</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weed</surname><given-names>L</given-names> </name><name name-style="western"><surname>Lok</surname><given-names>R</given-names> </name><name name-style="western"><surname>Chawra</surname><given-names>D</given-names> </name><name name-style="western"><surname>Zeitzer</surname><given-names>J</given-names> </name></person-group><article-title>The impact of missing data and imputation methods on the analysis of 24-hour activity patterns</article-title><source>Clocks &#x0026; Sleep</source><year>2022</year><volume>4</volume><issue>4</issue><fpage>497</fpage><lpage>507</lpage><pub-id pub-id-type="doi">10.3390/clockssleep4040039</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Feng</surname><given-names>T</given-names> </name><name name-style="western"><surname>Narayanan</surname><given-names>S</given-names> </name></person-group><article-title>Imputing missing data in large-scale multivariate biomedical wearable recordings using bidirectional recurrent neural networks with temporal activation regularization</article-title><access-date>2026-03-09</access-date><conf-name>2019 41st Annual International Conference of the IEEE Engineering in Medicine and Biology Society (EMBC)</conf-name><conf-date>Jul 23-27, 2019</conf-date><comment><ext-link ext-link-type="uri" xlink:href="https://ieeexplore.ieee.org/document/8856966">https://ieeexplore.ieee.org/document/8856966</ext-link></comment><pub-id pub-id-type="doi">10.1109/EMBC.2019.8856966</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Hoang</surname><given-names>K</given-names> </name><name name-style="western"><surname>Park</surname><given-names>S</given-names> </name><etal/></person-group><article-title>Imputing missing sleep data from wearables with neural networks in real-world settings</article-title><source>Sleep</source><year>2024</year><month>01</month><day>11</day><volume>47</volume><issue>1</issue><fpage>zsad266</fpage><pub-id pub-id-type="doi">10.1093/sleep/zsad266</pub-id><pub-id pub-id-type="medline">37819273</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cho</surname><given-names>S</given-names> </name><name name-style="western"><surname>Weng</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kahn</surname><given-names>MG</given-names> </name><name name-style="western"><surname>Natarajan</surname><given-names>K</given-names> </name></person-group><article-title>Identifying data quality dimensions for person-generated wearable device data: multi-method study</article-title><source>JMIR Mhealth Uhealth</source><year>2021</year><month>12</month><day>23</day><volume>9</volume><issue>12</issue><fpage>e31618</fpage><pub-id pub-id-type="doi">10.2196/31618</pub-id><pub-id pub-id-type="medline">34941540</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hicks</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Althoff</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sosic</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Best practices for analyzing large-scale health data from wearables and smartphone apps</article-title><source>NPJ Digit Med</source><year>2019</year><volume>2</volume><fpage>45</fpage><pub-id pub-id-type="doi">10.1038/s41746-019-0121-1</pub-id><pub-id pub-id-type="medline">31304391</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Matzke</surname><given-names>I</given-names> </name><name name-style="western"><surname>Huhn</surname><given-names>S</given-names> </name><name name-style="western"><surname>Koch</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Assessment of heat exposure and health outcomes in rural populations of western Kenya by using wearable devices: observational case study</article-title><source>JMIR Mhealth Uhealth</source><year>2024</year><month>07</month><day>4</day><volume>12</volume><issue>1</issue><fpage>e54669</fpage><pub-id pub-id-type="doi">10.2196/54669</pub-id><pub-id pub-id-type="medline">38963698</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>McKnight</surname><given-names>PE</given-names> </name><name name-style="western"><surname>McKnight</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Sidani</surname><given-names>S</given-names> </name><name name-style="western"><surname>Figueredo</surname><given-names>AJ</given-names> </name></person-group><source>Missing Data: A Gentle Introduction</source><year>2007</year><access-date>2026-03-09</access-date><publisher-name>Guilford Press</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.guilford.com/books/Missing-Data/McKnight-McKnight-Sidani-Figueredo/9781593853938">https://www.guilford.com/books/Missing-Data/McKnight-McKnight-Sidani-Figueredo/9781593853938</ext-link></comment><pub-id pub-id-type="other">978-1593853938</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Azur</surname><given-names>MJ</given-names> </name><name name-style="western"><surname>Stuart</surname><given-names>EA</given-names> </name><name name-style="western"><surname>Frangakis</surname><given-names>C</given-names> </name><name name-style="western"><surname>Leaf</surname><given-names>PJ</given-names> </name></person-group><article-title>Multiple imputation by chained equations: what is it and how does it work?</article-title><source>Int J Methods Psychiatr Res</source><year>2011</year><month>03</month><volume>20</volume><issue>1</issue><fpage>40</fpage><lpage>49</lpage><pub-id pub-id-type="doi">10.1002/mpr.329</pub-id><pub-id pub-id-type="medline">21499542</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Madley-Dowd</surname><given-names>P</given-names> </name><name name-style="western"><surname>Hughes</surname><given-names>R</given-names> </name><name name-style="western"><surname>Tilling</surname><given-names>K</given-names> </name><name name-style="western"><surname>Heron</surname><given-names>J</given-names> </name></person-group><article-title>The proportion of missing data should not be used to guide decisions on multiple imputation</article-title><source>J Clin Epidemiol</source><year>2019</year><month>06</month><volume>110</volume><fpage>63</fpage><lpage>73</lpage><pub-id pub-id-type="doi">10.1016/j.jclinepi.2019.02.016</pub-id><pub-id pub-id-type="medline">30878639</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fernstad</surname><given-names>SJ</given-names> </name></person-group><article-title>To identify what is not there: a definition of missingness patterns and evaluation of missing value visualization</article-title><source>Inf Vis</source><year>2019</year><month>04</month><volume>18</volume><issue>2</issue><fpage>230</fpage><lpage>250</lpage><pub-id pub-id-type="doi">10.1177/1473871618785387</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Little</surname><given-names>RJA</given-names> </name></person-group><article-title>A test of missing completely at random for multivariate data with missing values</article-title><source>J Am Stat Assoc</source><year>1988</year><month>12</month><volume>83</volume><issue>404</issue><fpage>1198</fpage><lpage>1202</lpage><pub-id pub-id-type="doi">10.1080/01621459.1988.10478722</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fielding</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fayers</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Ramsay</surname><given-names>CR</given-names> </name></person-group><article-title>Investigating the missing data mechanism in quality of life outcomes: a comparison of approaches</article-title><source>Health Qual Life Outcomes</source><year>2009</year><month>06</month><day>22</day><volume>7</volume><fpage>57</fpage><pub-id pub-id-type="doi">10.1186/1477-7525-7-57</pub-id><pub-id pub-id-type="medline">19545408</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sondhi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Weberpals</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yerram</surname><given-names>P</given-names> </name><etal/></person-group><article-title>A systematic approach towards missing lab data in electronic health records: a case study in non-small cell lung cancer and multiple myeloma</article-title><source>CPT Pharmacom Syst Pharma</source><year>2023</year><month>09</month><volume>12</volume><issue>9</issue><fpage>1201</fpage><lpage>1212</lpage><pub-id pub-id-type="doi">10.1002/psp4.12998</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haghayegh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Khoshnevis</surname><given-names>S</given-names> </name><name name-style="western"><surname>Smolensky</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Diller</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Castriotta</surname><given-names>RJ</given-names> </name></person-group><article-title>Accuracy of wristband Fitbit models in assessing sleep: systematic review and meta-analysis</article-title><source>J Med Internet Res</source><year>2019</year><month>11</month><day>28</day><volume>21</volume><issue>11</issue><fpage>e16273</fpage><pub-id pub-id-type="doi">10.2196/16273</pub-id><pub-id pub-id-type="medline">31778122</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Berryhill</surname><given-names>S</given-names> </name><name name-style="western"><surname>Morton</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Dean</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Effect of wearables on sleep in healthy individuals: a randomized crossover trial and validation study</article-title><source>J Clin Sleep Med</source><year>2020</year><month>05</month><day>15</day><volume>16</volume><issue>5</issue><fpage>775</fpage><lpage>783</lpage><pub-id pub-id-type="doi">10.5664/jcsm.8356</pub-id><pub-id pub-id-type="medline">32043961</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Roberts</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Schade</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Mathew</surname><given-names>GM</given-names> </name><name name-style="western"><surname>Gartenberg</surname><given-names>D</given-names> </name><name name-style="western"><surname>Buxton</surname><given-names>OM</given-names> </name></person-group><article-title>Detecting sleep using heart rate and motion data from multisensor consumer-grade wearables, relative to wrist actigraphy and polysomnography</article-title><source>Sleep</source><year>2020</year><month>07</month><day>13</day><volume>43</volume><issue>7</issue><fpage>zsaa045</fpage><pub-id pub-id-type="doi">10.1093/sleep/zsaa045</pub-id><pub-id pub-id-type="medline">32215550</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sathyanarayana</surname><given-names>A</given-names> </name><name name-style="western"><surname>Joty</surname><given-names>S</given-names> </name><name name-style="western"><surname>Fernandez-Luque</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Sleep quality prediction from wearable data using deep learning</article-title><source>JMIR Mhealth Uhealth</source><year>2016</year><month>11</month><day>4</day><volume>4</volume><issue>4</issue><fpage>e125</fpage><pub-id pub-id-type="doi">10.2196/mhealth.6562</pub-id><pub-id pub-id-type="medline">27815231</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Evenson</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Spade</surname><given-names>CL</given-names> </name></person-group><article-title>Review of validity and reliability of Garmin activity trackers</article-title><source>J Meas Phys Behav</source><year>2020</year><month>06</month><volume>3</volume><issue>2</issue><fpage>170</fpage><lpage>185</lpage><pub-id pub-id-type="doi">10.1123/jmpb.2019-0035</pub-id><pub-id pub-id-type="medline">32601613</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schyvens</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Van Oost</surname><given-names>NC</given-names> </name><name name-style="western"><surname>Aerts</surname><given-names>JM</given-names> </name><etal/></person-group><article-title>Accuracy of Fitbit Charge 4, Garmin Vivosmart 4, and WHOOP versus polysomnography: systematic review</article-title><source>JMIR Mhealth Uhealth</source><year>2024</year><month>03</month><day>27</day><volume>12</volume><fpage>e52192</fpage><pub-id pub-id-type="doi">10.2196/52192</pub-id><pub-id pub-id-type="medline">38557808</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grandner</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Lujan</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Ghani</surname><given-names>SB</given-names> </name></person-group><article-title>Sleep-tracking technology in scientific research: looking to the future</article-title><source>Sleep</source><year>2021</year><month>05</month><day>14</day><volume>44</volume><issue>5</issue><fpage>zsab071</fpage><pub-id pub-id-type="doi">10.1093/sleep/zsab071</pub-id><pub-id pub-id-type="medline">33782687</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Enders</surname><given-names>CK</given-names> </name></person-group><source>Applied Missing Data Analysis</source><year>2022</year><access-date>2026-03-09</access-date><edition>2</edition><publisher-name>Guilford Publications</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.guilford.com/books/Applied-Missing-Data-Analysis/Craig-Enders/9781462549863">https://www.guilford.com/books/Applied-Missing-Data-Analysis/Craig-Enders/9781462549863</ext-link></comment><pub-id pub-id-type="other">978-1462549863</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Culbreth</surname><given-names>RE</given-names> </name><name name-style="western"><surname>Nielsen</surname><given-names>KE</given-names> </name><name name-style="western"><surname>Mobley</surname><given-names>K</given-names> </name><name name-style="western"><surname>Palmier</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bukuluki</surname><given-names>P</given-names> </name><name name-style="western"><surname>Swahn</surname><given-names>MH</given-names> </name></person-group><article-title>Life satisfaction factors, stress, and depressive symptoms among young women living in urban Kampala: findings from the TOPOWA Project pilot studies</article-title><source>Int J Environ Res Public Health</source><year>2024</year><month>02</month><day>6</day><volume>21</volume><issue>2</issue><fpage>184</fpage><pub-id pub-id-type="doi">10.3390/ijerph21020184</pub-id><pub-id pub-id-type="medline">38397675</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="web"><article-title>How Garmin watches track your sleep, calculate sleep score</article-title><source>Garmin</source><access-date>2025-06-03</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.garmin.com/en-US/blog/fitness/how-garmin-watches-track-your-sleep-calculate-sleep-score/">https://www.garmin.com/en-US/blog/fitness/how-garmin-watches-track-your-sleep-calculate-sleep-score/</ext-link></comment></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>Z</given-names> </name></person-group><article-title>Missing data exploration: highlighting graphical presentation of missing pattern</article-title><source>Ann Transl Med</source><year>2015</year><month>12</month><volume>3</volume><issue>22</issue><fpage>356</fpage><pub-id pub-id-type="doi">10.3978/j.issn.2305-5839.2015.12.28</pub-id><pub-id pub-id-type="medline">26807411</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grandner</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Jackson</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Izci-Balserak</surname><given-names>B</given-names> </name><etal/></person-group><article-title>Social and behavioral determinants of perceived insufficient sleep</article-title><source>Front Neurol</source><year>2015</year><volume>6</volume><fpage>112</fpage><pub-id pub-id-type="doi">10.3389/fneur.2015.00112</pub-id><pub-id pub-id-type="medline">26097464</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mazloomi</surname><given-names>SN</given-names> </name><name name-style="western"><surname>Talebi</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kazemi</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Food insecurity is associated with the sleep quality and quantity in adults: a systematic review and meta-analysis</article-title><source>Public Health Nutr</source><year>2023</year><month>04</month><volume>26</volume><issue>4</issue><fpage>792</fpage><lpage>802</lpage><pub-id pub-id-type="doi">10.1017/S1368980022002488</pub-id><pub-id pub-id-type="medline">36416108</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Fairclough</surname><given-names>DL</given-names> </name></person-group><source>Design and Analysis of Quality of Life Studies in Clinical Trials</source><year>2002</year><access-date>2026-03-09</access-date><publisher-name>Chapman and Hall/CRC</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.taylorfrancis.com/books/mono/10.1201/9781420035438/design-analysis-quality-life-studies-clinical-trials-diane-fairclough">https://www.taylorfrancis.com/books/mono/10.1201/9781420035438/design-analysis-quality-life-studies-clinical-trials-diane-fairclough</ext-link></comment><pub-id pub-id-type="other">9780429122743</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Karpievitch</surname><given-names>YV</given-names> </name><name name-style="western"><surname>Hill</surname><given-names>EG</given-names> </name><name name-style="western"><surname>Leclerc</surname><given-names>AP</given-names> </name><name name-style="western"><surname>Dabney</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Almeida</surname><given-names>JS</given-names> </name></person-group><article-title>An introspective comparison of random forest-based classifiers for the analysis of cluster-correlated data by way of RF++</article-title><source>PLoS One</source><year>2009</year><month>09</month><day>18</day><volume>4</volume><issue>9</issue><fpage>e7087</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0007087</pub-id><pub-id pub-id-type="medline">19763254</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Hoffman</surname><given-names>L</given-names> </name></person-group><source>Longitudinal Analysis: Modeling within-Person Fluctuation and Change</source><year>2015</year><publisher-name>Routledge</publisher-name><pub-id pub-id-type="doi">10.4324/9781315744094</pub-id><pub-id pub-id-type="other">9781315744094</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ballinger</surname><given-names>GA</given-names> </name></person-group><article-title>Using generalized estimating equations for longitudinal data analysis</article-title><source>Organ Res Methods</source><year>2004</year><month>04</month><volume>7</volume><issue>2</issue><fpage>127</fpage><lpage>150</lpage><pub-id pub-id-type="doi">10.1177/1094428104263672</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jadhav</surname><given-names>A</given-names> </name><name name-style="western"><surname>Pramod</surname><given-names>D</given-names> </name><name name-style="western"><surname>Ramanathan</surname><given-names>K</given-names> </name></person-group><article-title>Comparison of performance of data imputation methods for numeric dataset</article-title><source>Appl Artif Intell</source><year>2019</year><month>08</month><day>24</day><volume>33</volume><issue>10</issue><fpage>913</fpage><lpage>933</lpage><pub-id pub-id-type="doi">10.1080/08839514.2019.1637138</pub-id></nlm-citation></ref></ref-list></back></article>