<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id><journal-id journal-id-type="publisher-id">jmir</journal-id><journal-id journal-id-type="index">1</journal-id><journal-title>Journal of Medical Internet Research</journal-title><abbrev-journal-title>J Med Internet Res</abbrev-journal-title><issn pub-type="epub">1438-8871</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v27i1e72216</article-id><article-id pub-id-type="doi">10.2196/72216</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>At-Home Evaluation of Both Wearable and Touchless Digital Health Technologies for Measuring Nocturnal Scratching in Atopic Dermatitis: Analytical Validation Study</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Avey</surname><given-names>Stefan</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Morris</surname><given-names>Mark</given-names></name><degrees>MBA</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sargsyan</surname><given-names>Davit</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lucas</surname><given-names>Molly V</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>O'Brisky</surname><given-names>Andrea</given-names></name><degrees>BS</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mosca</surname><given-names>Kenneth</given-names></name><degrees>MBA</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Elias</surname><given-names>Andrew</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Fountoulakis</surname><given-names>Nicholas</given-names></name><degrees>BS</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Boukhechba</surname><given-names>Mehdi</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kok</surname><given-names>Xuen Hoong</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Jain</surname><given-names>Saiyam</given-names></name><degrees>BTech</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Oghbaie</surname><given-names>Mehrnoosh</given-names></name><degrees>EMOT, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Manyakov</surname><given-names>Nikolay V</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Wang</surname><given-names>Miao</given-names></name><degrees>MD, PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Aguilar</surname><given-names>Zuleima</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yieh</surname><given-names>Lynn</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib></contrib-group><aff id="aff1"><institution>Johnson &#x0026; Johnson</institution><addr-line>1400 McKean Rd</addr-line><addr-line>Spring House</addr-line><addr-line>PA</addr-line><country>United States</country></aff><aff id="aff2"><institution>Johnson &#x0026; Johnson</institution><addr-line>Raritan</addr-line><addr-line>NJ</addr-line><country>United States</country></aff><aff id="aff3"><institution>Johnson &#x0026; Johnson</institution><addr-line>London</addr-line><country>United Kingdom</country></aff><aff id="aff4"><institution>Johnson &#x0026; Johnson</institution><addr-line>Delhi</addr-line><country>India</country></aff><aff id="aff5"><institution>Johnson &#x0026; Johnson</institution><addr-line>Beerse</addr-line><country>Belgium</country></aff><aff id="aff6"><institution>Johnson &#x0026; Johnson</institution><addr-line>San Diego</addr-line><addr-line>CA</addr-line><country>United States</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Sarvestan</surname><given-names>Javad</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Northcott</surname><given-names>Carrie</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Schopf</surname><given-names>Thomas</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Chen</surname><given-names>Xiaotian</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Stefan Avey, PhD, Johnson &#x0026; Johnson, 1400 McKean Rd, Spring House, PA, 19002, United States, 1 2157937355; <email>savey@its.jnj.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>15</day><month>7</month><year>2025</year></pub-date><volume>27</volume><elocation-id>e72216</elocation-id><history><date date-type="received"><day>05</day><month>02</month><year>2025</year></date><date date-type="rev-recd"><day>24</day><month>04</month><year>2025</year></date><date date-type="accepted"><day>14</day><month>05</month><year>2025</year></date></history><copyright-statement>&#x00A9; Stefan Avey, Mark Morris, Davit Sargsyan, Molly V Lucas, Andrea O'Brisky, Kenneth Mosca, Andrew Elias, Nicholas Fountoulakis, Mehdi Boukhechba, Xuen Hoong Kok, Saiyam Jain, Mehrnoosh Oghbaie, Nikolay V Manyakov, Miao Wang, Zuleima Aguilar, Lynn Yieh. Originally published in the Journal of Medical Internet Research (<ext-link ext-link-type="uri" xlink:href="https://www.jmir.org">https://www.jmir.org</ext-link>), 15.7.2025. </copyright-statement><copyright-year>2025</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research (ISSN 1438-8871), is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://www.jmir.org/">https://www.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://www.jmir.org/2025/1/e72216"/><abstract><sec><title>Background</title><p>The most common symptom of atopic dermatitis (AD) is pruritus, which is often exacerbated at night and leads to nocturnal scratching and sleep disturbance. The quantification of nocturnal scratching provides an objective measure, which could be used as a clinical trial endpoint tracking this AD-related behavior. However, it is not clear how digital health technologies (DHTs) intended to measure scratching perform in the real-world environment of patient homes.</p></sec><sec><title>Objective</title><p>In this study, we present the analytical validation of 2 DHTs: the GENEActiv wristband with Philips sleep and scratch algorithms (&#x201C;Philips&#x201D;) and the Emerald radio frequency touchless sensor (&#x201C;Emerald&#x201D;) to measure nocturnal scratching in adults with AD.</p></sec><sec sec-type="methods"><title>Methods</title><p>Thirty-one participants (15 with moderate AD, 11 with mild AD, and 5 healthy volunteers) were enrolled in the study. Nocturnal scratching was assessed by each DHT in the study participant&#x2019;s home environment over a 4-week observation period. Infrared videos were recorded during sleep twice per week and manually annotated for the intended sleep window (total sleep opportunity [TSO]) and scratching events. Human annotations for sleep and scratch measures were used as a reference for comparison with DHTs (&#x201C;Reference&#x201D;). Estimated TSO was compared for each DHT to Reference using Bland-Altman analysis. Within-night agreement of DHT-predicted scratching events versus the Reference was assessed by sensitivity, precision, and <italic>F</italic><sub>1</sub>-score. Intraclass correlation was used to compare night-level scratch summaries (scratch duration per hour of TSO and scratch frequency per hour of TSO) between each DHT and the Reference.</p></sec><sec sec-type="results"><title>Results</title><p>Characterization of human-annotated scratching revealed a basal level of scratching in both healthy volunteers (13.1 seconds per hour) and in participants with AD on nights when no itch was reported (10.2 seconds per hour). The TSO window was quantified accurately with both DHTs having a mean bias compared with Reference of &#x003C;30 minutes. The within-night agreement with reference to scratch detection performance resulted in <italic>F</italic><sub>1</sub>-scores at the disease group level ranging from 0.51 to 0.68 for the Emerald DHT and 0.47 to 0.56 for the Philips DHT. The night-level agreement of nocturnal scratch duration and frequency with human raters fell mostly in the moderate&#x2014;good range of intraclass correlation coefficients (0.5&#x2010;0.9) in participants with AD and was not significantly lower than the level of agreement between any 2 human raters.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>These results support the analytical validity of both DHTs tested for continuous measurement of nocturnal scratching in individuals with AD in the home environment. Opportunities remain for improving the performance of the DHTs tested, especially in the precision of wrist-worn accelerometer scratch detection, to reach human-level performance. Additional data collection in diverse patient populations will be beneficial for practitioners intending to use or improve these tools for quantifying nocturnal scratching behavior.</p></sec></abstract><kwd-group><kwd>nocturnal scratch</kwd><kwd>scratching</kwd><kwd>itch</kwd><kwd>atopic dermatitis</kwd><kwd>wearable</kwd><kwd>touchless sensor</kwd><kwd>sensor</kwd><kwd>digital health technology</kwd><kwd>analytical validation</kwd><kwd>accelerometer</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Atopic dermatitis (AD) is an inflammatory skin disease that has been reported to affect up to 10% of the adult population [<xref ref-type="bibr" rid="ref1">1</xref>]. The most common symptom is pruritus or itch. Itch is reported to be exacerbated at night [<xref ref-type="bibr" rid="ref2">2</xref>], and the consequent scratching often disrupts sleep and can be accompanied by anxiety, depression, and even suicidal ideation [<xref ref-type="bibr" rid="ref3">3</xref>]. While there are patient-reported outcomes (PROs) to assess pruritus (the sensation of itch), these are not designed to measure the amount of scratching behavior [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Nocturnal scratching, which by definition is an action of rhythmic and repetitive skin contact movement performed during a delimited time period of intended and actual sleep [<xref ref-type="bibr" rid="ref6">6</xref>], is unlikely to be accurately self-reported and has been shown to correlate only weakly with self-reported measures of itch [<xref ref-type="bibr" rid="ref7">7</xref>]. Therefore, an objective measurement of nocturnal scratching would complement a patient-reported measurement of itch in future clinical trials.</p><p>Video recording followed by manual human annotation of scratch events is considered the reference standard for assessment of nocturnal scratching [<xref ref-type="bibr" rid="ref7">7</xref>] and has been used as a research tool for more than 25 years to characterize scratching in AD [<xref ref-type="bibr" rid="ref8">8</xref>,<xref ref-type="bibr" rid="ref9">9</xref>]. However, the privacy implications of collecting video as well as the time-intensive manual annotation process preclude the widespread assessment of nocturnal scratching in clinical trials. Recently, several digital health technologies (DHTs) have been developed that claim to objectively quantify nocturnal scratching, which could help facilitate adoption of nocturnal scratching as an objective and readily measured clinical trial end point [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref18">18</xref>]. The most widely studied type of technology for measuring scratching is actigraphy (wrist-worn accelerometers). Based on previous research, it is well established that actigraphy-based methods have poor sensitivity for detecting finger-dominant scratching or other types of non&#x2013;wrist-driven scratching, such as scratching one leg against the other [<xref ref-type="bibr" rid="ref12">12</xref>]. Recently, touchless sensors have been proposed as a tool for capturing a wider variety of scratching movements without requiring any physical contact with the body. Indeed, touchless sensors using reflections of radio waves have already shown promise in assessing human behaviors such as sleep [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>] and gait [<xref ref-type="bibr" rid="ref21">21</xref>].</p><p>This study builds on existing research in the field that has developed algorithms for detecting nocturnal scratching from either wrist-worn accelerometers or touchless sensors in a clinical setting by showing how they both perform in comparison with video observation in individuals&#x2019; natural sleeping environment. To date, there have been only a few studies that examined the analytical validity of DHT-derived nocturnal scratch measures in a home setting, and these have concentrated on pediatric patients with AD [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>]. In contrast, this study provides independent analytical validation evidence for DHT-derived nocturnal scratch measures in the home environment of adults with AD, using both a wrist-worn wearable and a touchless sensor.</p><p>This analytical validation study was designed to evaluate two DHTs: (1) the GENEActiv wristband with Philips sleep and scratch algorithms (referred to hereafter as &#x201C;Philips&#x201D;) and (2) the Emerald radio frequency (RF)-based sensor with Emerald sleep and scratch algorithms (referred to hereafter as &#x201C;Emerald&#x201D;). The performance of the 2 DHTs to measure nocturnal scratching during the total sleep opportunity (TSO) window was independently compared against human-labeled infrared (IR) camera recording data (referred to hereafter as &#x201C;Reference&#x201D;). The comparison to Reference was done both within nights and on nightly level summaries: normalized scratch frequency (number of scratch bouts per hour of TSO) and normalized scratch duration (seconds of scratch per hour of TSO). We begin by describing the study and patient population, then we characterize the scratch behavior in the patient cohorts, followed by a comparison of the TSO window estimates, then move to comparing scratch classification performance within nights, and finally to comparing the nightly scratch measures between each DHT and Reference.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>The study included an in-clinic screening visit, a screening period of up to 3 weeks, and a 4-week observation period at each participant&#x2019;s home. Clinical scores for characterizing the severity of disease in patients with AD were assessed during the in-clinic screening visit. The in-home portion of the study included a 28-day observation period during which scratching was assessed every night by the Philips and Emerald DHTs (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Study design. Clinician-reported (vIGA-ADTM, EASI, and SCORAD) and 1 patient-reported outcome (peak nocturnal pruritus numeric rating scale) were assessed at the in-person screening visit. The deployment visit on study day 1 consisted of the installation of the touchless sensor, IR camera, and assignment of the wristbands for wrist actigraphy. Nocturnal scratch measures were assessed nightly during the observation period with both the Philips and Emerald DHTs. IR sleep videos were recorded on any 2 nights per week, and video observers labeled sleep and scratch measures. Itch was assessed daily with the Atopic Dermatitis Itch Scale. IR: infrared; PRO: patient-reported outcome.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e72216_fig01.png"/></fig></sec><sec id="s2-2"><title>Study Population</title><p>The study enrolled men and women, aged 18 years and older, with moderate to severe AD, mild AD, or healthy volunteers (HVs). Participants with AD were required to have an established diagnosis for at least 12 months and meet the following key inclusion criteria at screening: patients were eligible for the mild AD cohort if they had a Validated Investigator Global Assessment scale for Atopic Dermatitis (vIGA-AD) score of 2 and &#x2265;3% body surface area of AD involvement; and patients were eligible for the moderate to severe AD cohort if they had a vIGA-AD score of &#x2265;3, &#x2265;10% body surface area of AD involvement, an Eczema Area and Severity Index score of &#x2265;16, and an excoriation component score of &#x003E;0 in at least 1 body region. While patients with moderate to severe AD based on vIGA-AD score were eligible, those enrolled in this cohort all had AD of moderate severity according to vIGA-AD (vIGA-AD score of 3). Therefore, this group of participants is referred to as a &#x201C;Moderate AD cohort.&#x201D; Participants with AD were allowed to continue treatment for AD as long as they were on a stable regimen by the start of the observation period, and topical medications were permitted throughout the study for the treatment of AD flares. HVs were eligible if they were healthy on the basis of medical history at screening, did not have chronic itch, and reported a numeric rating scale (NRS) Peak Nocturnal Itch score of &#x2264;1 (over a 7-day recall period) at screening.</p></sec><sec id="s2-3"><title>Reference Data Generation</title><p>Video recordings during sleep were captured in each participant&#x2019;s home environment using a bespoke IR video camera developed by Emerald Innovations Inc. The camera consisted of an IMX219 8-megapixel sensor and an IR illuminator setup capable of capturing images in 720-pixel resolution at 21 frames per second. The camera was mounted on the wall at the head of the bed about 1 m above the bed surface. Participants were asked to record video during sleep hours for 8 nights over the 4-week observation period (ie, 2 nights per week).</p><p>Videos were masked by blurring faces before subsequent processing and labeling. A computer vision&#x2013;based motion-filtering algorithm trained on historical data was applied to the masked video before human labeling. This algorithm automatically removed video segments containing no motion to reduce the duration of video presented for labeling to the human raters. Random spot checks were performed on video data from each participant to confirm that the motion-filtering algorithm did not inadvertently filter out any participant motion.</p><p>Independent raters watched the videos and provided labels for multiple tasks.</p><p>1. <bold>Scratching bout labeling:</bold> Two independent raters (R1 and R2) watched a video segment and labeled the start and end times of all scratching behavior episodes (defined as &#x201C;any repetitive and rhythmic skin contact movement&#x2014;including through fabric&#x2014;performed with any part of the body&#x201D;). Consensus was reached in the first round if the intersection over union of R1 and R2 annotations exceeded a threshold of 0.765 (empirically chosen based on historical rating data). If consensus was not reached, the video segment was rated by 2 additional raters (R3 and R4) in round 2 and the same consensus threshold was used. If consensus was reached in either round 1 or 2, the intersection of the 2 raters&#x2019; labels within the round reaching consensus was taken as the final Reference. If consensus was still not reached after round 2, a fifth rater (R5) decided on the final scratch labels in round 3. Raters had access to view labels from all previous rounds, but labels were independent within a given round.</p><p>2. <bold>TSO labeling</bold>: Two independent raters (R1 and R2) watched the full night video and determined when the participant got into bed intending to sleep (TSO start) and when the participant got out of bed for the last time, intending to stay awake (TSO end). If the 2 raters in round 1 did not agree (disagreement defined as &#x003E;1-minute difference in either TSO start or TSO end), a third rater with access to labels from round 1 determined the TSO start and end labels.</p></sec><sec id="s2-4"><title>Emerald Data Collection and Scratch Algorithm</title><p>The Emerald system consists of a sensor using frequency-modulated continuous wave radar and antennae arrays to receive reflections from nearby people. The Emerald RF system uses a machine learning algorithm that operates on the data recorded by the Emerald sensor to derive sleep-related metrics [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. It uses a second proprietary machine learning algorithm that operates on the recorded data to derive scratching-related metrics [<xref ref-type="bibr" rid="ref24">24</xref>]. In this study, the RF sensor was installed on the bedroom wall 1.15 m from the floor and not more than 5 m from the participant&#x2019;s bed. Participants in this study agreed to be the only person sleeping in the room with the RF sensor and agreed to keep pets out of the bedroom during the 28-day observation period.</p></sec><sec id="s2-5"><title>Philips Data Collection and Scratch Algorithm</title><p>The GENEActiv Original (ActivInsights) wristband was configured to collect accelerometer data at 20 Hz. Each participant received 2 wristbands on study day 1 and wore both for 14 days. Each participant received a new pair of wristbands around day 14 and shipped the first set back to study sites for data collection. Participants were instructed to wear 1 wristband on the nondominant wrist continuously and the other on the dominant wrist during sleep hours.</p><p>Philips Respironics Rapid Actigraphy Data Analyzer (RADA) algorithms were applied to the raw GENEActiv data to generate sleep and scratch metrics. The RADA scratch algorithm is based on a previously published study [<xref ref-type="bibr" rid="ref12">12</xref>]. Scratches output by the RADA algorithm were characterized as left wrist, right wrist, or both wrists. The analysis of the data was wrist agnostic, and all scratching events were used for analysis.</p></sec><sec id="s2-6"><title>Outcome Definitions</title><p>TSO was defined for the Reference by the human-labeled TSO start and TSO end times from video. TSO was calculated separately for each DHT to emulate how the DHT would be used in a future study (ie, without information from the videos). TSO for the Philips DHT was selected as the major rest period on each night as determined by the RADA algorithms. TSO for the Emerald DHT was calculated as the merged sleep period where multiple sleep periods on the same night with &#x003C;30 minutes gap were merged. Any TSO with a duration of &#x003C;3.5 hours was excluded from the analysis as they were not considered representative of a nightly sleep period. A short, estimated TSO can occur when the true TSO is short, or the estimated TSO is capturing only a portion of the true TSO. The cutoff was set based on the observed data to minimize filtering out any true TSO. The intent of the filter was to automatically detect and remove cases when only a portion of the true TSO was detected (eg, the video was switched on only for a portion of the true TSO). Seven out of 232 Reference nights (3%) were excluded from all analyses due to Reference TSO of &#x003C;3.5 hours. One additional night was excluded when comparing Reference to Philips, and 3 additional nights were excluded when comparing Reference to Emerald due to the respective DHT-derived TSO of &#x003C;3.5 hours. These 11 nights impacted by the TSO filter on nights with Reference data were examined, and in 8 cases, the short TSO is a subset of a longer TSO detected by another method; in 2 cases, the short TSO does not overlap at all with the other methods, and in 1 case, all methods of TSO determination were short. Over all nights recorded by the DHTs, 23 out of 728 nights (3%) were removed for short TSO from Emerald, and 11 out of 635 (2%) nights were removed for short TSO from Philips.</p><p>The 2 primary scratch outcomes analyzed were the scratch duration and the scratch frequency. Before any downstream analysis, individual scratch events were merged and filtered. First, all scratch events with a &#x003C;3-second gap were merged into a single scratching bout. Next, only scratch events of at least 2 seconds in duration (69% of all Reference scratch events) were retained. The same merging and filtering of scratch events were applied to both DHTs and the Reference. A minimum duration of 2 seconds was chosen both because the clinical relevance of very short scratch events is unclear and to allow for fair comparisons since 2 seconds was the minimum duration of scratch predicted by the Philips algorithm [<xref ref-type="bibr" rid="ref12">12</xref>]. In all analyses, scratch duration and frequency were normalized by the duration of the TSO window so that changes in sleep time would not unduly impact the outcomes. The scratch duration is presented in units of seconds of scratch per hour of TSO, while the scratch frequency is presented in units of number of scratch bouts per hour of TSO. Both scratch duration and scratch frequency have right-skewed distributions and are therefore modeled (in intraclass correlation coefficient [ICC] analysis) on a logarithmic scale.</p></sec><sec id="s2-7"><title>Patient-Reported Outcomes</title><p>Atopic Dermatitis Itch Scale was completed in the AD cohort twice daily (morning and evening) to assess both nighttime and daytime itch. The characterization of scratch by itch level was performed using the morning Atopic Dermatitis Itch Scale administration, which asked about worst eczema-related itching last night on a 0&#x2010;10 numeric rating scale. PROs were administered electronically through a mobile phone app. In cases of technical issues with the phones, paper PROs were completed, and responses were entered by the site staff. Only responses with time stamps (electronic or handwritten) between 4 AM and 12 PM were considered valid for the morning administration. In rare cases where multiple responses were recorded on the same day, all responses on that day were excluded from analysis.</p></sec><sec id="s2-8"><title>Statistical Analysis</title><sec id="s2-8-1"><title>Characterization of Nocturnal Scratching Behavior</title><p>Descriptive statistics were used to characterize the scratching behavior in various subgroups of participants (or participant nights). All scratching characterization was done using human-labeled scratching. To summarize scratching behavior at the participant level, first, the night-level metrics were calculated for all nights with labeled scratches. Then, the geometric means were calculated at the participant level for each scratch metric over all nights. Box plots were used to summarize the distribution and medians of the distributions were compared between subgroups. Data were visualized on a linear scale in original units for ease of interpretation.</p></sec><sec id="s2-8-2"><title>Bland-Altman Analysis of TSO</title><p>Bland-Altman analysis was performed accounting for repeated measures using a mixed-effects model. Observations without paired data due to missing data in either Reference or DHT were removed from the analysis, and the number of paired observations (participant nights) is shown in the figures.</p></sec><sec id="s2-8-3"><title>Within-Night Comparison to Reference</title><p>The time period considered for within-night comparison to Reference was the intersection of the TSO between the DHT and the Reference. Nonoverlapping 10-second windows (nonoverlapping 1-second windows for the sensitivity analysis) from all nights and all participants within a cohort were categorized as true positives, false positives, true negatives, or false negatives and combined at the cohort level to generate a confusion matrix and subsequent performance metrics. A window was considered positive for the event if any part of a scratch event overlapped the window. <italic>F</italic><sub>1</sub>-score was defined as the harmonic mean of sensitivity and precision for the positive class (windows containing scratch).</p><p>When comparing <italic>F</italic><sub>1</sub>-score performance by participant characteristics, the variables considered were age, BMI, biological sex, ethnicity (ignoring 2 cases when ethnicity was not reported), race (converted to 2 classes &#x201C;White&#x201D; and &#x201C;non-White&#x201D; due to sample size and ignoring 2 cases where race was not reported), scratch prevalence, total epochs, and power of scratch events (for Philips DHT only). The total epochs are the number of 10-second windows pooled across all nights for each participant. The scratch prevalence is the percentage of the total epochs containing Reference scratch events and is calculated as the sum of true positives and false negatives divided by the total epochs. The power of Philips-predicted scratch events was calculated as the geometric mean of the power (in G) for all events for a given participant before any merging or filtering of scratch events. A 2-sided <italic>t</italic> test was performed for categorical variables, and a Pearson correlation coefficient was estimated for continuous variables. Nominal <italic>P</italic> values were reported.</p></sec><sec id="s2-8-4"><title>Intraclass Correlation Analysis</title><p>ICCs were used to compare night-level metrics between each DHT and human raters. ICCs were estimated using outputs from linear mixed-effects models (function <italic>lmer</italic> from R package <italic>lmerTest</italic> (version 3.1-3 [<xref ref-type="bibr" rid="ref25">25</xref>]) on log-transformed scratch outcomes (normalized scratch frequency and normalized scratch duration) as the response variables, scratch metric source (Philips, Emerald, Reference) as the fixed effect, a random intercept for study participant, and a random intercept for study day nested within participant. Function <italic>icc</italic> (R package <italic>performance</italic> version 0.12.0 [<xref ref-type="bibr" rid="ref26">26</xref>]) was used to calculate ICCs; 95% CIs for the ICC estimates were calculated by taking 500 bootstrap samples. This form of ICC calculation corresponds to &#x201C;Case 3A: Two-way mixed effects model, interaction absent&#x201D; with an absolute agreement definition using the McGraw and Wong convention [<xref ref-type="bibr" rid="ref27">27</xref>].</p></sec></sec><sec id="s2-9"><title>Ethical Considerations</title><p>This clinical study was performed at 6 commercial dermatology clinic sites across the United States between 2022 and 2023. Institutional review board approval was received for the study (WCG institutional review board protocol no 20213992), and all study participants provided informed consent. This study adhered to ethical standards by obtaining informed consent from all participants and ensuring that they received fair compensation for their involvement. Participant privacy and confidentiality were protected as outlined in the informed consent process, and any participant-level data presented in this manuscript are pseudonymized to preserve participant privacy.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Design and Participant Characteristics</title><p>Thirty-one participants enrolled in the study, including 15 with moderate AD, 11 with mild AD, and 5 HVs. Of the 31 participants, 2 participants were excluded for not meeting the inclusion or exclusion criteria (one based on disease severity and another based on change in therapy during the screening period). One additional participant in the moderate AD group was excluded from the analysis due to capture of poor-quality videos that failed spot checks and could not be manually labeled. A schematic overview of the study design is shown in <xref ref-type="fig" rid="figure1">Figure 1</xref>.</p><p>A summary of demographics and disease severity characteristics at baseline for the 28 participants included in the analysis is shown in <xref ref-type="table" rid="table1">Table 1</xref>. Participants ranged in age from 19 to 65 (median 37.5) years. Participants were categorized as having mild AD or moderate AD based on the vIGA-AD. Mean Eczema Area and Severity Index scores for the moderate AD and mild AD groups were 17.54 and 4.63, respectively. Mean SCORing Atopic Dermatitis (SCORAD) values for the moderate AD and mild AD groups were approximately 50 and 36, respectively. Peak nocturnal itch reported on a 0&#x2010;10 NRS was 0 at screening for all HVs and at least 2 for all patients with AD, with a similar median peak nocturnal itch score for the groups with mild and moderate AD (mild AD: 6.0, moderate AD: 5.5).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Summary of demographic and disease characteristics at screening.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Analysis set: per protocol set</td><td align="left" valign="bottom">HVs<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> (n=5)</td><td align="left" valign="bottom">Moderate AD<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup> (n=14)</td><td align="left" valign="bottom">Mild AD (n=9)</td><td align="left" valign="bottom">Total (n=28)</td></tr></thead><tbody><tr><td align="left" valign="top">Age, years</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Mean (SD)</td><td align="left" valign="top">27.20 (9.65)</td><td align="left" valign="top">42.21 (15.39)</td><td align="left" valign="top">43.89 (10.91)</td><td align="left" valign="top">40.07 (14.18)</td></tr><tr><td align="left" valign="top" rowspan="2">&#x2003;Median (range)<break/></td><td align="left" valign="top" rowspan="2">25 (19-42)</td><td align="left" valign="top" rowspan="2">38.5 (21-65)</td><td align="left" valign="top" rowspan="2">47 (28-56)</td><td align="left" valign="top" rowspan="2">37.5 (19-65)</td></tr><tr><td align="left" valign="top">Sex, n (%)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Female</td><td align="left" valign="top">3 (60.00)</td><td align="left" valign="top">9 (64.29)</td><td align="left" valign="top">5 (55.56)</td><td align="left" valign="top">17 (60.71)</td></tr><tr><td align="left" valign="top">&#x2003;Male</td><td align="left" valign="top">2 (40.00)</td><td align="left" valign="top">5 (35.71)</td><td align="left" valign="top">4 (44.44)</td><td align="left" valign="top">11 (39.29)</td></tr><tr><td align="left" valign="top">Race, n (%)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;American Indian/Alaskan Native</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">2 (14.29)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">2 (7.14)</td></tr><tr><td align="left" valign="top">&#x2003;Asian</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">1 (7.14)</td><td align="left" valign="top">1 (11.11)</td><td align="left" valign="top">2 (7.14)</td></tr><tr><td align="left" valign="top">&#x2003;Black/ African American</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">1 (7.14)</td><td align="left" valign="top">2 (22.22)</td><td align="left" valign="top">3 (10.71)</td></tr><tr><td align="left" valign="top">&#x2003;White</td><td align="left" valign="top">5 (100.00)</td><td align="left" valign="top">9 (64.29)</td><td align="left" valign="top">4 (44.44)</td><td align="left" valign="top">18 (64.29)</td></tr><tr><td align="left" valign="top">&#x2003;Multiple</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">1 (11.11)</td><td align="left" valign="top">1 (3.57)</td></tr><tr><td align="left" valign="top">&#x2003;Not reported</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">1 (7.14)</td><td align="left" valign="top">1 (11.11)</td><td align="left" valign="top">2 (7.14)</td></tr><tr><td align="left" valign="top">Ethnicity, n (%)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Hispanic or Latino</td><td align="left" valign="top">3 (60.00)</td><td align="left" valign="top">7 (50.00)</td><td align="left" valign="top">1 (11.11)</td><td align="left" valign="top">11 (39.29)</td></tr><tr><td align="left" valign="top">&#x2003;Non-Hispanic or Latino</td><td align="left" valign="top">2 (40.00)</td><td align="left" valign="top">6 (42.86)</td><td align="left" valign="top">7 (77.78)</td><td align="left" valign="top">15 (53.57)</td></tr><tr><td align="left" valign="top">&#x2003;Not reported</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">1 (7.14)</td><td align="left" valign="top">1 (11.11)</td><td align="left" valign="top">2 (7.14)</td></tr><tr><td align="left" valign="top">NRS<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup> peak nocturnal itch</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Median (range)</td><td align="left" valign="top">0.00 (0.00-0.00)</td><td align="left" valign="top">5.50 (2.00-8.00)</td><td align="left" valign="top">6.00 (2.00-9.00)</td><td align="left" valign="top">5.00 (0.00-9.00)</td></tr><tr><td align="left" valign="top">EASI<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Mean (SD)</td><td align="left" valign="top">N/A<sup><xref ref-type="table-fn" rid="table1fn5">e</xref></sup></td><td align="left" valign="top">17.54 (0.97)</td><td align="left" valign="top">4.63 (2.86)</td><td align="left" valign="top">12.49 (6.71)</td></tr><tr><td align="left" valign="top">&#x2003;Median (range)</td><td align="left" valign="top">N/A (N/A)</td><td align="left" valign="top">17.25 (16.40-20.00)</td><td align="left" valign="top">4.20 (0.60-11.00)</td><td align="left" valign="top">16.80 (0.60-20.00)</td></tr><tr><td align="left" valign="top">&#x2003;IQR<sup><xref ref-type="table-fn" rid="table1fn6">f</xref></sup></td><td align="left" valign="top">N/A</td><td align="left" valign="top">16.92-17.98</td><td align="left" valign="top">3.20-5.00</td><td align="left" valign="top">4.65-17.40</td></tr><tr><td align="left" valign="top">SCORAD<sup><xref ref-type="table-fn" rid="table1fn7">g</xref></sup></td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Mean (SD)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">50.27 (8.21)</td><td align="left" valign="top">35.87 (11.03)</td><td align="left" valign="top">44.63 (11.65)</td></tr><tr><td align="left" valign="top">&#x2003;Median (range)</td><td align="left" valign="top">N/A (N/A)</td><td align="left" valign="top">51.10 (36.50-66.90)</td><td align="left" valign="top">35.00 (18.20-52.60)</td><td align="left" valign="top">47.90 (18.20-66.90)</td></tr><tr><td align="left" valign="top">&#x2003;IQR</td><td align="left" valign="top">N/A</td><td align="left" valign="top">47.23-53.45</td><td align="left" valign="top">32.00-40.80</td><td align="left" valign="top">36.95-52.70</td></tr><tr><td align="left" valign="top">vIGA-AD<sup><xref ref-type="table-fn" rid="table1fn8">h</xref></sup>, n (%)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Clear (0)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td></tr><tr><td align="left" valign="top">&#x2003;Almost clear (1)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td></tr><tr><td align="left" valign="top">&#x2003;Mild (2)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">9 (100.00)</td><td align="left" valign="top">9 (39.13)</td></tr><tr><td align="left" valign="top">&#x2003;Moderate (3)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">14 (100.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">14 (60.87)</td></tr><tr><td align="left" valign="top">&#x2003;Severe (4)</td><td align="left" valign="top">N/A</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td><td align="left" valign="top">0 (0.00)</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>HVs: healthy volunteers.</p></fn><fn id="table1fn2"><p><sup>b</sup>AD: atopic dermatitis.</p></fn><fn id="table1fn3"><p><sup>c</sup>NRS: numeric rating scale.</p></fn><fn id="table1fn4"><p><sup>d</sup>EASI: Eczema Area and Severity Index.</p></fn><fn id="table1fn5"><p><sup>e</sup>N/A: not applicable.</p></fn><fn id="table1fn6"><p><sup>f</sup>IQR: interquartile range.</p></fn><fn id="table1fn7"><p><sup>g</sup>SCORAD: SCORing Atopic Dermatitis.</p></fn><fn id="table1fn8"><p><sup>h</sup>vIGA-AD: Validated Investigator Global Assessment scale for Atopic Dermatitis.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>Characterization of Nocturnal Scratching Behavior</title><p>To define a nocturnal scratch outcome, it was first necessary to determine the time window during which scratching was to be measured. Following the terminology used in previous research, we call this window of intended sleep the TSO [<xref ref-type="bibr" rid="ref10">10</xref>]. The TSO windows for the Reference were manually annotated and defined to start when the participant got into the bed intending to sleep and defined to end when the participant got out of the bed intending to stay awake.</p><p>Nightly scratch measures (normalized scratch duration and normalized scratch frequency) as defined in the Reference were characterized by disease severity and patient-reported itch in <xref ref-type="fig" rid="figure2">Figure 2</xref>. The median frequency and duration of nighttime scratching increase with AD disease severity from HVs (2.4 bouts per hour, 13.1 seconds per hour) to mild AD (3.51 bouts per hour, 17.4 seconds per hour) to moderate AD (4.64 bouts per hour, 30.0 seconds per hour); however, the ranges are highly overlapping between all 3 cohorts (<xref ref-type="fig" rid="figure2">Figures 2A and B</xref>). Scratching was also characterized by SCORAD severity since this is a frequently used scoring system in AD. Similarly to cohort, there is a trend of increasing median nocturnal scratch frequency and duration with increasing severity of SCORAD but highly overlapping ranges (<xref ref-type="fig" rid="figure2">Figures 2C and D</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Characterization of human-labeled scratching behavior by disease severity and patient-reported itch. Distribution of normalized scratch frequency (scratch bouts per hour; left column) and normalized scratch duration (scratch seconds per hour; right column) are shown. Participant level average (<bold>A</bold>) scratch frequency and (<bold>B</bold>) scratch duration by cohort. Participant level average (<bold>C</bold>) scratch frequency and (<bold>D</bold>) scratch duration by SCORAD severity within the AD cohort only. Participant-night level (<bold>E</bold>) scratch frequency and (<bold>F</bold>) scratch duration by peak nighttime itch NRS obtained via the Atopic Dermatitis Itch Scale morning administration within the AD cohort only. Box plots show the IQR of the distribution. Bold horizontal lines within the box show the median. Whiskers show the maximum and minimum values after excluding any outliers. The box plot is overlaid with all observed data. AD: atopic dermatitis; ADIS: Atopic Dermatitis Itch Scale; HV: healthy volunteer; NRS: numeric rating scale; SCORAD: SCORing Atopic Dermatitis; TSO: total sleep opportunity.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e72216_fig02.png"/></fig><p>Finally, we investigated how the reference nocturnal scratch frequency and duration compared on nights when participants reported no itch, mild itch, moderate itch, or severe itch (<xref ref-type="fig" rid="figure2">Figures 2E and F</xref>). In this cross-sectional analysis, when AD study participants reported in the morning that the previous night had no itch, the scratching was dramatically lower (but not zero) than when any itch was reported. Median scratch frequency on nights with no itch was 2.37 bouts per hour versus 4.5 bouts per hour with mild itch and 4.64 bouts per hour with moderate itch. The trend did not hold for severe itch, which had the lowest number of nights and fell in between the levels of no itch and mild itch with a median of 3.68 bouts per hour. Similar trends were observed for nocturnal scratch duration with 10.2 seconds per hour in no itch, 26.7 seconds per hour in mild itch, 26.5 seconds per hour in moderate itch, and 17.8 seconds per hour in severe itch.</p></sec><sec id="s3-3"><title>TSO Agreement With Reference</title><p>After characterizing the scratching behavior with the human-labeled reference, we began to assess the agreement of the DHT-derived measures with the Reference. First, we assessed the level of agreement between TSO derived from Philips versus Reference and from Emerald versus Reference with a Bland-Altman analysis (<xref ref-type="fig" rid="figure3">Figures 3A and B</xref>). The average bias in TSO in the home environment was less than half an hour for both DHTs with bias (lower and upper 95% limits of agreement) estimates of 0.42 hours (&#x2212;2.18 hours and 3.02 hours) for Philips and 0.44 hours (&#x2212;1.85 hours and 2.73 hours) for Emerald.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Bland-Altman plots of TSO duration. Bland-Altman plots for (<bold>A</bold>) Philips versus Reference and (<bold>B</bold>) Emerald versus Reference. Each point represents a single night from 1 participant. Cohorts are represented by different colors. The solid black horizontal line is the bias, and the long dashed horizontal lines are the 95% LLOA and ULOA. The short dashed horizontal lines are the 95% CI lower and upper bounds for the bias and the 95% limits of agreement. AD: atopic dermatitis; HV: healthy volunteer; LLOA: lower limit of agreement; TSO: total sleep opportunity; ULOA: upper limit of agreement.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e72216_fig03.png"/></fig></sec><sec id="s3-4"><title>Within-Night Scratch Detection Performance</title><p>Next, we assessed the level of agreement in scratch classification between each DHT and the Reference for all 10-second windows. The time period considered for the evaluation was the intersection of the TSO between the Reference and the corresponding DHT to avoid ambiguous cases where scratch labels were missing. All time windows within the TSO intersections were considered, and no balancing of the scratch and nonscratch windows was performed. In the moderate AD group, an <italic>F</italic><sub>1</sub>-score of 0.64 was achieved for Emerald and 0.43 for Philips (<xref ref-type="table" rid="table2">Table 2</xref>). Overall, the performance of the Emerald DHT, as measured by <italic>F</italic><sub>1</sub>-score, was noticeably higher than that of the Philips DHT in each cohort. The difference in <italic>F</italic><sub>1</sub>-scores was mainly due to the lower precision (0.29&#x2010;0.36) of the Philips algorithm, indicating that many false-positive scratching events were identified.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Sensitivity, precision, <italic>F</italic><sub>1</sub>-score, and balanced accuracy to detect scratching events on 10-second windows compared to the Reference.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom"/><td align="left" valign="bottom">Emerald</td><td align="left" valign="bottom">Philips</td></tr></thead><tbody><tr><td align="left" valign="top">HVs<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;N (participants)</td><td align="left" valign="top">5</td><td align="left" valign="top">5</td></tr><tr><td align="left" valign="top">&#x2003;N (participant nights)</td><td align="left" valign="top">46</td><td align="left" valign="top">45</td></tr><tr><td align="left" valign="top">&#x2003;Sensitivity</td><td align="left" valign="top">0.52</td><td align="left" valign="top">0.69</td></tr><tr><td align="left" valign="top">&#x2003;Precision</td><td align="left" valign="top">0.61</td><td align="left" valign="top">0.44</td></tr><tr><td align="left" valign="top">&#x2003;<italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.56</td><td align="left" valign="top">0.54</td></tr><tr><td align="left" valign="top">&#x2003;Balanced accuracy</td><td align="left" valign="top">0.76</td><td align="left" valign="top">0.84</td></tr><tr><td align="left" valign="top">Mild AD<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;N (participants)</td><td align="left" valign="top">9</td><td align="left" valign="top">9</td></tr><tr><td align="left" valign="top">&#x2003;N (participant nights)</td><td align="left" valign="top">76</td><td align="left" valign="top">73</td></tr><tr><td align="left" valign="top">&#x2003;Sensitivity</td><td align="left" valign="top">0.54</td><td align="left" valign="top">0.62</td></tr><tr><td align="left" valign="top">&#x2003;Precision</td><td align="left" valign="top">0.49</td><td align="left" valign="top">0.38</td></tr><tr><td align="left" valign="top">&#x2003;<italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.51</td><td align="left" valign="top">0.47</td></tr><tr><td align="left" valign="top">&#x2003;Balanced accuracy</td><td align="left" valign="top">0.76</td><td align="left" valign="top">0.80</td></tr><tr><td align="left" valign="top">Moderate AD</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;N (participants)</td><td align="left" valign="top">14</td><td align="left" valign="top">14</td></tr><tr><td align="left" valign="top">&#x2003;N (participant nights)</td><td align="left" valign="top">98</td><td align="left" valign="top">74</td></tr><tr><td align="left" valign="top">&#x2003;Sensitivity</td><td align="left" valign="top">0.71</td><td align="left" valign="top">0.72</td></tr><tr><td align="left" valign="top">&#x2003;Precision</td><td align="left" valign="top">0.66</td><td align="left" valign="top">0.46</td></tr><tr><td align="left" valign="top">&#x2003;<italic>F</italic><sub>1</sub>-score</td><td align="left" valign="top">0.68</td><td align="left" valign="top">0.56</td></tr><tr><td align="left" valign="top">&#x2003;Balanced accuracy</td><td align="left" valign="top">0.85</td><td align="left" valign="top">0.85</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>HVs: healthy volunteers.</p></fn><fn id="table2fn2"><p><sup>b</sup>AD: atopic dermatitis.</p></fn></table-wrap-foot></table-wrap><p>To better understand the behaviors leading to false-positive scratch prediction with the Philips algorithm, we sampled 2 nights from each study participant and watched the videos during the false-positive event to identify which nonscratch movements were contributing to false-positive scratch predictions. We found that the main nonscratch movements incorrectly classified as scratch were body repositioning within the bed, mobile phone usage, and movement associated with entering or exiting the bed.</p><p>A more detailed listing of performance metrics by participant is shown in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. A 10-second window size was chosen for this analysis of within-night performance to mitigate any misalignment of scratch events resulting from incomplete clock synchronization between DHTs and video. A sensitivity analysis showing the performance metrics with 1-second windows is shown in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>. Overall, the trends observed with 10-second windows are consistent with 1-second windows, but the performance metrics are generally lower.</p><p>Because of the wide range of participant-level <italic>F</italic><sub>1</sub>-scores observed (ranging from 0.13 to 0.85), we investigated whether any participant characteristics were associated with <italic>F</italic><sub>1</sub>-scores (<xref ref-type="supplementary-material" rid="app3">Multimedia Appendix 3</xref>). We found that the strongest factor associated with <italic>F</italic><sub>1</sub>-score was the scratch prevalence that varied between 0.5% and 4.5% when pooling all epochs at the participant level. Scratch prevalence was strongly positively correlated with <italic>F</italic><sub>1</sub>-score for both Philips (<italic>r</italic>=0.82; <italic>P</italic>&#x003C;.001) and Emerald (<italic>r</italic>=0.59; <italic>P</italic>=.001) DHTs. Ethnicity was the next most associated variable with <italic>F</italic><sub>1</sub>-score in this dataset, with non-Hispanic or non-Latino participants having an average <italic>F</italic><sub>1</sub>-score 0.17 lower than Hispanic or Latino participants (Philips: <italic>P</italic>=.004, Emerald: <italic>P</italic>=.01). However, upon closer inspection of the variables&#x2019; correlation structure, it was noted that ethnicity is associated with prevalence in this dataset, which is likely driving the observed association. We also identified a significant correlation between the participants&#x2019; geometric mean power of scratch events (in G) and the <italic>F</italic><sub>1</sub>-score for the Philips DHT (<italic>r</italic>=0.43; <italic>P</italic>=.02). Additionally, a negative correlation was observed between participant age and <italic>F</italic><sub>1</sub>-score (Philips: <italic>r</italic>=&#x2212;0.39, <italic>P</italic>=.04; Emerald: <italic>r</italic>=&#x2212;0.41, <italic>P</italic>=.03). Participant age was found to be negatively correlated with the power of scratching events, which may be partly mediating the association with age.</p></sec><sec id="s3-5"><title>Agreement of Nightly Scratch Measures With Reference</title><p>The level of agreement in nocturnal scratch measures between each DHT and Reference on a nightly level is shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>. The points were largely distributed along the identity line, indicating that the predicted nocturnal scratch frequency and nocturnal scratch duration were similar to the reference. Philips scratch predictions had a higher false-positive rate, resulting in overestimation of both nocturnal scratch frequency and duration as observed in <xref ref-type="fig" rid="figure4">Figures 4A and 4C</xref>. Emerald scratch predictions fall more evenly about the identity line, indicating lower bias as observed in <xref ref-type="fig" rid="figure4">Figures 4B and 4D</xref>.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Scatter plots of night-level scratch metrics in each DHT versus Reference. Normalized scratch frequency of Philips versus Reference (<bold>A</bold>) and Emerald versus Reference (<bold>B</bold>). Normalized scratch duration of Philips versus Reference (<bold>C</bold>) and Emerald versus Reference (<bold>D</bold>). Solid blue lines show the line of best fit from mixed-effects linear regression models, and dashed black lines show the identity line (y=x). The plotted values are the normalized scratch durations and normalized scratch frequencies. Each point represents observed scratching from 1 participant night. The x-axis and y-axis use a log-transformed scale with tick labels shown on the original scale. Each point is colored according to the study cohort. AD: atopic dermatitis; HV: healthy volunteer; TSO: total sleep opportunity.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e72216_fig04.png"/></fig><p>The primary hypothesis of this study was that the nocturnal scratch metrics estimated from DHTs would be comparable with nocturnal scratch metrics assessed by human-labeled IR video. However, to our knowledge, the level of human agreement expected between human raters for this task had not been characterized in the literature and thus was unknown to us at the start of the study. Therefore, we used a rigorous human labeling approach where every night of video was first split into motion and nonmotion periods, and then every motion period was independently labeled by at least 2 human raters for scratching. To quantify the level of agreement between methods, the ICC was used as a measure of interrater reliability.</p><p>Interrater reliability estimates comparing 2 human raters fell in the &#x201C;good&#x201D; to &#x201C;excellent&#x201D; range (95% CI lower bound &#x003E;0.75) for HVs and the &#x201C;moderate&#x201D; to &#x201C;good&#x201D; range (95% CI lower bound 0.5&#x2010;0.9) for patients with AD [<xref ref-type="bibr" rid="ref28">28</xref>] (<xref ref-type="fig" rid="figure5">Figure 5</xref>). In all cohorts, the 95% CIs for DHT versus human rater and human rater versus human rater ICCs overlapped, indicating noninferiority. The noninferior ICC estimates for both Philips and Emerald indicate that DHT estimates of normalized scratch duration and frequency are comparable with human raters.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>ICC estimates showing agreement between 2 human raters and between each digital health technology and a human rater. Dots show the ICC point estimates and whiskers show the 95% CIs. Note that rater 1 values are missing for normalized scratch frequency in the moderate AD cohort due to nonconvergence of the model. AD: atopic dermatitis; HV: healthy volunteer; ICC: intraclass correlation.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="jmir_v27i1e72216_fig05.png"/></fig></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Results and Comparison With Prior Work</title><p>We conducted an analytical validation study of both a wearable sensor and a touchless sensor, and corresponding algorithms, for the ability to correctly identify nocturnal scratching events in adults with AD, while participants were sleeping at home. We found that the intended sleep window (TSO) can be reliably estimated with both DHTs. The TSO determination for both the Philips DHT and the Emerald DHT was in the range previously reported in a sleep clinic (&#x003C;30 minutes mean bias) [<xref ref-type="bibr" rid="ref10">10</xref>]. The sensitivity of scratch classification performance was higher with the Philips DHT, whereas the precision was higher with the Emerald DHT. Overall, the <italic>F</italic><sub>1</sub>-score was higher with the Emerald DHT (ranging from 0.51 to 0.68) than with the Philips DHT (ranging from 0.47 to 0.56). The Philips algorithm was found to be oversensitive, falsely identifying movements as scratch events during nonscratch participant motion. Participant-level <italic>F</italic><sub>1</sub>-scores varied widely from 0.13 to 0.85, and this was highly associated with the scratch prevalence&#x2014;participants having a higher scratch prevalence generally achieved a higher <italic>F</italic><sub>1</sub>-score for both Emerald and Philips DHT. Other weaker associations identified with the participant-level <italic>F</italic><sub>1</sub>-scores (accelerometer power, ethnicity, and age) should be interpreted cautiously due to the limited sample size.</p><p>While the <italic>F</italic><sub>1</sub>-scores in this study were lower than those previously reported for these DHTs [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref24">24</xref>], this was expected due to several factors. First, the dataset used was previously unseen by the algorithms tested, whereas previous studies tested an algorithm that was developed on the same dataset. Second, the study execution was made as &#x201C;real-world&#x201D; as possible with all data collected in the participants&#x2019; homes. Additionally, the comparison with reference to generate <italic>F</italic><sub>1</sub>-scores was performed on all windows, without first balancing scratch and nonscratch events, which was shown to have a large impact on <italic>F</italic><sub>1</sub>-score [<xref ref-type="bibr" rid="ref11">11</xref>]. Finally, we have shown that <italic>F</italic><sub>1</sub>-score is influenced by scratch prevalence, which makes it difficult to compare results across studies without accounting for differences in the scratch prevalence between study populations.</p><p>Importantly, we quantified the interrater agreement for the nightly scratch summary measures and found that the performance of both DHTs and human raters was noninferior to how 2 independent human raters performed when compared with each other. The mean level of human interrater agreement for nocturnal scratch duration and nocturnal scratch frequency was approximately 0.75 for both mild and moderate AD groups. This finding provides a ceiling for the maximal level of agreement expected between DHT and human raters. Our results show that current DHTs are close to, but do not reach, this ceiling of agreement between 2 human raters. Future work should investigate whether improved nocturnal scratching algorithms trained on additional datasets could reach the level of agreement of 2 human raters. Algorithm development should seek to minimize false positives from nonscratch movements.</p><p>When characterizing human-labeled scratch measures, we noted that nocturnal scratching was also observed in HVs in this study. While previous studies have generally found little to no scratching among HVs as assessed by video monitoring [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], recent results from other studies of nocturnal scratching hint that even HVs may scratch during the night [<xref ref-type="bibr" rid="ref29">29</xref>]. We also found that nocturnal scratch duration and frequency were similar between mild AD and moderate AD cohorts in this study. Previous work has also shown overlapping ranges between mild and moderate AD without finding a significant relationship in the total scratching time as a percentage of the total recording [<xref ref-type="bibr" rid="ref9">9</xref>]. Converting the metric used in <xref ref-type="fig" rid="figure1">Figure 1</xref> of Ebata et al [<xref ref-type="bibr" rid="ref9">9</xref>] into normalized scratch duration as we define it would lead to a median estimate of normalized scratching duration of &#x003C;36 seconds per hour in mild AD and 216 seconds per hour in moderate AD. Therefore, it is possible that our study tended to recruit people who scratch less than a typical patient with moderate AD. Notably, the similarity in mild AD and moderate AD scratch was also mirrored in the self-reported itch NRS at screening, which had a similar range and median value in both cohorts (<xref ref-type="table" rid="table1">Table 1</xref>). Future work may further elucidate whether there are differences in the characteristics (eg, intensity, distribution by sleep stage, and timing) of scratching between patients with AD of varying severities or between patients with AD as a whole and, otherwise, healthy individuals reporting no pruritus.</p></sec><sec id="s4-2"><title>Limitations</title><p>This study has a few limitations to be considered. The number of participants analyzed (n=28) was relatively small since it was chosen to be powered primarily for the analysis of ICC estimation in patients with moderate AD. Still, the sample size is comparable with other studies of nocturnal scratching [<xref ref-type="bibr" rid="ref10">10</xref>-<xref ref-type="bibr" rid="ref12">12</xref>], and this study was unique in that rather than 1 or 2 nights of collected IR video, participants collected, on average, 8 nights of IR video over the 4-week observation period. The study also had a limited sample size to investigate the performance of the scratch algorithms in subgroups (eg, by age or race). While associations with <italic>F</italic><sub>1</sub>-scores were performed, additional data are necessary to reach a conclusion about scratch performance in any subgroups. Future work should test these tools in a more diverse population to ensure that performance is acceptable in a representative sample of the targeted population. This study has another limitation tied to the collection of video data in the home. An intentional choice was made to give the study participants full control over the IR video recording, allowing them to turn it on and off at will. This could result in some degree of bias in the determination of the reference TSO window because it is possible that participants recorded video only for part of the true TSO window. Anecdotal evidence from DHT-derived sleep windows suggests that on some nights, the camera may have been turned off before the end of the sleep period, leading to a bias in the Reference TSO duration. To mitigate the impact of this bias, short estimated TSO windows (&#x003C;3.5 hours) were excluded from the analysis. Overall, the net benefits of performing the study in the home (less participant burden and a natural sleeping environment) outweigh any potential drawbacks in capturing the TSO.</p><p>While our intent was to enroll patients with a broad range of disease severity, no patients with AD with severe disease according to vIGA-AD enrolled in our study. This is due, in part, to the requirements for having a stable regimen of systemic treatment for at least 4 weeks prior to study screening and no changes in treatment during the 4-week study, which made it difficult to recruit participants with severe disease. Notably, when classifying the study participants according to SCORAD, there are 9 participants considered severe (total score of &#x003E;50). Future analytical validation studies may consider modifying the inclusion criteria to recruit participants with a broader range of AD severity.</p><p>Results from the Emerald DHT are promising; however, data in this study were collected with strict lifestyle restrictions. Namely, participants were required to sleep without any other people or pets in the bedroom due to the requirements of current algorithms for detecting scratching. Future work should focus on algorithmic solutions to the problem of detecting scratching in a single individual while not sleeping alone to enable scaling this technology for more widespread clinical trial use.</p></sec><sec id="s4-3"><title>Conclusions</title><p>Our results support the analytical validity of both DHTs tested for continuous measurement of nocturnal scratching in the home environment. The most supportive finding is the noninferior performance of both the Emerald DHT and Philips DHT compared with human labelers. Opportunities remain for improving the performance of the DHTs tested, especially in the precision of wrist-worn accelerometer scratch detection, to reach human-level performance. Nevertheless, ultimately the use of measuring nocturnal scratching as an efficacy end point for clinical trials is dependent not on perfect agreement with the reference but rather on detecting clinically meaningful changes in scratching behavior in patients. Therefore, current tools may be fit-for-purpose to generate clinical trial end points depending on their intended use and the magnitude of the treatment effect on specific nocturnal scratch end points. Practitioners who would like to use these tools may consider collecting additional data on diverse samples to better understand scratching behavior in the context of natural history studies or interventional studies where treatment effects on scratching behavior can be assessed.</p></sec></sec></body><back><ack><p>The authors would like to thank all study participants, investigators, and study site staff for their contributions to the study. The authors would also like to acknowledge the Emerald team for providing valuable advice. This study was sponsored by Johnson &#x0026; Johnson.</p></ack><notes><sec><title>Data Availability</title><p>The data-sharing policy of Johnson &#x0026; Johnson is available on the web [<xref ref-type="bibr" rid="ref30">30</xref>]. As noted on this site, requests for access to the study data can be submitted through the Yale Open Data Access (YODA) Project site [<xref ref-type="bibr" rid="ref31">31</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>SA, MM, AE, NF, and LY contributed to conceptualization. SA and SJ contributed to data curation. SA, DS, MB, MO, and XHK did the formal analysis. SA, DS, and MO performed the visualization. LY and MW contributed to project administration. NM, KM, and ZA performed supervision. SA contributed to writing&#x2014;original draft. All authors contributed to writing&#x2014;review and editing.</p></fn><fn fn-type="conflict"><p>At the time of the study, all authors were employed by Johnson &#x0026; Johnson and may hold company stock.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AD</term><def><p>atopic dermatitis</p></def></def-item><def-item><term id="abb2">DHT</term><def><p>digital health technology</p></def></def-item><def-item><term id="abb3">HV</term><def><p>healthy volunteer</p></def></def-item><def-item><term id="abb4">ICC</term><def><p>intraclass correlation coefficient</p></def></def-item><def-item><term id="abb5">IR</term><def><p>infrared</p></def></def-item><def-item><term id="abb6">NRS</term><def><p>numeric rating scale</p></def></def-item><def-item><term id="abb7">PRO</term><def><p>patient-reported outcome</p></def></def-item><def-item><term id="abb8">RADA</term><def><p>Rapid Actigraphy Data Analyzer</p></def></def-item><def-item><term id="abb9">RF</term><def><p>radio frequency</p></def></def-item><def-item><term id="abb10">SCORAD</term><def><p>SCORing Atopic Dermatitis</p></def></def-item><def-item><term id="abb11">TSO</term><def><p>total sleep opportunity</p></def></def-item><def-item><term id="abb12">vIGA-AD</term><def><p>Validated Investigator Global Assessment scale for Atopic Dermatitis</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bieber</surname><given-names>T</given-names> </name></person-group><article-title>Atopic dermatitis</article-title><source>N Engl J Med</source><year>2008</year><month>04</month><day>3</day><volume>358</volume><issue>14</issue><fpage>1483</fpage><lpage>1494</lpage><pub-id pub-id-type="doi">10.1056/NEJMra074081</pub-id><pub-id pub-id-type="medline">18385500</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Patel</surname><given-names>T</given-names> </name><name name-style="western"><surname>Ishiuji</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Yosipovitch</surname><given-names>G</given-names> </name></person-group><article-title>Nocturnal itch: why do we itch at night?</article-title><source>Acta Derm Venereol</source><year>2007</year><volume>87</volume><issue>4</issue><fpage>295</fpage><lpage>298</lpage><pub-id pub-id-type="doi">10.2340/00015555-0280</pub-id><pub-id pub-id-type="medline">17598030</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cesnakova</surname><given-names>L</given-names> </name><name name-style="western"><surname>Meadows</surname><given-names>K</given-names> </name><name name-style="western"><surname>Avey</surname><given-names>S</given-names> </name><etal/></person-group><article-title>A patient-centred conceptual model of nocturnal scratch and its impact in atopic dermatitis: a mixed-methods study supporting the development of novel digital measurements</article-title><source>Skin Health Dis</source><year>2023</year><month>10</month><volume>3</volume><issue>5</issue><fpage>e262</fpage><pub-id pub-id-type="doi">10.1002/ski2.262</pub-id><pub-id pub-id-type="medline">37799371</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Charman</surname><given-names>CR</given-names> </name><name name-style="western"><surname>Venn</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Williams</surname><given-names>HC</given-names> </name></person-group><article-title>The patient-oriented eczema measure: development and initial validation of a new tool for measuring atopic eczema severity from the patients&#x2019; perspective</article-title><source>Arch Dermatol</source><year>2004</year><month>12</month><volume>140</volume><issue>12</issue><fpage>1513</fpage><lpage>1519</lpage><pub-id pub-id-type="doi">10.1001/archderm.140.12.1513</pub-id><pub-id pub-id-type="medline">15611432</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Topp</surname><given-names>J</given-names> </name><name name-style="western"><surname>Apfelbacher</surname><given-names>C</given-names> </name><name name-style="western"><surname>St&#x00E4;nder</surname><given-names>S</given-names> </name><name name-style="western"><surname>Augustin</surname><given-names>M</given-names> </name><name name-style="western"><surname>Blome</surname><given-names>C</given-names> </name></person-group><article-title>Measurement properties of patient-reported outcome measures for pruritus: an updated systematic review</article-title><source>J Invest Dermatol</source><year>2022</year><month>02</month><volume>142</volume><issue>2</issue><fpage>343</fpage><lpage>354</lpage><pub-id pub-id-type="doi">10.1016/j.jid.2021.06.032</pub-id><pub-id pub-id-type="medline">34339743</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ke Wang</surname><given-names>W</given-names> </name><name name-style="western"><surname>Cesnakova</surname><given-names>L</given-names> </name><name name-style="western"><surname>Goldsack</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Dunn</surname><given-names>J</given-names> </name></person-group><article-title>Defining the digital measurement of scratching during sleep or nocturnal scratching: review of the literature</article-title><source>J Med Internet Res</source><year>2023</year><month>04</month><day>18</day><volume>25</volume><fpage>e43617</fpage><pub-id pub-id-type="doi">10.2196/43617</pub-id><pub-id pub-id-type="medline">37071460</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Nguyen</surname><given-names>M</given-names> </name><name name-style="western"><surname>Li</surname><given-names>AW</given-names> </name><etal/></person-group><article-title>Use of technology for the objective evaluation of scratching behavior: a systematic review</article-title><source>JAAD Int</source><year>2021</year><month>12</month><volume>5</volume><fpage>19</fpage><lpage>32</lpage><pub-id pub-id-type="doi">10.1016/j.jdin.2021.06.005</pub-id><pub-id pub-id-type="medline">34816131</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ebata</surname><given-names>T</given-names> </name><name name-style="western"><surname>Aizawa</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kamide</surname><given-names>R</given-names> </name></person-group><article-title>An infrared video camera system to observe nocturnal scratching in atopic dermatitis patients</article-title><source>J Dermatol</source><year>1996</year><month>03</month><volume>23</volume><issue>3</issue><fpage>153</fpage><lpage>155</lpage><pub-id pub-id-type="doi">10.1111/j.1346-8138.1996.tb03990.x</pub-id><pub-id pub-id-type="medline">8935624</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ebata</surname><given-names>T</given-names> </name><name name-style="western"><surname>Aizawa</surname><given-names>H</given-names> </name><name name-style="western"><surname>Kamide</surname><given-names>R</given-names> </name><name name-style="western"><surname>Niimura</surname><given-names>M</given-names> </name></person-group><article-title>The characteristics of nocturnal scratching in adults with atopic dermatitis</article-title><source>Br J Dermatol</source><year>1999</year><month>07</month><volume>141</volume><issue>1</issue><fpage>82</fpage><lpage>86</lpage><pub-id pub-id-type="doi">10.1046/j.1365-2133.1999.02924.x</pub-id><pub-id pub-id-type="medline">10417519</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mahadevan</surname><given-names>N</given-names> </name><name name-style="western"><surname>Christakis</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Di</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Development of digital measures for nighttime scratch and sleep using wrist-worn wearable devices</article-title><source>NPJ Digit Med</source><year>2021</year><month>03</month><day>3</day><volume>4</volume><issue>1</issue><fpage>42</fpage><pub-id pub-id-type="doi">10.1038/s41746-021-00402-x</pub-id><pub-id pub-id-type="medline">33658610</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ji</surname><given-names>J</given-names> </name><name name-style="western"><surname>Venderley</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Assessing nocturnal scratch with actigraphy in atopic dermatitis patients</article-title><source>NPJ Digit Med</source><year>2023</year><month>04</month><day>26</day><volume>6</volume><issue>1</issue><fpage>72</fpage><pub-id pub-id-type="doi">10.1038/s41746-023-00821-y</pub-id><pub-id pub-id-type="medline">37100893</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Moreau</surname><given-names>A</given-names> </name><name name-style="western"><surname>Anderer</surname><given-names>P</given-names> </name><name name-style="western"><surname>Ross</surname><given-names>M</given-names> </name><name name-style="western"><surname>Cerny</surname><given-names>A</given-names> </name><name name-style="western"><surname>Almazan</surname><given-names>TH</given-names> </name><name name-style="western"><surname>Peterson</surname><given-names>B</given-names> </name></person-group><article-title>Detection of nocturnal scratching movements in patients with atopic dermatitis using accelerometers and recurrent neural networks</article-title><source>IEEE J Biomed Health Inform</source><year>2018</year><month>07</month><volume>22</volume><issue>4</issue><fpage>1011</fpage><lpage>1018</lpage><pub-id pub-id-type="doi">10.1109/JBHI.2017.2710798</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Padmanabha</surname><given-names>A</given-names> </name><name name-style="western"><surname>Choudhary</surname><given-names>S</given-names> </name><name name-style="western"><surname>Majidi</surname><given-names>C</given-names> </name><name name-style="western"><surname>Erickson</surname><given-names>Z</given-names> </name></person-group><article-title>A multimodal sensing ring for quantification of scratch intensity</article-title><source>Commun Med</source><year>2023</year><volume>3</volume><issue>1</issue><fpage>115</fpage><pub-id pub-id-type="doi">10.1038/s43856-023-00345-2</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chun</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Kang</surname><given-names>YJ</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>JY</given-names> </name><etal/></person-group><article-title>A skin-conformable wireless sensor to objectively quantify symptoms of pruritus</article-title><source>Sci Adv</source><year>2021</year><month>04</month><volume>7</volume><issue>18</issue><fpage>eabf9405</fpage><pub-id pub-id-type="doi">10.1126/sciadv.abf9405</pub-id><pub-id pub-id-type="medline">33931455</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Chun</surname><given-names>KS</given-names> </name><name name-style="western"><surname>Yu</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Validation of a hand-mounted wearable sensor for scratching movements in adults with atopic dermatitis</article-title><source>J Am Acad Dermatol</source><year>2023</year><month>03</month><volume>88</volume><issue>3</issue><fpage>726</fpage><lpage>729</lpage><pub-id pub-id-type="doi">10.1016/j.jaad.2022.09.032</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ebata</surname><given-names>T</given-names> </name><name name-style="western"><surname>Iwasaki</surname><given-names>S</given-names> </name><name name-style="western"><surname>Kamide</surname><given-names>R</given-names> </name><name name-style="western"><surname>Niimura</surname><given-names>M</given-names> </name></person-group><article-title>Use of a wrist activity monitor for the measurement of nocturnal scratching in patients with atopic dermatitis</article-title><source>Br J Dermatol</source><year>2001</year><month>02</month><volume>144</volume><issue>2</issue><fpage>305</fpage><lpage>309</lpage><pub-id pub-id-type="doi">10.1046/j.1365-2133.2001.04019.x</pub-id><pub-id pub-id-type="medline">11251563</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ikoma</surname><given-names>A</given-names> </name><name name-style="western"><surname>Ebata</surname><given-names>T</given-names> </name><name name-style="western"><surname>Chantalat</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Measurement of nocturnal scratching in patients with pruritus using a smartwatch: initial clinical studies with the itch tracker app</article-title><source>Acta Derm Venereol</source><year>2019</year><month>03</month><day>1</day><volume>99</volume><issue>3</issue><fpage>268</fpage><lpage>273</lpage><pub-id pub-id-type="doi">10.2340/00015555-3105</pub-id><pub-id pub-id-type="medline">30523352</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Smith</surname><given-names>MP</given-names> </name><name name-style="western"><surname>Ly</surname><given-names>K</given-names> </name><name name-style="western"><surname>Thibodeaux</surname><given-names>Q</given-names> </name><etal/></person-group><article-title>Emerging methods to objectively assess pruritus in atopic dermatitis</article-title><source>Dermatol Ther (Heidelb)</source><year>2019</year><month>09</month><day>1</day><volume>9</volume><issue>3</issue><fpage>407</fpage><lpage>420</lpage><pub-id pub-id-type="doi">10.1007/s13555-019-0312-3</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hsu</surname><given-names>CY</given-names> </name><name name-style="western"><surname>Ahuja</surname><given-names>A</given-names> </name><name name-style="western"><surname>Yue</surname><given-names>S</given-names> </name><name name-style="western"><surname>Hristov</surname><given-names>R</given-names> </name><name name-style="western"><surname>Kabelac</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Katabi</surname><given-names>D</given-names> </name></person-group><article-title>Zero-effort in-home sleep and insomnia monitoring using radio signals</article-title><source>Proc ACM Interact Mobile Wearable Ubiquitous Technol</source><year>2017</year><month>09</month><day>11</day><volume>1</volume><issue>3</issue><fpage>1</fpage><lpage>18</lpage><pub-id pub-id-type="doi">10.1145/3130924</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>M</given-names> </name><name name-style="western"><surname>Yue</surname><given-names>S</given-names> </name><name name-style="western"><surname>Katabi</surname><given-names>D</given-names> </name><name name-style="western"><surname>Jaakkola</surname><given-names>TS</given-names> </name><name name-style="western"><surname>Bianchi</surname><given-names>MT</given-names> </name></person-group><article-title>Learning sleep stages from radio signals: a conditional adversarial architecture</article-title><year>2017</year><access-date>2024-08-05</access-date><conf-name>Proceedings of the 34th International Conference on Machine Learning</conf-name><fpage>6205</fpage><lpage>6214</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.mlr.press/v70/zhao17d.html">https://proceedings.mlr.press/v70/zhao17d.html</ext-link></comment></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Tarolli</surname><given-names>CG</given-names> </name><etal/></person-group><article-title>Monitoring gait at home with radio waves in Parkinson&#x2019;s disease: a marker of severity, progression, and medication response</article-title><source>Sci Transl Med</source><year>2022</year><month>09</month><day>21</day><volume>14</volume><issue>663</issue><fpage>eadc9669</fpage><pub-id pub-id-type="doi">10.1126/scitranslmed.adc9669</pub-id><pub-id pub-id-type="medline">36130014</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Benjamin</surname><given-names>K</given-names> </name><name name-style="western"><surname>Waterston</surname><given-names>K</given-names> </name><name name-style="western"><surname>Russell</surname><given-names>M</given-names> </name><name name-style="western"><surname>Schofield</surname><given-names>O</given-names> </name><name name-style="western"><surname>Diffey</surname><given-names>B</given-names> </name><name name-style="western"><surname>Rees</surname><given-names>JL</given-names> </name></person-group><article-title>The development of an objective method for measuring scratch in children with atopic dermatitis suitable for clinical use</article-title><source>J Am Acad Dermatol</source><year>2004</year><month>01</month><volume>50</volume><issue>1</issue><fpage>33</fpage><lpage>40</lpage><pub-id pub-id-type="doi">10.1016/s0190-9622(03)02480-0</pub-id><pub-id pub-id-type="medline">14699362</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>S</given-names> </name></person-group><article-title>455 Correlation between objective measures of sleep and nocturnal scratch in children with atopic dermatitis</article-title><source>J Invest Dermatol</source><year>2021</year><month>05</month><volume>141</volume><issue>5</issue><fpage>S79</fpage><pub-id pub-id-type="doi">10.1016/j.jid.2021.02.478</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Ouroutzoglou</surname><given-names>M</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hellerstein</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Quantifying itch and its impact on sleep using machine learning and radio signals</article-title><source>arXiv</source><comment>Preprint posted online on 2025</comment><pub-id pub-id-type="doi">10.48550/arXiv.2501.04896</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kuznetsova</surname><given-names>A</given-names> </name><name name-style="western"><surname>Brockhoff</surname><given-names>PB</given-names> </name><name name-style="western"><surname>Christensen</surname><given-names>RHB</given-names> </name></person-group><article-title>lmerTest Package: Tests in linear mixed effects models</article-title><source>J Stat Soft</source><year>2017</year><month>12</month><day>6</day><volume>82</volume><issue>13</issue><fpage>1</fpage><lpage>26</lpage><pub-id pub-id-type="doi">10.18637/jss.v082.i13</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>L&#x00FC;decke</surname><given-names>D</given-names> </name><name name-style="western"><surname>Ben-Shachar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Patil</surname><given-names>I</given-names> </name><name name-style="western"><surname>Waggoner</surname><given-names>P</given-names> </name><name name-style="western"><surname>Makowski</surname><given-names>D</given-names> </name></person-group><article-title>Performance: an R package for assessment, comparison and testing of statistical models</article-title><source>J Open Sour Softw</source><year>2021</year><month>Spring</month><volume>6</volume><issue>60</issue><fpage>3139</fpage><pub-id pub-id-type="doi">10.21105/joss.03139</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>McGraw</surname><given-names>KO</given-names> </name><name name-style="western"><surname>Wong</surname><given-names>SP</given-names> </name></person-group><article-title>Forming inferences about some intraclass correlation coefficients</article-title><source>Psychol Methods</source><year>1996</year><volume>1</volume><issue>1</issue><fpage>30</fpage><lpage>46</lpage><pub-id pub-id-type="doi">10.1037/1082-989X.1.1.30</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Koo</surname><given-names>TK</given-names> </name><name name-style="western"><surname>Li</surname><given-names>MY</given-names> </name></person-group><article-title>A guideline of selecting and reporting intraclass correlation coefficients for reliability research</article-title><source>J Chiropr Med</source><year>2016</year><month>06</month><volume>15</volume><issue>2</issue><fpage>155</fpage><lpage>163</lpage><pub-id pub-id-type="doi">10.1016/j.jcm.2016.02.012</pub-id><pub-id pub-id-type="medline">27330520</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alexopoulos</surname><given-names>C</given-names> </name><name name-style="western"><surname>Kassim</surname><given-names>A</given-names> </name><name name-style="western"><surname>Christakis</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>518&#x2014;Interaction of sleep disturbance and nocturnal scratch in atopic dermatitis patients</article-title><source>Br J Dermatol</source><year>2024</year><month>02</month><day>7</day><volume>190</volume><issue>Suppl 2</issue><fpage>ii22</fpage><lpage>ii22</lpage><pub-id pub-id-type="doi">10.1093/bjd/ljad498.025</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="web"><article-title>Clinical trial data transparency</article-title><source>Johnson &#x0026; Johnson Innovative Medicine</source><access-date>2025-07-15</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://innovativemedicine.jnj.com/clinical-trials/transparency">https://innovativemedicine.jnj.com/clinical-trials/transparency</ext-link></comment></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><source>The Yoda Project</source><access-date>2025-07-16</access-date><comment><ext-link ext-link-type="uri" xlink:href="http://yoda.yale.edu">http://yoda.yale.edu</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Participant-level within-night scratch classification performance metrics.</p><media xlink:href="jmir_v27i1e72216_app1.xlsx" xlink:title="XLSX File, 14 KB"/></supplementary-material><supplementary-material id="app2"><label>Multimedia Appendix 2</label><p>Sensitivity, precision, <italic>F</italic><sub>1</sub>-score, and balanced accuracy to detect scratching events on 1-second windows compared to the Reference.</p><media xlink:href="jmir_v27i1e72216_app2.docx" xlink:title="DOCX File, 16 KB"/></supplementary-material><supplementary-material id="app3"><label>Multimedia Appendix 3</label><p>Association of scratch detection performance (<italic>F</italic><sub>1</sub>) with participant-level characteristics.</p><media xlink:href="jmir_v27i1e72216_app3.xlsx" xlink:title="XLSX File, 12 KB"/></supplementary-material></app-group></back></article>