<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Aging</journal-id><journal-id journal-id-type="publisher-id">aging</journal-id><journal-id journal-id-type="index">31</journal-id><journal-title>JMIR Aging</journal-title><abbrev-journal-title>JMIR Aging</abbrev-journal-title><issn pub-type="epub">2561-7605</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e91873</article-id><article-id pub-id-type="doi">10.2196/91873</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Combining Subjective Perceptions and Objective Behavioral Metrics With the Elderly Digital Twin System: Quantitative Usability Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Momand</surname><given-names>Ziaullah</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Mongkolnam</surname><given-names>Pornchai</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Pal</surname><given-names>Debajyoti</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name name-style="western"><surname>Yamsaengsung</surname><given-names>Siam</given-names></name><degrees>PhD</degrees><xref ref-type="aff" 
rid="aff1"/></contrib></contrib-group><aff id="aff1"><institution>School of Information Technology, King Mongkut's University of Technology Thonburi</institution><addr-line>126 Pracha Uthit Rd, Bang Mod, Thung Khru</addr-line><addr-line>Bangkok</addr-line><country>Thailand</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Chau</surname><given-names>Pui Hing</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Mor</surname><given-names>Nachiket</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Zhang</surname><given-names>Xiangmin</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Pornchai Mongkolnam, PhD, School of Information Technology, King Mongkut's University of Technology Thonburi, 126 Pracha Uthit Rd, Bang Mod, Thung Khru, Bangkok, 10140, Thailand, 66 24709892; <email>pornchai@sit.kmutt.ac.th</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>26</day><month>5</month><year>2026</year></pub-date><volume>9</volume><elocation-id>e91873</elocation-id><history><date date-type="received"><day>21</day><month>01</month><year>2026</year></date><date date-type="rev-recd"><day>14</day><month>04</month><year>2026</year></date><date date-type="accepted"><day>18</day><month>04</month><year>2026</year></date></history><copyright-statement>&#x00A9; Ziaullah Momand, Pornchai Mongkolnam, Debajyoti Pal, Siam Yamsaengsung. Originally published in JMIR Aging (<ext-link ext-link-type="uri" xlink:href="https://aging.jmir.org">https://aging.jmir.org</ext-link>), 26.5.2026. 
</copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Aging, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://aging.jmir.org">https://aging.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://aging.jmir.org/2026/1/e91873"/><abstract><sec><title>Background</title><p>The growing aging population has increased the need for technologies that support informal caregivers in home-based older adult care. Digital twin (DT) systems offer promising capabilities; yet, their effectiveness depends on usability, an aspect still insufficiently evaluated among caregivers.</p></sec><sec><title>Objective</title><p>This study aimed to assess the usability of an older adult care DT system using a dual-method evaluation that integrates subjective and objective behavioral performance.</p></sec><sec sec-type="methods"><title>Methods</title><p>Fifty caregivers participated in a usability assessment combining the System Usability Scale (SUS) and detailed system activity log analytics. Log-based measures included task completion, time on task, errors, and abandonment rate. A composite user engagement score was computed and analyzed for correlation and predictive association with SUS ratings. 
Engagement clusters were also explored.</p></sec><sec sec-type="results"><title>Results</title><p>Caregivers reported an excellent mean SUS score of 80.45. System logs showed a 94.08% task completion rate, 2.66% abandonment, and an average task duration of 89.16 seconds. User engagement score demonstrated significant correlations with SUS (<italic>r</italic>=0.626, &#x03C1;=0.552; <italic>P</italic>&#x003C;.001) and significantly predicted usability in regression analysis (<italic>&#x03B2;</italic>=52.94, <italic>R</italic>&#x00B2;=0.392; <italic>P</italic>&#x003C;.001). Engagement-based clustering identified high-, medium-, and low-tier user groups, each exhibiting distinct usability patterns.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>Integrating subjective usability ratings with objective behavioral metrics provides a rigorous and comprehensive approach to evaluating DT systems for older adult care. The findings highlight strong usability of the system and offer actionable insights for refining caregiver support technologies.</p></sec></abstract><kwd-group><kwd>elderly digital twin</kwd><kwd>usability study</kwd><kwd>System Usability Scale</kwd><kwd>user engagement score</kwd><kwd>caregiver support</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background</title><p>The global demographic shift toward an aging population presents unprecedented challenges for health care systems worldwide. The world&#x2019;s population older than 60 years is projected to double from 1.06 billion (13.5%) in 2020 to 2.13 billion in 2050 (22.0%), raising significant concerns about the impact of aging [<xref ref-type="bibr" rid="ref1">1</xref>]. 
This rapid aging process is characterized by an increased prevalence of chronic diseases, complex health care needs, and a growing demand for personalized and proactive health care models [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. In the current technology-driven age, digital twin (DT) has emerged as a transformative approach in health care, offering the potential to revolutionize older adult care through predictive analytics and personalized interventions. DTs are virtual representations of physical entities that enable the dynamic simulation of potential treatment strategies, monitoring and prediction of health trajectories, and early intervention and prevention [<xref ref-type="bibr" rid="ref4">4</xref>]. In the context of older adult health monitoring, DTs create comprehensive virtual models that integrate multimodal data, including clinical records, genetic information, wearable sensor data, and environmental factors, to provide a holistic view of an individual&#x2019;s health status [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>].</p><p>The application of DT technology in older adult care is particularly compelling because of its ability to monitor vital signs, physiological parameters, and other health-related data in real time, enabling health care providers to detect early signs of deterioration or anomalies and proactively intervene in such scenarios [<xref ref-type="bibr" rid="ref6">6</xref>]. Recent implementations have demonstrated the potential of this technology in aging-in-place scenarios, where DTs facilitate continuous health monitoring while preserving the independence and quality of life of seniors [<xref ref-type="bibr" rid="ref7">7</xref>]. 
For example, DT systems have been successfully deployed to monitor older adult patients for fall detection, abnormal posture recognition, and health risk assessment, with validation trials showing promising results in real-world nursing home environments [<xref ref-type="bibr" rid="ref8">8</xref>].</p><p>The complexity of older adult care often necessitates significant involvement from both formal and informal caregivers, who play crucial roles in health monitoring, decision-making, and care coordination. Informal caregivers, predominantly family members, face substantial challenges in navigating complex health care systems and making informed decisions [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>]. Family caregivers&#x2019; decision support interventions have shown promise in improving care outcomes, with studies demonstrating that well-designed decision support tools can reduce family caregivers&#x2019; decision uncertainty and improve satisfaction with the quality of care [<xref ref-type="bibr" rid="ref9">9</xref>]. Such tools leverage trust, cultural humility, strength-based approaches, and effective information sharing to facilitate meaningful conversations between caregivers and health care providers. In the context of DT systems for older adult care, caregiver-facing interfaces have become essential components that must translate complex health data into actionable insights that support informed care&#x2013;related decisions [<xref ref-type="bibr" rid="ref10">10</xref>].</p><p>The success of DT systems in older adult health care depends critically on their usability, particularly in home care settings, where family members are involved in a variety of experiences [<xref ref-type="bibr" rid="ref11">11</xref>]. In health care contexts, poor usability can have serious consequences, including medical errors, reduced adoption rates, and compromised patient safety [<xref ref-type="bibr" rid="ref12">12</xref>]. 
For DT systems targeting older adult populations and their caregivers, usability considerations have become even more critical because of the potential age-related changes in vision, dexterity, and cognitive processing. Older adults often require caregiver mediation when interacting with digital health technologies, and systems must be designed to accommodate both direct older adult users and caregiver interactions [<xref ref-type="bibr" rid="ref13">13</xref>].</p><p>In health care usability research, evaluation has largely relied on subjective self-report instruments, most prominently the System Usability Scale (SUS), which has been applied across diverse digital health systems such as caregiver monitoring tools HELMA [<xref ref-type="bibr" rid="ref14">14</xref>], self-management apps for heart failure (Engage) [<xref ref-type="bibr" rid="ref13">13</xref>], exergame training systems [<xref ref-type="bibr" rid="ref15">15</xref>], and interdisciplinary hospital information platforms such as therapy and monitoring systems [<xref ref-type="bibr" rid="ref16">16</xref>]. While SUS provides standardized benchmarking, its reliance on user perception limits insights into actual system interaction. Studies have attempted to complement the SUS with performance or log data: the HELMA project tracked caregiver login frequency and session duration, the Engage system analyzed task completion and observed errors, and exergame interventions logged exercise scores and reaction accuracy. However, these measures often remain surface-level, focusing on frequency, duration, or clinical outcomes rather than granular task behavior analytics such as navigation sequences, error recovery, feature usage, task completion, time on task, click on task ratio, retry rate, session duration, or task abandonment ratio. 
Moreover, limitations such as older adults&#x2019; reliance on caregiver mediation [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref17">17</xref>] and testing in controlled settings [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>] constrain the validity of existing evaluations. Collectively, these findings underscore a critical gap: while subjective usability assessments dominate and objective measures have been trialed, few health care studies [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>] have integrated log-based behavioral data with standardized questionnaires. To address this gap, our study proposes a dual-method evaluation framework that unites SUS scores with detailed behavioral engagement metrics, providing both perceived and observed dimensions of usability in caregiver-facing DT systems.</p><p>Accordingly, this study conducted a usability evaluation of an elderly digital twin (EDT) system designed to support informal caregivers in home care settings. In our previous work [<xref ref-type="bibr" rid="ref18">18</xref>], we proposed a comprehensive EDT framework to assist caregivers in making informed decisions. To evaluate the feasibility and applicability of the framework, we developed a working EDT system prototype. Unlike prior studies that emphasized technical modeling or data integration, this study explicitly targets the informal caregiver perspective, in which usability is critical for adoption in daily home care. 
Our evaluation follows a dual-method approach with the following two objectives: (1) subjective evaluation of the usability of our proposed EDT system by assessing caregivers&#x2019; perceptions using the hugely popular SUS; (2) objective evaluation of usability by proposing a novel behavioral engagement metric that can be used in conjunction with the SUS.</p><p>We present a dual-method usability evaluation framework that combines log-based behavioral analytics (objective measurement) with a standardized SUS questionnaire (subjective measurement) [<xref ref-type="bibr" rid="ref19">19</xref>]. This approach leverages the complementary strengths of objective behavioral data and subjective user feedback to provide a comprehensive view of the system&#x2019;s usability. The log-based component captures detailed user behavior, including interaction patterns, feature usage, task completion pathways, error rates, and temporal usage characteristics. These metrics offer insights into real-world usage that may not be revealed through self-reported measures alone. In parallel, the SUS component provides standardized usability scores that enable benchmarking against established norms in health care applications and allow comparisons with other digital health interventions.</p><p>This dual-method approach directly addresses a noticeable gap in existing evaluation practices: the dominance of subjective methods with limited or superficial use of objective interaction data. Previous health care systems&#x2019; usability studies often relied on the SUS or combined it with a basic usage log [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref17">17</xref>], which failed to capture how systems are actually navigated and used in real practice. 
By integrating behavioral engagement metrics with subjective user perceptions, our study provides an evidence-based, user-centered, and replicable framework for evaluating digital health applications. Applied specifically to caregiver-facing interfaces for DTs of older adults, this methodology not only fills the gap but also offers actionable insights to guide iterative design and ensure more effective, caregiver-friendly digital health systems. The remainder of this manuscript is organized as follows: Section 2 reviews related work, Section 3 outlines the methods, Section 4 presents the results, Section 5 offers a discussion, and Section 6 concludes the study.</p></sec><sec id="s1-2"><title>Related Work</title><p>The growing complexity of older adult care has driven the development of digital health technologies, including DT systems, to support clinical decision-making and informal caregivers. As these systems advance, ensuring their usability, particularly for nonprofessional caregivers, is critical for adoption and effectiveness. Previous studies have evaluated digital health technologies using subjective measures, such as the SUS or qualitative interviews. This section reviews usability studies and highlights the methodological gap addressed by our dual-method approach.</p></sec><sec id="s1-3"><title>Usability Evaluation Methods: Subjective Versus Objective</title><p>Usability evaluation methods fall into 2 primary categories: subjective and objective. Each category offers unique advantages and faces distinct limitations, making the choice between them or their combination critical for comprehensive usability assessment. SUS remains the most widely adopted usability instrument, valued for its brevity, reliability, and extensive benchmarking data [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Recent validation studies have reinforced the psychometric properties of the SUS. 
A validation study of voice user interfaces confirmed SUS&#x2019;s usefulness across different interaction modalities. Additionally, researchers have developed item-level benchmarks for the SUS, allowing practitioners to interpret individual items when specific usability attributes require targeted assessment. These benchmarks enable a more granular evaluation while maintaining the scale&#x2019;s standardized scoring advantage [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref22">22</xref>].</p><p>In addition to the SUS, several other standardized questionnaires serve specific evaluation contexts. The usability metric for user experience (UMUX) and its shortened variant, UMUX-LITE, offer alternatives that are more closely aligned with the ISO (International Organization for Standardization) 9241 definitions of usability. Recent psychometric evaluations suggest that the UMUX-LITER provides the closest correspondence to SUS scores when converted to comparable scales [<xref ref-type="bibr" rid="ref23">23</xref>]. The NASA-TLX (National Aeronautics and Space Administration&#x2013;Task Load Index) addresses perceived workload in complex, high-consequence environments, making it particularly valuable for health care, aerospace, and military applications. However, its complexity and administration time limit its usefulness for consumer product evaluations [<xref ref-type="bibr" rid="ref24">24</xref>]. AttrakDiff occupies a unique position by measuring both the pragmatic and hedonic quality dimensions of the user experience. 
This dual focus allows for the evaluation of traditional usability metrics alongside emotional and aesthetic responses, although recent studies have raised concerns about translation reliability and cultural adaptation [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>Subjective methods are easy to administer, resource-efficient, and standardized, enabling benchmark comparisons and effective communication among practitioners [<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. However, subjective measures have significant limitations. Social desirability bias is a primary concern, with users potentially providing responses they believe evaluators want to hear rather than their genuine perceptions. Cultural factors also influence responses, with different populations interpreting and rating items differently. Moreover, subjective measures capture perceptions rather than actual performance, potentially missing critical usability issues that users may not consciously recognize [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>,<xref ref-type="bibr" rid="ref28">28</xref>].</p><p>Objective evaluation centers on measurable performance indicators, such as task completion, time on task, and error analysis, which together provide insights into system effectiveness and efficiency [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref31">31</xref>]. Error analysis offers detailed insights into the usability problems. Error rates can be calculated globally (total errors divided by total attempts) and task-specific (errors per task opportunity), providing different perspectives on system performance. 
Modern approaches distinguish between error types and severity levels, enabling targeted improvements [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref31">31</xref>].</p><p>Clickstream analysis is a core component of behavioral log methods and has emerged as a powerful objective approach for tracking user navigation patterns, feature usage, and drop-off points. By capturing the sequence of interactions, it highlights problems that are invisible to traditional subjective metrics [<xref ref-type="bibr" rid="ref32">32</xref>-<xref ref-type="bibr" rid="ref34">34</xref>]. Advanced behavioral analytics extend this further by combining multiple interaction types, such as clicks, mouse movements, and page transitions, to generate comprehensive user journey maps. These methods are particularly valuable for detecting navigation bottlenecks and optimizing conversion paths in digital systems.</p><p>Objective methods generally provide concrete evidence for design decisions by revealing fine-grained interaction patterns that users may not consciously recognize or accurately report [<xref ref-type="bibr" rid="ref35">35</xref>,<xref ref-type="bibr" rid="ref36">36</xref>]. However, they also face implementation challenges: data collection and analysis can be complex and resource-intensive, and these methods may not directly capture user satisfaction or emotional responses, requiring supplementary subjective measures. Moreover, standardized interpretation frameworks for many objective metrics remain underdeveloped, complicating cross-study comparisons [<xref ref-type="bibr" rid="ref26">26</xref>]. Recent health care usability studies have demonstrated effective hybrid implementation [<xref ref-type="bibr" rid="ref37">37</xref>] and described a hybrid approach that satisfies both pragmatic development needs and academic research requirements. 
Their framework captures detailed behavioral data for intermediate iterations while enabling deeper qualitative analysis for academic dissemination. Contemporary usability evaluation is shifting toward integrated approaches that combine machine learning with behavioral and subjective data analysis. Advanced statistical methods improve the correlation between objective performance and user satisfaction [<xref ref-type="bibr" rid="ref38">38</xref>]. Recognizing that no single method offers a complete picture, the field increasingly adopts multimethod strategies that balance methodological strengths and limitations while maintaining practical feasibility [<xref ref-type="bibr" rid="ref37">37</xref>].</p></sec><sec id="s1-4"><title>Clinical Relevance of Fitbit Sense 2 Data</title><p>Consumer wearables are increasingly used in digital health because they enable continuous, low-burden physiological monitoring outside clinical settings. Their clinical relevance, however, is parameter-specific rather than uniform. A systematic review of Fitbit devices found the strongest evidence for step counting under selected conditions, whereas energy expenditure, sleep, and some other measures showed less consistent accuracy and should be interpreted cautiously in health-related decision contexts [<xref ref-type="bibr" rid="ref39">39</xref>]. A later meta-analysis of wrist-worn Fitbit sleep models reported that newer sleep-staging devices performed better than earlier motion-only models but still were not substitutes for polysomnography [<xref ref-type="bibr" rid="ref40">40</xref>]. 
Because this study used Fitbit Sense 2, newer-generation evidence is also relevant: a prospective multicenter validation study of 11 consumer sleep trackers found that Fitbit Sense 2 showed moderate agreement with polysomnography for sleep-stage classification and competitive performance among wearables, including relatively strong performance in deep-stage detection [<xref ref-type="bibr" rid="ref41">41</xref>].</p><p>Taken together, these findings support a measured role for Fitbit Sense 2 in caregiver-facing systems. Recent free-living validation of a newer Fitbit device against medical-grade references showed moderate to good agreement for daily steps, resting heart rate, respiratory rate, and some heart rate variability (HRV) measures but weaker agreement for oxygen saturation, indicating that some physiological channels are more dependable than others [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref41">41</xref>,<xref ref-type="bibr" rid="ref42">42</xref>]. Accordingly, Fitbit Sense 2 data in the EDT are best viewed as supporting longitudinal trend monitoring, anomaly awareness, and caregiver-oriented decision support rather than diagnostic inference.</p></sec><sec id="s1-5"><title>Current Usability Evaluation Methods for Health Care Systems</title><p>As shown in <xref ref-type="table" rid="table1">Table 1</xref>, prior usability studies of digital health systems have relied on subjective methods, particularly the SUS, interviews, and qualitative feedback [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref48">48</xref>]. 
Only a few studies incorporated partial task-based or observational measures, and these were typically limited and not derived from detailed real-time interaction logs [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref45">45</xref>]. Moreover, studies focused on patients, older adults, or clinical professionals in institutional settings rather than informal caregivers in home-based care [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref44">44</xref>-<xref ref-type="bibr" rid="ref48">48</xref>]. Synthesizing these studies reveals three major gaps: (1) heavy reliance on subjective measures without integrating detailed objective interaction logs, (2) limited focus on informal caregivers in home settings, and (3) superficial assessment of task behavior, where satisfaction or completion was reported but navigation patterns, retries, and feature usage were not captured. 
To address these gaps, this study integrates subjective usability perceptions (SUS) with objective system usage data (user activity logs), providing a more ecologically valid and holistic framework for evaluating caregiver-facing DT systems for older adults.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Comparison of usability methods, target groups, and system features across related studies.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Target users</td><td align="left" valign="bottom">Method</td><td align="left" valign="bottom">SUS<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="bottom">Log</td><td align="left" valign="bottom">Setting</td><td align="left" valign="bottom">Focus</td><td align="left" valign="bottom">Behavioral metrics</td><td align="left" valign="bottom">References</td></tr></thead><tbody><tr><td align="left" valign="top">Informal caregivers</td><td align="left" valign="top">SUS, interview</td><td align="left" valign="top">No</td><td align="left" valign="top">No</td><td align="left" valign="top">Home</td><td align="left" valign="top">Stroke support</td><td align="left" valign="top">No</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref43">43</xref>]</td></tr><tr><td align="left" valign="top">Older adults + Caregivers</td><td align="left" valign="top">SUS, interview</td><td align="char" char="." valign="top">72.2</td><td align="left" valign="top">Partial</td><td align="left" valign="top">Home</td><td align="left" valign="top">Cognitive monitoring</td><td align="left" valign="top">Partial</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref14">14</xref>]</td></tr><tr><td align="left" valign="top">Older adults + Caregivers</td><td align="left" valign="top">SUS, NASA-TLX</td><td align="char" char="." 
valign="top">82.6</td><td align="left" valign="top">No</td><td align="left" valign="top">Home +<break/>Clinical</td><td align="left" valign="top">Heart Failure</td><td align="left" valign="top">Partial (observed)</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref13">13</xref>]</td></tr><tr><td align="left" valign="top">Older adults</td><td align="left" valign="top">SUS, acceptability score</td><td align="char" char="." valign="top">59.7</td><td align="left" valign="top">No</td><td align="left" valign="top">Clinical</td><td align="left" valign="top">Gait monitoring</td><td align="left" valign="top">No</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref17">17</xref>]</td></tr><tr><td align="left" valign="top">Older adults</td><td align="left" valign="top">SUS, feedback</td><td align="char" char="." valign="top">58.3</td><td align="left" valign="top">No</td><td align="left" valign="top">Lab +<break/>Clinical</td><td align="left" valign="top">Fall prevention</td><td align="left" valign="top">No</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref15">15</xref>]</td></tr><tr><td align="left" valign="top">Patients</td><td align="left" valign="top">SUS</td><td align="char" char="." valign="top">87.5</td><td align="left" valign="top">No</td><td align="left" valign="top">Clinical</td><td align="left" valign="top">Symptom tracking</td><td align="left" valign="top">No</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref45">45</xref>]</td></tr><tr><td align="left" valign="top">Health care<break/>professional</td><td align="left" valign="top">SUS</td><td align="char" char="." valign="top">69.2</td><td align="left" valign="top">No</td><td align="left" valign="top">Geriatric wards</td><td align="left" valign="top">Health monitoring</td><td align="left" valign="top">No</td><td align="char" char="." 
valign="top">[<xref ref-type="bibr" rid="ref16">16</xref>]</td></tr><tr><td align="left" valign="top">Older adults</td><td align="left" valign="top">SUS + Interview</td><td align="char" char="." valign="top">78.8</td><td align="left" valign="top">No</td><td align="left" valign="top">Home</td><td align="left" valign="top">Home care platform</td><td align="left" valign="top">No</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref46">46</xref>]</td></tr><tr><td align="left" valign="top">Patients +<break/>Clinicians</td><td align="left" valign="top">SUS + Feedback</td><td align="char" char="." valign="top">86.8</td><td align="left" valign="top">No</td><td align="left" valign="top">Clinical</td><td align="left" valign="top">Trial data capture</td><td align="left" valign="top">No</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref48">48</xref>]</td></tr><tr><td align="left" valign="top">Emergency staff</td><td align="left" valign="top">SUS + Interview</td><td align="char" char="." valign="top">53.1</td><td align="left" valign="top">No</td><td align="left" valign="top">Clinical</td><td align="left" valign="top">Clinical information management</td><td align="left" valign="top">No</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref47">47</xref>]</td></tr><tr><td align="left" valign="top">Our study (informal caregivers)</td><td align="left" valign="top">SUS + System usage logs</td><td align="char" char="." 
valign="top">80.45</td><td align="left" valign="top">Activity logs</td><td align="left" valign="top">Home</td><td align="left" valign="top">Decision support in older adult care</td><td align="left" valign="top">Task metrics, user engagement score</td><td align="left" valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>SUS: System Usability Scale.</p></fn><fn id="table1fn2"><p><sup>b</sup>Not applicable.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>This study evaluated the usability of the EDT system for supporting informal caregivers in home-based care. To provide a comprehensive assessment of user interaction, both subjective and objective measures were integrated. The following sections describe the study design, system features, participant recruitment, testing procedures, and analytical methods used to assess usability.</p></sec><sec id="s2-2"><title>Overall System Flow</title><p>We used a cross-sectional observational design to evaluate the usability of the caregiver-facing EDT prototype. <xref ref-type="fig" rid="figure1">Figure 1</xref> illustrates the system architecture and data flow during the usability sessions. Older adult participants wore a Fitbit smartwatch to collect physiological data, including heart rate, sleep, and activity measures. These data were transmitted to the cloud for secure transfer and preprocessing and then processed and stored by the back end for analysis and insight generation. Caregivers accessed the EDT system through computers, tablets, iPads, or smartphones, where they viewed real-time and historical health information, including digital biomarkers and artificial intelligence (AI)&#x2013;generated recommendations. 
During the sessions, informal caregivers completed representative tasks such as exploring dashboards, reviewing AI-based recommendations, and navigating system features. User interactions were recorded through back-end logs, and caregiver feedback was collected using a questionnaire. Sample user interfaces of the system are presented in <xref ref-type="fig" rid="figure2">Figure 2</xref> for cardiac DT and <xref ref-type="fig" rid="figure3">Figure 3</xref> for sleep stage monitoring, while detailed system feature interfaces are provided in the <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Illustration of the system usability session setup, showing data flow from a home-based older adult to a digital twin platform accessed by an informal caregiver.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig01.png"/></fig><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Cardiac Digital Twin model user interface.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Sleep stages analysis user interface.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig03.png"/></fig></sec><sec id="s2-3"><title>System Features</title><p>The EDT system evaluated in this study was designed to provide informal caregivers with real-time, personalized insights into the health status of older adults in their homes. 
The system follows a modular architecture with 5 core components: data sources, data curation pipeline, data integration and storage, models and insight generation, and user interaction, with a dedicated security and privacy layer and a dynamic feedback loop between the user and intelligent models, as shown in <xref ref-type="fig" rid="figure4">Figure 4</xref>.</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>High-level architecture of the elderly digital twin system. AI: artificial intelligence; LLM: large language model; ML: machine learning.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig04.png"/></fig></sec><sec id="s2-4"><title>Data Sources</title><p>The system captures multimodal physiological data using a Fitbit smartwatch worn by older adults. These signals include heart rate, respiratory data, sleep log data, blood oxygen saturation (SpO<sub>2</sub>), and physical activity.</p></sec><sec id="s2-5"><title>Data Curation Pipeline</title><p>Incoming sensor data are streamed into an automated preprocessing module that handles data cleaning, synchronization, and consolidation across modalities. A dedicated stream processing engine prepares the data for integration and downstream analysis in real time. This stage ensures quality and consistency before the data are forwarded through an orchestrated pipeline.</p></sec><sec id="s2-6"><title>Data Integration and Storage</title><p>The processed data are stored centrally in a PostgreSQL database. This layer supports structured data storage and efficient querying for both real-time and retrospective analyses. 
Integration mechanisms ensure temporal alignment of physiological signals for model consumption.</p></sec><sec id="s2-7"><title>Models and Insights Generation</title><p>The EDT system comprises 2 main components: a Cardiac Digital Twin and a Sleep Monitoring Digital Twin, which monitor physiological signals and generate insights for caregivers. The EDT prototype was evaluated as a caregiver-oriented decision support research system rather than as a diagnostic tool, and the sensing device used in this study, Fitbit Sense 2, is not a Food and Drug Administration&#x2013;approved device for clinical use. The Cardiac Digital Twin tracks heart health in older adults through real-time heart rate monitoring, trend visualization, and HRV analysis. A 3D cardiac model simulates a beating heart with animation driven by current beats per minute. For continuous monitoring during data loss, a bidirectional long short-term memory (Bi-LSTM) model predicts beats per minute at 5-minute intervals. Bi-LSTM was selected because of its ability to capture temporal dependencies and improve physiological prediction accuracy. When activated, the system notifies the caregivers that synthetic predictions are being used. The Bi-LSTM model was trained on 579,486 heart rate records, achieving a mean squared error of 0.2944 and a mean absolute error of 0.3410. The reported model performance metrics are presented to characterize the technical behavior of the prototype components and should not be interpreted as evidence of clinical-grade validity.</p><p>The Sleep Monitoring Digital Twin processes multisensory physiological data to monitor sleep behavior. It analyzes patterns across sleep stages, including light, deep, rapid eye movement, and awake, and visualizes trends to support long-term observation. The system computes sleep quality metrics, such as efficiency, latency, and awakenings, using probabilistic models to map the stage transitions. 
These outputs enable the detection of sleep disruptions and behavioral anomalies linked to health decline in the older adult population. A long short-term memory model was developed to infer sleep stages from SpO<sub>2</sub> and heart rate data, chosen for its memory structure suitable for temporal dependencies in physiological time series. The model achieved 92% validation accuracy on 9125 sequences, maintaining sleep-tracking continuity. In this study, however, the sleep-monitoring model was included to enable the functional operation of the caregiver-facing EDT interface and was evaluated as part of the overall usability workflow rather than as a stand-alone clinically validated diagnostic model. A submodule monitored SpO<sub>2</sub> levels to detect hypoxemia, triggering alerts and large language model (LLM) feedback when oxygen saturation fell below the critical threshold. The LLM outputs are intended to support caregiver awareness and follow-up, rather than provide medical diagnosis or treatment advice.</p><p>To enhance real-time interpretability and caregiver empowerment, both DT models were supported by a GPT-4o LLM adapted to the caregiving domain through instruction-based fine-tuning. This LLM module delivers context-aware personalized feedback by interpreting physiological indicators, including abnormal heart rate patterns, HRV, disrupted sleep trends, sleep efficiency, latency, awakenings, and hypoxemia through SpO<sub>2</sub> monitoring. When the system detects anomalies such as elevated heart rate, low HRV indicating stress, oxygen saturation below thresholds, or deviations from sleep benchmarks, it triggers the LLM to generate clear, caregiver-facing recommendations. These responses are personalized based on recent health trends and are presented in understandable language. The LLM summarizes patterns and provides decision support recommendations for caregiver actions such as monitoring hydration or seeking clinical evaluation. 
This fine-tuned GPT-4o model translates complex sensor data into actionable guidance, strengthens decision support capabilities, and fosters informed caregiving responses.</p><p>In our previous study, the caregiver-facing recommendations were subjected to a structured evaluation by medical experts across the dimensions of clinical appropriateness, usefulness, safety, and alignment with clinical guidelines, with overall positive ratings and substantial interrater agreement, supporting their use as decision support guidance in the present system [<xref ref-type="bibr" rid="ref18">18</xref>]. To reduce hallucinations, the GPT-4o model was adapted to the caregiving domain using instruction-based fine-tuning and grounded in structured physiological indicators from the EDT. The model was activated only when anomalies or threshold deviations were detected. The decision support recommendation generation was constrained through restricted prompting and limited output scope. Its outputs were designed as caregiver-friendly guidance and human-readable summaries of observed sensor patterns rather than as diagnosis or treatment advice. The system also used escalation language, such as advising clinical evaluation for concerning cases.</p></sec><sec id="s2-8"><title>User Interaction</title><p>The system provides a web-based interface for informal caregivers that is accessible through desktops, smartphones, and tablets. The dashboard enables navigation across modules such as heart rate trends, sleep analysis, SpO<sub>2</sub> monitoring, and alerts. The alert section presents LLM-generated alert messages and recommendations when abnormal physiological patterns or threshold violations are detected. Visualizations use color-coded indicators and summaries to reduce cognitive load. The GPT-4o chatbot further generates natural language feedback and recommendations based on health data and caregiver queries. 
Caregivers can review alerts, add notes, and interact with the system across devices, thus ensuring flexible and informed older adult care support.</p></sec><sec id="s2-9"><title>Feedback Loop for Adaptive Learning</title><p>The architecture incorporates a dynamic feedback loop based on caregiver responses and system logs. These feedback signals are used to retrain the detection thresholds, improve alert relevance, and fine-tune the language model for more accurate and useful recommendations.</p></sec><sec id="s2-10"><title>Security and Privacy</title><p>A dedicated privacy layer ensures compliance with data protection standards. It includes data encryption, access control mechanisms, and data anonymization to protect sensitive health data and support the deployment of ethical systems.</p></sec><sec id="s2-11"><title>Participant Recruitment</title><p>This study included 2 groups of participants: older adults and their informal caregivers. Six older adult participants were recruited to generate real-world physiological data for the validation of the monitoring function of the system. These individuals, aged 60&#x2010;85 years, were Thai nationals residing in home care environments and were cognitively and physically capable of using a Fitbit Sense 2 device. Patients with stable chronic health conditions were included in the study, while those with known skin sensitivities, cognitive impairments, or conditions interfering with the use of wearable devices were excluded.</p><p>Fifty informal caregivers were recruited for the usability evaluation using a purposive sampling strategy to ensure the representation of individuals actively engaged in home-based older adult care. <xref ref-type="table" rid="table2">Table 2</xref> summarizes the demographic characteristics of the informal caregiver participants. Eligible caregivers were adults aged 18&#x2010;55 years with at least 3 months&#x2019; caregiving experience. 
To support meaningful interaction with the system, participants were required to demonstrate basic digital literacy (eg, prior use of smartphones or web apps) and the ability to navigate English-language interfaces. Screening interviews confirmed these criteria prior to enrollment. For better recruitment and participant comfort, all initial communications and consent discussions were conducted in the local Thai language with caregivers and older adult individuals. A local Thai assistant was engaged to explain the study procedure and provide step-by-step system guidance in Thai, ensuring clarity and inclusivity during the sessions. Caregivers received a stipend of 100 Thai Baht (average THB to US dollar exchange rate in July 2025: THB 1=US $0.03082; THB 100=US $3.082) to acknowledge their time and contribution. The Fitbit Sense 2 smartwatch used in this study was separately provided by the research team to all older adult participants.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Demographic characteristics of informal caregiver participants.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristic</td><td align="left" valign="bottom">Caregivers (n=50)</td></tr></thead><tbody><tr><td align="left" valign="top">Age (years), mean (SD)</td><td align="left" valign="top">35.6 (7.6)</td></tr><tr><td align="left" valign="top">Age (years), range</td><td align="left" valign="top">18&#x2010;55</td></tr><tr><td align="left" valign="top">Age (years), group distribution, n (%)</td><td align="left" valign="top"/></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>18&#x2010;25</td><td align="char" char="." valign="top">3 (6)</td></tr><tr><td align="char" char="." 
valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>26&#x2010;35</td><td align="left" valign="top">25 (50)</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>36&#x2010;45</td><td align="left" valign="top">15 (30)</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>46&#x2010;50</td><td align="left" valign="top">6 (12)</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>51&#x2010;55</td><td align="left" valign="top">1 (2)</td></tr><tr><td align="left" valign="top">Sex, n (%)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Male</td><td align="char" char="." valign="top">21 (42)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Female</td><td align="left" valign="top">29 (58)</td></tr><tr><td align="left" valign="top">Caregiving experience (years), n (%)</td><td align="left" valign="top"/></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;1</td><td align="char" char="." valign="top">11 (22)</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1&#x2010;3</td><td align="left" valign="top">21 (42)</td></tr><tr><td align="char" char="." valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4&#x2010;6</td><td align="left" valign="top">12 (24)</td></tr><tr><td align="char" char="." 
valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;6</td><td align="left" valign="top">6 (12)</td></tr></tbody></table></table-wrap></sec><sec id="s2-12"><title>Ethical Considerations</title><p>The study protocol was reviewed and approved by the institutional review board of King Mongkut&#x2019;s University of Technology Thonburi under reference number KMUTT-IRB-COA-2025&#x2010;048 on July 7, 2025. Written informed consent was obtained from all participants prior to data collection. Specifically, informed consent was secured from both the older adult participants and their informal caregivers before their involvement in the study. Caregiver participants received a small stipend of THB 100, equivalent to approximately US $3.08, as compensation for their time. This compensation was not linked to task performance, usability ratings, or study outcomes and was not considered coercive. All collected data were deidentified prior to analysis, and participant confidentiality was maintained throughout the study.</p></sec><sec id="s2-13"><title>Usability Evaluation Framework</title><p>This study used a dual-method usability evaluation framework designed to capture subjective perceptions and objective behavioral interactions with the EDT system. The framework, illustrated in <xref ref-type="fig" rid="figure5">Figure 5</xref>, consists of 3 key components: participant roles, system interaction, and evaluation methods, integrated through a feedback-driven design loop. Two participant groups were involved: older adults who contributed real-time physiological data using a Fitbit Sense 2 smartwatch, and informal caregivers who interacted with the system to evaluate its usability. Usability was assessed using both subjective and objective methods. Subjectively, SUS was used to collect caregiver-reported feedback on ease of use, satisfaction, and overall system experience. 
Objectively, the activity log data captured granular interaction behaviors, including task completion rates, click paths, session duration, error rates, drop-off points, and module usage frequency. These 2 data streams were then fused to generate comprehensive usability insights. This fusion enabled us to assess both how users perceived the system and how they interacted with it.</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Usability evaluation framework for the elderly digital twin system. The framework integrates subjective (System Usability Scale) and objective (log-based) evaluation methods to assess system usability and inform design improvements. AI: artificial intelligence.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig05.png"/></fig></sec><sec id="s2-14"><title>Data Collection</title><p>Data collection was conducted over an 8-week period (July 7 to August 31, 2025) and involved 2 participant groups: older adults and informal caregivers. The older adult participants wore the Fitbit Sense 2 smartwatch in their home environments to generate real-time physiological data, including heart rate, respiratory rate, SpO<sub>2</sub>, sleep logs, and physical activity. Before commencing data collection, all older adult participants completed a brief health and comfort assessment to confirm their suitability for using a smartwatch. The survey gathered basic demographic information and screened for potential risks, such as allergies, history of skin irritation, relevant medical conditions, or wrist swelling, which could affect comfort or safety. Participants with contraindications were excluded. The results of the health and comfort screening are summarized in <xref ref-type="table" rid="table3">Table 3</xref>. 
This prescreening step ensured that the smartwatch could be used safely and comfortably during subsequent data collection.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Health and comfort screening outcomes for older adult participants.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Screening item</td><td align="left" valign="bottom">Yes/No, n (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Allergy to smartwatch materials (silicone, metal, and adhesives)</td><td align="left" valign="top">0 (0)/6 (100)</td></tr><tr><td align="left" valign="top">History of skin irritation from wristband/watches/jewelry</td><td align="left" valign="top">0 (0)/6 (100)</td></tr><tr><td align="left" valign="top">Skin/medical conditions affecting smartwatch use</td><td align="left" valign="top">0 (0)/6 (100)</td></tr><tr><td align="left" valign="top">Swelling in wrist/hands</td><td align="left" valign="top">0 (0)/6 (100)</td></tr><tr><td align="left" valign="top">Physical activity</td><td align="left" valign="top">Daily: 3 (50), occasionally: 1 (16.7), and rarely: 2 (33.3)</td></tr></tbody></table></table-wrap><p>The data were streamed to the system back end to validate the predictive analytics and monitoring capabilities of the EDT models under real-life conditions. Informal caregivers evaluated the system usability through guided interaction sessions using their smartphones, tablets, or computers. Each caregiver used the EDT system for 4 consecutive days, engaging with it for 20&#x2010;30 minutes daily. The SUS questionnaire was administered after the fourth day to capture the caregivers&#x2019; consolidated perception of usability after repeated interactions. This approach balanced ecological validity with participant burden: 4 days ensured sufficient system interaction while remaining feasible for busy caregivers. 
We also captured users&#x2019; behavioral data through system-generated activity logs, which were passively recorded through automatic instrumentation. The system obtained informed consent prior to log data collection, disclosing that no personally identifiable information was recorded. All logged data were anonymized and stored per institutional guidelines.</p><p>A total of 24 system tasks were predefined for the log data collection phase. These tasks were systematically constructed from the core functional modules of the EDT prototype, including heart monitoring, sleep tracking, SpO<sub>2</sub> assessment, AI-driven health advice, and the AI chatbot assistant. The task set was designed to ensure structured coverage of the system&#x2019;s principal functions during usability testing, so that all key user interactions could be consistently captured in the log analysis. Thus, the tasks were intended primarily to exercise the major features of the prototype rather than to directly reproduce naturally occurring caregiving workflows derived from interviews, observational studies, or clinical workflow analysis. 
Each task represented a meaningful user interaction within the prototype (eg, viewing 24-hour heart rate trends or checking sleep stage analysis), and each was assigned a unique code for consistent identification in the analysis, as detailed in <xref ref-type="table" rid="table4">Table 4</xref>.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>System tasks and associated codes used for feature usage analysis during the user activity log data collection.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model and task</td><td align="left" valign="bottom">Logged behavior</td><td align="left" valign="bottom">End role</td><td align="left" valign="bottom">Associated objective metrics</td></tr></thead><tbody><tr><td align="left" valign="top" colspan="4">Cardiac Digital Twin</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> insights for real-time heart rate</td><td align="left" valign="top">Click on AI insights</td><td align="left" valign="top">AI output shown</td><td align="left" valign="top">TC<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup>, ToT<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup>, FU<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Observe real-time heart rate dashboard</td><td align="left" valign="top">Open live HR<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup> screen</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, ToT, RR<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup>, NF<sup><xref ref-type="table-fn" rid="table4fn7">g</xref></sup>, FU</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View 24-hour heart rate history</td><td align="left" valign="top">Open 24-hour chart</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, ToT, NF, TAR<sup><xref ref-type="table-fn" rid="table4fn8">h</xref></sup>, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View 7-day heart rate trends</td><td align="left" valign="top">Open 7-day HR trends</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, ToT, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View 24-hour heart rate summary</td><td align="left" valign="top">Open HR summary panel</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, ToT, TAR, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Observe heart rate variability dashboard</td><td align="left" valign="top">Open HRV<sup><xref ref-type="table-fn" rid="table4fn9">i</xref></sup> panel</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, RR, ToT, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI insights on heart rate variability</td><td align="left" valign="top">Click AI for HRV</td><td align="left" valign="top">AI output shown</td><td align="left" valign="top">TC, FU, CTR<sup><xref ref-type="table-fn" rid="table4fn10">j</xref></sup></td></tr><tr><td align="left" valign="top" colspan="4">Sleep Monitoring Digital Twin</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View last night&#x2019;s sleep quality</td><td align="left" 
valign="top">Open sleep summary</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, NF, TAR, ToT</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI advice for abnormal deep sleep</td><td align="left" valign="top">Click AI for deep sleep</td><td align="left" valign="top">AI output shown</td><td align="left" valign="top">TC, FU, CTR, ToT</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI advice for low light sleep</td><td align="left" valign="top">Click AI for light sleep</td><td align="left" valign="top">AI output shown</td><td align="left" valign="top">TC, FU, CTR, ToT</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI advice for REM<sup><xref ref-type="table-fn" rid="table4fn11">k</xref></sup> sleep levels</td><td align="left" valign="top">Click AI for REM sleep</td><td align="left" valign="top">AI output shown</td><td align="left" valign="top">TC, FU, CTR, ToT</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View sleep metrics dashboard</td><td align="left" valign="top">Open sleep metrics</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, ToT, TAR</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View sleep stage timeline</td><td align="left" valign="top">Open stage timeline</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, NF, CTR, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View sleep benchmark reference</td><td align="left" valign="top">Open 
benchmark panel</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, NF, TAR</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Review sleep benchmark interpretation</td><td align="left" valign="top">Open benchmark explanation</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, ToT, RR, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI advice on sleep benchmark</td><td align="left" valign="top">Click AI for benchmark</td><td align="left" valign="top">AI output shown</td><td align="left" valign="top">TC, session duration, TAR, FU, ToT, CTR</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Open and generate sleep trend report</td><td align="left" valign="top">Open/generate report</td><td align="left" valign="top">Report shown</td><td align="left" valign="top">TC, session duration, TAR, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View weekly sleep log</td><td align="left" valign="top">Open weekly sleep log</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, NF, TAR, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View sleep fragmentation and stage transitions</td><td align="left" valign="top">Open fragmentation view</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, NF, ToT, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI advice on sleep fragmentation</td><td align="left" valign="top">Click AI for fragmentation</td><td 
align="left" valign="top">AI output shown</td><td align="left" valign="top">TC, FU, session duration, ToT</td></tr><tr><td align="left" valign="top" colspan="4">SpO<sub>2</sub> Monitoring</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>View SpO<sub>2</sub> analysis dashboard</td><td align="left" valign="top">Open SpO<sub>2</sub> analysis</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, ToT, NF, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Observe real-time SpO<sub>2</sub> for hypoxemia monitoring</td><td align="left" valign="top">Open live SpO<sub>2</sub> screen</td><td align="left" valign="top">Exit/switch page</td><td align="left" valign="top">TC, RR, TAR, FU</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Request AI advice on SpO<sub>2</sub> abnormalities</td><td align="left" valign="top">Click AI for SpO<sub>2</sub></td><td align="left" valign="top">AI output shown</td><td align="left" valign="top">TC, FU, CTR, ToT</td></tr><tr><td align="left" valign="top" colspan="4">AI Assistant</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Submit query to AI health chatbot</td><td align="left" valign="top">Enter/send prompt</td><td align="left" valign="top">Response shown</td><td align="left" valign="top">TC, session duration, RR, CTR, TAR, FU</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>AI: artificial intelligence.</p></fn><fn id="table4fn2"><p><sup>b</sup>TC: task completion. 
</p></fn><fn id="table4fn3"><p><sup>c</sup>ToT: time on task.</p></fn><fn id="table4fn4"><p><sup>d</sup>FU: feature usage.</p></fn><fn id="table4fn5"><p><sup>e</sup>HR: heart rate.</p></fn><fn id="table4fn6"><p><sup>f</sup>RR: retry rate.</p></fn><fn id="table4fn7"><p><sup>g</sup>NF: navigation frequency.</p></fn><fn id="table4fn8"><p><sup>h</sup>TAR: task abandonment rate.</p></fn><fn id="table4fn9"><p><sup>i</sup>HRV: heart rate variability.</p></fn><fn id="table4fn10"><p><sup>j</sup>CTR: click-to-task ratio.</p></fn><fn id="table4fn11"><p><sup>k</sup>REM: rapid eye movement.</p></fn></table-wrap-foot></table-wrap><p>The mapping of tasks to objective metrics was derived from the functional characteristics of each task. Metrics such as task completion and time on task were applied universally as core usability indicators. The retry rate was assigned to tasks with likely repeated attempts in monitoring and chatbot interactions. Feature usage was linked to AI-driven features, demonstrating user engagement beyond basic monitoring. Navigation frequency was applied to tasks involving timelines and log exploration. Session duration was associated with tasks requiring extended engagement, such as report generation. The click-to-task ratio was included for tasks with multiple interaction steps. The task abandonment rate was assigned where drop-offs were likely, such as when viewing summaries and reports. This mapping ensures the replicability of linking system interactions to the 8 objective usability metrics.</p><p>To ensure that the objective usability measures reflected actual user behavior, each logged task was operationalized as a concrete interface-level action. Tasks such as view and observe were defined as opening and accessing a specific dashboard, chart, or panel until the user exited or switched pages. 
AI-related tasks were defined as explicit user-triggered actions, such as clicking an AI insight or advice function or submitting a chatbot query, with completion recorded when the system response was displayed. In <xref ref-type="table" rid="table4">Table 4</xref>, open indicates that the user accessed a dashboard, chart, panel, or report. Click AI indicates an explicit user request for AI-generated insights or advice. Exit/switch page indicates that the user left the target screen or moved to another module. AI output shown indicates successful system generation and display of the requested response.</p></sec><sec id="s2-15"><title>Data Analysis</title><sec id="s2-15-1"><title>User Activity Log Analysis</title><p>User activity logs were extracted from the system back end for all caregiver interaction sessions that were conducted during the study period. Each log entry included a time stamp, session identifier, user identifier, task name, action type (eg, started, completed, error, retry, and abandoned), task duration (in seconds), navigation events, and click events. As shown in <xref ref-type="fig" rid="figure6">Figure 6</xref>, these raw entries were processed into session-level metrics, aggregated across sessions for each user, and normalized by relevant totals (eg, total tasks started) to enable cross-user comparisons.</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Sequential steps for transforming raw log data into quantified usability measures.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig06.png"/></fig></sec><sec id="s2-15-2"><title>Metrics Computation</title><p>The raw interaction logs were parsed and preprocessed, aggregated at the session level, and used for metric extraction. 
From this pipeline, key objective behavioral indicators were computed, including task completion (TC), time on task (ToT), click-to-task ratio (CTR), retry rate (RR), feature usage (FU), navigation frequency (NF), session duration, and task abandonment rate (TAR). TC is the percentage of started tasks that were completed. This metric was calculated using equation 1.</p><disp-formula id="E1"><label>(1)</label><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">C</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mi mathvariant="normal">%</mml:mi><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:msub><mml:mi>C</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>S</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mfrac><mml:mo>&#x00D7;</mml:mo><mml:mn>100</mml:mn></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where <italic>C</italic><sub><italic>i</italic></sub> is the number of tasks of user <italic>i</italic> with completed status and <italic>S</italic><sub><italic>i</italic></sub> indicates the number of tasks with started status of user <italic>i</italic>. ToT measures how long it takes a user to begin or complete a task once they start interacting with the system. 
It is defined as:</p><disp-formula id="E2"><label>(2)</label><mml:math id="eqn2"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi mathvariant="normal">T</mml:mi><mml:mi mathvariant="normal">o</mml:mi><mml:mi mathvariant="normal">T</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:munderover><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:munderover><mml:mfrac><mml:msub><mml:mi>d</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mi>n</mml:mi></mml:mfrac></mml:mstyle></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where <italic>d</italic><sub><italic>i</italic></sub> is the duration of the <italic>i</italic>th completed task and <italic>n</italic> is the number of completed tasks. The RR measures how often users had to repeat a task before succeeding. For each task, if a user has multiple STARTED events before success, everything after the first event is a retry, defined as follows:</p><disp-formula id="E3"><label>(3)</label><mml:math id="eqn3"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mi>R</mml:mi><mml:msub><mml:mi>R</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:msub><mml:mi>r</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:msub><mml:mi>a</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where <italic>r</italic><sub><italic>i</italic></sub> is the number of times user <italic>i</italic> repeated a task after a failed attempt (errors, abandonments, and reclicks) and <italic>a</italic><sub><italic>i</italic></sub> is the total number of tasks the user initiated. 
FU counts user interactions per system feature and was calculated as FU<sub><italic>x</italic></sub> = <italic>N</italic><sub><italic>x</italic></sub>, where <italic>N</italic><sub><italic>x</italic></sub> is the count of feature <italic>x</italic> in the navigation logs. Session duration was calculated as follows:</p><disp-formula id="E4"><label>(4)</label><mml:math id="eqn4"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mi mathvariant="normal">S</mml:mi><mml:mi mathvariant="normal">D</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:msub><mml:mi>t</mml:mi><mml:mrow><mml:mi mathvariant="normal">e</mml:mi><mml:mi mathvariant="normal">n</mml:mi><mml:mi mathvariant="normal">d</mml:mi></mml:mrow></mml:msub><mml:mo>&#x2212;</mml:mo><mml:msub><mml:mi>t</mml:mi><mml:mrow><mml:mi mathvariant="normal">s</mml:mi><mml:mi mathvariant="normal">t</mml:mi><mml:mi mathvariant="normal">a</mml:mi><mml:mi mathvariant="normal">r</mml:mi><mml:mi mathvariant="normal">t</mml:mi></mml:mrow></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where <italic>t</italic><sub>start</sub> and <italic>t</italic><sub>end</sub> are the first and last actions in a session, respectively. The TAR is the percentage of tasks started but never completed and is defined as follows:</p><disp-formula id="E5"><label>(5)</label><mml:math id="eqn5"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mtext>TAR</mml:mtext><mml:mo stretchy="false">(</mml:mo><mml:mi mathvariant="normal">%</mml:mi><mml:mo stretchy="false">)</mml:mo><mml:mo>=</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:mfrac><mml:mi>A</mml:mi><mml:mi>S</mml:mi></mml:mfrac><mml:mo>)</mml:mo></mml:mrow><mml:mo>&#x00D7;</mml:mo><mml:mn>100</mml:mn></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where <italic>A</italic> is the number of abandoned tasks and <italic>S</italic> is the number of started tasks. 
CTR is the number of clicks per completed task, defined as CTR = <italic>K</italic>/<italic>C</italic>, where <italic>K</italic> is the number of click events and <italic>C</italic> is the number of completed tasks. NF is the number of times each navigation step/module is used, defined as NF<sub><italic>x</italic></sub> = <italic>N</italic><sub><italic>x</italic></sub>. All metrics were calculated per session and aggregated for user and cross-user analysis. <xref ref-type="table" rid="table5">Table 5</xref> presents the descriptive statistics of the 8 objective usability metrics collected from caregivers&#x2019; interactions with the EDT system.</p><table-wrap id="t5" position="float"><label>Table 5.</label><caption><p>Descriptive statistics of objective usability metrics.</p></caption><table id="table5" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom">Minimum</td><td align="left" valign="bottom">Maximum</td><td align="left" valign="bottom" colspan="2">Mean (SD)</td></tr></thead><tbody><tr><td align="left" valign="top">TC<sup><xref ref-type="table-fn" rid="table5fn1">a</xref></sup> (%)</td><td align="left" valign="top">82.93</td><td align="left" valign="top">98.02</td><td align="left" valign="top" colspan="2">94.08 (4.10)</td></tr><tr><td align="left" valign="top">RR<sup><xref ref-type="table-fn" rid="table5fn2">b</xref></sup></td><td align="left" valign="top">0.00</td><td align="left" valign="top">1.00</td><td align="left" valign="top" colspan="2">0.25 (0.28)</td></tr><tr><td align="left" valign="top">ToT<sup><xref ref-type="table-fn" rid="table5fn3">c</xref></sup> (seconds)</td><td align="left" valign="top">39.20</td><td align="left" valign="top">175.67</td><td align="left" valign="top" colspan="2">89.16 (21.97)</td></tr><tr><td align="left" valign="top">TAR<sup><xref ref-type="table-fn" rid="table5fn4">d</xref></sup> (%)</td><td align="left" valign="top">0.00</td><td align="left" valign="top">14.13</td><td align="left" valign="top" colspan="2">2.66 
(2.87)</td></tr><tr><td align="left" valign="top">CTR<sup><xref ref-type="table-fn" rid="table5fn5">e</xref></sup></td><td align="left" valign="top">0.12</td><td align="left" valign="top">1.32</td><td align="left" valign="top" colspan="2">0.48 (0.22)</td></tr><tr><td align="left" valign="top">NF<sup><xref ref-type="table-fn" rid="table5fn6">f</xref></sup></td><td align="left" valign="top">5.00</td><td align="left" valign="top">12.00</td><td align="left" valign="top" colspan="2">11.02 (1.39)</td></tr><tr><td align="left" valign="top">Session duration (minutes)</td><td align="left" valign="top">36.97</td><td align="left" valign="top">171.90</td><td align="left" valign="top" colspan="2">101.59 (30.17)</td></tr><tr><td align="left" valign="top">FU<sup><xref ref-type="table-fn" rid="table5fn7">g</xref></sup> (event count)</td><td align="left" valign="top">52</td><td align="left" valign="top">98</td><td align="left" valign="top" colspan="2">54 (13.4)</td></tr></tbody></table><table-wrap-foot><fn id="table5fn1"><p><sup>a</sup>TC: task completion.</p></fn><fn id="table5fn2"><p><sup>b</sup>RR: retry rate.</p></fn><fn id="table5fn3"><p><sup>c</sup>ToT: time on task.</p></fn><fn id="table5fn4"><p><sup>d</sup>TAR: task abandonment rate.</p></fn><fn id="table5fn5"><p><sup>e</sup>CTR: click-to-task ratio.</p></fn><fn id="table5fn6"><p><sup>f</sup>NF: navigation frequency.</p></fn><fn id="table5fn7"><p><sup>g</sup>FU: feature usage.</p></fn></table-wrap-foot></table-wrap><p>To establish the relationship between objective usability metrics derived from user activity logs and the dimensions of SUS, we mapped each metric to the SUS factors originally proposed by Borsci et al [<xref ref-type="bibr" rid="ref49">49</xref>] and Lewis and Sauro [<xref ref-type="bibr" rid="ref50">50</xref>]. 
Their analysis suggested that the SUS can be interpreted as comprising 2 correlated but distinct dimensions: usable (covering items related to effectiveness, efficiency, and overall ease of use) and learnable (covering items reflecting the ease of learning and initial onboarding, specifically items 4 and 10).</p><p>The mapping of objective usability metrics to the SUS dimensions is presented in <xref ref-type="table" rid="table6">Table 6</xref>. In this study, we adopted the 2-factor structure of SUS (usability and learnability) as proposed by Borsci et al [<xref ref-type="bibr" rid="ref49">49</xref>] and Lewis and Sauro [<xref ref-type="bibr" rid="ref50">50</xref>], which is the most widely validated and parsimonious model compared with alternative factor structures. In this mapping, performance-related measures such as task completion, efficiency, engagement, and error-related indicators are aligned with the usability factor, as they reflect effectiveness and overall ease of use. In contrast, retry-related measures are aligned with the learnability factor, as they directly capture the effort required for users to acquire proficiency during initial interactions. 
This mapping provides a conceptual bridge between objective behavior-based metrics and subjective usability perceptions, ensuring that activity log analysis contributes to the broader usability assessment framework represented by Borsci et al [<xref ref-type="bibr" rid="ref49">49</xref>] and Lewis and Sauro [<xref ref-type="bibr" rid="ref50">50</xref>].</p><table-wrap id="t6" position="float"><label>Table 6.</label><caption><p>The definitions of the usability metrics derived from system activity logs.</p></caption><table id="table6" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Objective metric</td><td align="left" valign="bottom">Relevant usability aspect (from literature)</td><td align="left" valign="bottom">Mapped SUS factor (Lewis and Sauro [<xref ref-type="bibr" rid="ref50">50</xref>])</td><td align="left" valign="bottom">References</td></tr></thead><tbody><tr><td align="left" valign="top">TC<sup><xref ref-type="table-fn" rid="table6fn1">a</xref></sup></td><td align="left" valign="top">Effectiveness (core usability outcome)</td><td align="left" valign="top">Usable (items 1, 3, 5, 7, 8, and 9)</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref52">52</xref>]</td></tr><tr><td align="left" valign="top">ToT<sup><xref ref-type="table-fn" rid="table6fn2">b</xref></sup></td><td align="left" valign="top">Efficiency</td><td align="left" valign="top">Usable (efficiency items contribute to overall ease-of-use perceptions)</td><td align="char" char="." 
valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref53">53</xref>]</td></tr><tr><td align="left" valign="top">RR<sup><xref ref-type="table-fn" rid="table6fn3">c</xref></sup></td><td align="left" valign="top">Learnability (ease of initial learning, errors before success)</td><td align="left" valign="top">Learnable (items 4 and 10: technical support and things to learn)</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref52">52</xref>]</td></tr><tr><td align="left" valign="top">FU<sup><xref ref-type="table-fn" rid="table6fn4">d</xref></sup></td><td align="left" valign="top">Discoverability (linked to usability breadth)</td><td align="left" valign="top">Usable (items 5 and 9: confidence and integration)</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref54">54</xref>]</td></tr><tr><td align="left" valign="top">Session duration</td><td align="left" valign="top">Engagement</td><td align="left" valign="top">Usable (general usability experience, confidence, ease, and satisfaction)</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref52">52</xref>]</td></tr><tr><td align="left" valign="top">TAR<sup><xref ref-type="table-fn" rid="table6fn5">e</xref></sup></td><td align="left" valign="top">Usability issues/unclear flow</td><td align="left" valign="top">Usable (same rationale as drop-off points)</td><td align="char" char="." 
valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref55">55</xref>]</td></tr><tr><td align="left" valign="top">CTR<sup><xref ref-type="table-fn" rid="table6fn6">f</xref></sup></td><td align="left" valign="top">Efficiency</td><td align="left" valign="top">Usable (efficiency dimension of usability)</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref52">52</xref>]</td></tr><tr><td align="left" valign="top">NF<sup><xref ref-type="table-fn" rid="table6fn7">g</xref></sup></td><td align="left" valign="top">User flow analysis</td><td align="left" valign="top">Usable (task integration, item 5 &#x201C;functions well integrated&#x201D;)</td><td align="char" char="." valign="top">[<xref ref-type="bibr" rid="ref49">49</xref>,<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]</td></tr></tbody></table><table-wrap-foot><fn id="table6fn1"><p><sup>a</sup>TC: task completion.</p></fn><fn id="table6fn2"><p><sup>b</sup>ToT: time on task.</p></fn><fn id="table6fn3"><p><sup>c</sup>RR: retry rate.</p></fn><fn id="table6fn4"><p><sup>d</sup>FU: feature usage.</p></fn><fn id="table6fn5"><p><sup>e</sup>TAR: task abandonment rate.</p></fn><fn id="table6fn6"><p><sup>f</sup>CTR: click-to-task ratio.</p></fn><fn id="table6fn7"><p><sup>g</sup>NF: navigation frequency.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s2-16"><title>User Engagement Based on Composite Behavioral Metrics</title><p>To capture a more holistic measure of user interaction with the EDT system, we computed a user engagement score (UES) by incorporating multiple behavioral indicators that were derived from the system logs. Specifically, 6 objective metrics were included: feature usage, average session duration, session frequency, task completion rate, error rate, and navigation diversity. 
Each captures a distinct aspect of usability: task efficiency, effectiveness, temporal aspects, and behavioral diversity [<xref ref-type="bibr" rid="ref51">51</xref>-<xref ref-type="bibr" rid="ref54">54</xref>,<xref ref-type="bibr" rid="ref56">56</xref>]. This composite scoring approach is essential for usability studies because it provides a multidimensional perspective on user interaction. These holistic measures are recognized as valid indicators of sustained adoption and user satisfaction [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]. To derive the composite engagement score, we initially extracted 8 metrics from the system log. Because not all metrics uniquely represented user engagement, we retained 6 core metrics that directly reflected the breadth, depth, and effectiveness of user interactions. These metrics included FU, ToT (seconds), total session duration (seconds), TC, error count, and NF. Each metric was then normalized to a (0, 1) scale using the maximum value observed in the dataset. 
The normalized values were subsequently combined using equal weights to produce a composite engagement score, as presented in equation 6.</p><disp-formula id="E8"><label>(6)</label><mml:math id="eqn6"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mrow><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">n</mml:mi><mml:mi mathvariant="normal">g</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mi>&#x03B1;</mml:mi><mml:msub><mml:mi>F</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>&#x03B2;</mml:mi><mml:msub><mml:mi>S</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>&#x03B3;</mml:mi><mml:msub><mml:mi>R</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>&#x03B4;</mml:mi><mml:msub><mml:mi>C</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>&#x03F5;</mml:mi><mml:msub><mml:mi>E</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:mi>&#x03B6;</mml:mi><mml:msub><mml:mi>D</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:mi>&#x03B1;</mml:mi><mml:mo>+</mml:mo><mml:mi>&#x03B2;</mml:mi><mml:mo>+</mml:mo><mml:mi>&#x03B3;</mml:mi><mml:mo>+</mml:mo><mml:mi>&#x03B4;</mml:mi><mml:mo>+</mml:mo><mml:mi>&#x03F5;</mml:mi><mml:mo>+</mml:mo><mml:mi>&#x03B6;</mml:mi></mml:mrow></mml:mfrac></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where <italic>F</italic><sub><italic>i</italic></sub> is the normalized feature usage for user <italic>i</italic>, <italic>S</italic><sub><italic>i</italic></sub> indicates normalized session duration, <italic>R</italic><sub><italic>i</italic></sub> is the normalized ToT, <italic>C</italic><sub><italic>i</italic></sub> shows the normalized values of TC, 
<italic>E</italic><sub><italic>i</italic></sub> is normalized error rate, <italic>D</italic><sub><italic>i</italic></sub> is the normalized navigation diversity, and &#x03B1;, <italic>&#x03B2;</italic>, &#x03B3;, &#x03B4;, &#x03B5;, and &#x03B6; are the weights. All weights were set to be equal (&#x03B1; = <italic>&#x03B2;</italic> = &#x03B3; = &#x03B4; = &#x03B5; = &#x03B6; = 1) so that each engagement dimension contributed uniformly to the composite score. An equal-weight additive formulation was selected as a pragmatic postnormalization approach to combine the engagement metrics while avoiding bias or subjective prioritization in the absence of empirical evidence regarding their relative importance. Prior literature on composite scoring has similarly used unit weights as a baseline when neither theoretical nor empirical justification exists for different weighting [<xref ref-type="bibr" rid="ref59">59</xref>-<xref ref-type="bibr" rid="ref61">61</xref>]. Because formal testing of interdependence or dimensional structure among the component metrics was not performed in this study, the resulting engagement score should be interpreted as an operational composite summary rather than a formally validated latent construct. For interpretability, k-means clustering with <italic>k</italic>=3 was then applied to classify users into low-, medium-, and high-engagement groups.</p></sec><sec id="s2-17"><title>The SUS</title><p>The usability of the EDT system was evaluated using the SUS, a standardized 10-item questionnaire widely used to assess the perceived usability of interactive systems. Each item was rated on a 5-point Likert scale ranging from 1 (strongly disagree) to 5 (strongly agree). SUS data were collected from 50 informal caregivers. To compute individual SUS scores, responses to odd-numbered items were scored as the participant&#x2019;s rating minus 1, whereas responses to even-numbered items were scored as 5 minus the rating. 
The adjusted item scores were summed and multiplied by 2.5, yielding total SUS scores ranging from 0 to 100. In addition, item-level descriptive statistics were computed for all 10 items. Internal consistency was evaluated using Cronbach &#x03B1; [<xref ref-type="bibr" rid="ref62">62</xref>] after reverse-scoring the negatively worded items so that higher scores consistently indicated greater perceived usability, as defined in <xref ref-type="disp-formula" rid="E6">equation 7</xref>.</p><disp-formula id="E6"><label>(7)</label><mml:math id="eqn7"><mml:mrow><mml:mi>&#x03B1;</mml:mi><mml:mo>=</mml:mo><mml:mfrac><mml:mi>k</mml:mi><mml:mrow><mml:mi>k</mml:mi><mml:mo>&#x2212;</mml:mo><mml:mn>1</mml:mn></mml:mrow></mml:mfrac><mml:mfenced><mml:mrow><mml:mn>1</mml:mn><mml:mo>&#x2212;</mml:mo><mml:mfrac><mml:mrow><mml:mstyle displaystyle="true"><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi><mml:mo>=</mml:mo><mml:mn>1</mml:mn></mml:mrow><mml:mi>k</mml:mi></mml:munderover><mml:mrow><mml:msubsup><mml:mi>&#x03C3;</mml:mi><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mstyle></mml:mrow><mml:mrow><mml:msubsup><mml:mi>&#x03C3;</mml:mi><mml:mi>T</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:mfrac></mml:mrow></mml:mfenced></mml:mrow></mml:math></disp-formula><p>where <italic>k</italic> is the number of items, <inline-formula><mml:math id="ieqn1"><mml:mrow><mml:msubsup><mml:mi>&#x03C3;</mml:mi><mml:mi>i</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula> is the variance of each individual item, and <inline-formula><mml:math id="ieqn2"><mml:mrow><mml:msubsup><mml:mi>&#x03C3;</mml:mi><mml:mi>T</mml:mi><mml:mn>2</mml:mn></mml:msubsup></mml:mrow></mml:math></inline-formula> is the variance of total score (sum across all items).</p></sec><sec id="s2-18"><title>Correlation and Regression Analysis of Engagement and Perceived Usability</title><p>To investigate the relationship between the composite behavioral 
metric and perceived usability, we first examined the correlation between the UES and the SUS. The normality of both variables (UES and SUS) was tested using the Shapiro-Wilk test. As SUS scores deviated from normality, Spearman rank correlation (&#x03C1;) was selected as the primary measure of association, and Pearson correlation (<italic>r</italic>) was also reported for completeness. Bootstrapped 95% CIs were computed to quantify the precision of the correlation estimates. Following the correlation analysis, we conducted a simple linear regression to test whether the UES predicts the SUS. The regression was specified as follows:</p><disp-formula id="E7"><label>(8)</label><mml:math id="eqn8"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:mstyle displaystyle="true" scriptlevel="0"><mml:msub><mml:mrow><mml:mi mathvariant="normal">S</mml:mi><mml:mi mathvariant="normal">U</mml:mi><mml:mi mathvariant="normal">S</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mn>0</mml:mn></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03B2;</mml:mi><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">U</mml:mi><mml:mi mathvariant="normal">E</mml:mi><mml:mi mathvariant="normal">S</mml:mi></mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03F5;</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where SUS<sub><italic>i</italic></sub> is the usability score for user <italic>i</italic>, UES<sub><italic>i</italic></sub> is the engagement score, <italic>&#x03B2;</italic><sub>0</sub> is the intercept, <italic>&#x03B2;</italic><sub>1</sub> is the regression coefficient, and &#x03B5;<italic><sub>i</sub></italic> is the error term. 
Model fit was evaluated with <italic>R</italic><sup>2</sup>, the <italic>F</italic> statistic, and coefficient significance. This 2-step approach enabled us to first establish the strength and direction of the association between user engagement and usability and then assess the predictive power of the UES for the SUS, thereby linking objective behavioral data with subjective ratings.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Overview</title><p>This study assessed the EDT system usability among informal caregivers by analyzing objective user interactions and subjective perceptions of usability (SUS). Three aspects were analyzed: (1) SUS survey results reflecting perceived usability, (2) patterns of composite UESs from system logs, and (3) the relationship between user engagement and usability using correlation and regression analyses. These findings address the study aim of assessing EDT system usability using objective behavioral metrics and subjective measurements and examining whether behavioral engagement indicates perceived system usability.</p></sec><sec id="s3-2"><title>SUS Results</title><p>Item-level response patterns for the 10 SUS items are presented in <xref ref-type="fig" rid="figure7">Figure 7</xref>, with descriptive statistics shown in <xref ref-type="table" rid="table7">Table 7</xref>. Overall, caregivers responded positively to the positively worded items and showed low agreement with the negatively worded items, indicating favorable usability perceptions of the EDT system. Higher mean scores were observed for confidence in using the system, integration of system functions, and intention to use it frequently, whereas lower agreement with negatively phrased items suggested limited perceived complexity, inconsistency, and need for technical support. 
The SUS also demonstrated strong internal consistency, with a Cronbach &#x03B1; of 0.87, indicating reliable measurement of perceived usability.</p><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Distribution of responses to the 10 System Usability Scale items among caregivers (n=50). Percentages are shown on the top axis (0%&#x2010;100%). EDT: elderly digital twin.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig07.png"/></fig><table-wrap id="t7" position="float"><label>Table 7.</label><caption><p>Item-level descriptive statistics for the 10 System Usability Scale questions.</p></caption><table id="table7" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Item</td><td align="left" valign="bottom">Mean (SD)</td><td align="left" valign="bottom">Minimum</td><td align="left" valign="bottom">Maximum</td></tr></thead><tbody><tr><td align="left" valign="top">Q1</td><td align="left" valign="top">4.54 (0.8)</td><td align="left" valign="top">2.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q2</td><td align="left" valign="top">1.96 (1.18)</td><td align="left" valign="top">1.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q3</td><td align="left" valign="top">4.50 (0.79)</td><td align="left" valign="top">2.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q4</td><td align="left" valign="top">2.18 (1.26)</td><td align="left" valign="top">1.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q5</td><td align="left" valign="top">4.48 (0.79)</td><td align="left" valign="top">2.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q6</td><td align="left" valign="top">1.86 (1.20)</td><td align="left" valign="top">1.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" 
valign="top">Q7</td><td align="left" valign="top">4.40 (0.78)</td><td align="left" valign="top">2.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q8</td><td align="left" valign="top">1.86 (1.20)</td><td align="left" valign="top">1.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q9</td><td align="left" valign="top">4.42 (0.91)</td><td align="left" valign="top">1.0</td><td align="left" valign="top">5.0</td></tr><tr><td align="left" valign="top">Q10</td><td align="left" valign="top">2.30 (1.30)</td><td align="left" valign="top">1.0</td><td align="left" valign="top">5.0</td></tr></tbody></table></table-wrap><p>The overall SUS scores (N=50) ranged from 42.5 to 100, with a mean of 80.45 (SD 17.65), indicating a generally favorable perception of usability by caregivers. As shown in <xref ref-type="table" rid="table8">Table 8</xref>, the SUS scores varied descriptively across the caregiving experience levels. Caregivers with more than 6 years of experience reported the highest mean score (mean 86.7, SD 21.8), followed by those with 1&#x2010;3 (mean 83.5, SD 14.5) years and 4&#x2010;6 (mean 81.0, SD 16.8) years of experience. Caregivers with less than 1 year of experience reported the lowest mean score (mean 70.9, SD 20.3). A 1-way ANOVA was used to test whether these differences were statistically significant. Although the descriptive pattern suggested higher usability perception among more experienced caregivers, the ANOVA results were not statistically significant (<italic>F</italic><sub>3,46</sub>=1.58; <italic>P</italic>=.208, &#x03B7;&#x00B2;=0.093). 
The effect size indicates that approximately 9.3% of the variance in the SUS scores was explained by caregiving experience, reflecting a small to moderate effect.</p><table-wrap id="t8" position="float"><label>Table 8.</label><caption><p>Mean System Usability Scale scores by caregiving experience and age group.</p></caption><table id="table8" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category (group)</td><td align="left" valign="bottom">Mean (SD) SUS<sup><xref ref-type="table-fn" rid="table8fn1">a</xref></sup> score<sup><xref ref-type="table-fn" rid="table8fn2">b</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">Caregiving experience (years)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003C;1</td><td align="char" char="." valign="top">70.9 (20.3)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>1&#x2010;3</td><td align="char" char="." valign="top">83.5 (14.5)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>4&#x2010;6</td><td align="char" char="." valign="top">81.0 (16.8)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>&#x003E;6</td><td align="char" char="." valign="top">86.7 (21.8)</td></tr><tr><td align="left" valign="top">Age group (years)</td><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>18&#x2010;25</td><td align="char" char="." valign="top">80.8 (17.0)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>26&#x2010;35</td><td align="char" char="." 
valign="top">80.8 (16.1)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>36&#x2010;45</td><td align="char" char="." valign="top">77.0 (21.6)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>46&#x2010;50</td><td align="char" char="." valign="top">83.3 (18.4)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>51&#x2010;55</td><td align="char" char="." valign="top">92.5 (0.0)</td></tr></tbody></table><table-wrap-foot><fn id="table8fn1"><p><sup>a</sup>SUS: System Usability Scale.</p></fn><fn id="table8fn2"><p><sup>b</sup>Overall mean score 80.45 (SD 17.65).</p></fn></table-wrap-foot></table-wrap><p>SUS scores also showed descriptive variation across age groups, as presented in <xref ref-type="table" rid="table8">Table 8</xref>. Caregivers aged 51&#x2010;55 years reported the highest mean score (mean 92.5, SD 0.0), while those aged 36&#x2010;45 years reported the lowest (mean 77.0, SD 21.6). Younger caregivers (aged 18&#x2010;25 and 26&#x2010;35 years) reported similar mean scores (mean 80.8), and caregivers aged 46&#x2010;50 years also rated usability favorably (mean 83.3, SD 18.4). However, 1-way ANOVA found no statistically significant differences across age groups (<italic>F</italic><sub>4,45</sub>=0.399; <italic>P</italic>=.808, &#x03B7;&#x00B2;=0.034). This small effect size indicates that age accounted for only approximately 3.4% of the variance in the SUS scores. Thus, age did not meaningfully influence caregivers&#x2019; evaluations of the system. 
Overall, the mean SUS score of 80.45 exceeded the commonly cited 68-point benchmark and fell within the &#x201C;excellent&#x201D; range (&#x2265;80), showing that caregivers evaluated the EDT system very favorably.</p><p>Beyond demographic differences, we performed k-means clustering to classify caregivers&#x2019; SUS scores into 3 groups: low (mean 52.7), medium (mean 79.4), and high (mean 94.30). As shown in <xref ref-type="fig" rid="figure8">Figure 8</xref>, the clusters clearly distinguished participants with below-average usability perceptions from those who reported excellent usability. Most caregivers fell into the medium to high clusters, reinforcing the overall favorable evaluation of the system, while a smaller subgroup reflected lower usability perceptions, indicating areas for targeted improvements.</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>K-means clustering of SUS (N=50) into low, medium, and high groups. Dashed lines indicate cluster centroids. SUS: System Usability Scale.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig08.png"/></fig></sec><sec id="s3-3"><title>User Engagement Based on Composite Behavioral Metrics Results</title><p>The composite UES was computed for all participants based on normalized behavioral metrics. The scores ranged from 0.55 to 0.86, with the majority of users clustering between 0.70 and 0.80, as shown in <xref ref-type="fig" rid="figure9">Figure 9</xref>. 
The distribution was slightly skewed toward higher engagement, indicating that most participants interacted consistently with the EDT system features, whereas only a few exhibited lower engagement levels.</p><fig position="float" id="figure9"><label>Figure 9.</label><caption><p>Distribution of composite engagement scores across users.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig09.png"/></fig><p>For interpretability, users were classified into 3 engagement tiers (low, medium, and high) using k-means clustering (<italic>k</italic>=3). The results showed that most users belonged to the medium engagement group, with smaller proportions in the high- and low-engagement tiers, as shown in <xref ref-type="fig" rid="figure10">Figure 10</xref>. This distribution indicates distinct user subgroups, with strong engagement among highly engaged users and lower, yet observable, interaction among the least engaged. Overall, the pattern suggests that the EDT system supported sustained interaction for most users.</p><fig position="float" id="figure10"><label>Figure 10.</label><caption><p>Composite user engagement tiers using k-means clustering (<italic>k</italic>=3).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig10.png"/></fig></sec><sec id="s3-4"><title>Correlation and Regression Results for Engagement and Perceived Usability</title><p>Building on the relationship between the UES and SUS, we examined how user behavioral measures can predict the SUS of the EDT system. As shown in <xref ref-type="table" rid="table9">Table 9</xref>, the regression analysis further demonstrated that UES significantly predicted usability scores (<italic>F</italic><sub>1, 48</sub>=31.00, <italic>P</italic>&#x003C;.001), explaining 39.2% of the variance (<italic>R</italic><sup>2</sup>=0.392). 
Engagement was a positive predictor (<italic>&#x03B2;</italic>=52.94, <italic>t</italic><sub>48</sub>=5.57; <italic>P</italic>&#x003C;.001), indicating that higher engagement was associated with higher SUS ratings. <xref ref-type="fig" rid="figure11">Figure 11</xref> illustrates the correlation between SUS and UES.</p><fig position="float" id="figure11"><label>Figure 11.</label><caption><p>Scatterplot of engagement and SUS scores with Pearson linear fit (solid line) and Spearman monotonic trend (dashed line). OLS: ordinary least squares; SUS: System Usability Scale.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e91873_fig11.png"/></fig><table-wrap id="t9" position="float"><label>Table 9.</label><caption><p>Correlation between System Usability Scale and composite user engagement scores.</p></caption><table id="table9" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Analysis and variable</td><td align="left" valign="bottom">Statistics (<italic>r</italic>/&#x03C1;)/<italic>&#x03B2;</italic> (coefficient)<sup><xref ref-type="table-fn" rid="table9fn1">a</xref></sup></td><td align="left" valign="bottom"><italic>P</italic> value</td><td align="left" valign="bottom">95% CI</td><td align="left" valign="bottom"><italic>R</italic><sup>2</sup></td><td align="left" valign="bottom">SE</td><td align="left" valign="bottom"><italic>t</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Correlation</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Pearson <italic>r</italic></td><td align="left" valign="top">0.626</td><td align="char" char="." valign="top">&#x003C;.001</td><td align="char" char="." 
valign="top">0.417-0.778</td><td align="char" char="." valign="top">&#x2014;<sup><xref ref-type="table-fn" rid="table9fn2">b</xref></sup></td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Spearman &#x03C1;</td><td align="left" valign="top">0.552</td><td align="char" char="." valign="top">&#x003C;.001</td><td align="char" char="." valign="top">0.311-0.734</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">&#x2014;</td></tr><tr><td align="left" valign="top">Regression</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Intercept</td><td align="left" valign="top">55.73</td><td align="char" char="." valign="top">&#x003C;.001</td><td align="char" char="." valign="top">45.97-65.49</td><td align="left" valign="top">&#x2014;</td><td align="left" valign="top">4.86</td><td align="left" valign="top">11.48</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>UES (<italic>&#x03B2;</italic>)</td><td align="left" valign="top">52.94</td><td align="char" char="." valign="top">&#x003C;.001</td><td align="char" char="." valign="top">33.82-72.05</td><td align="char" char="." 
valign="top">0.392</td><td align="left" valign="top">9.51</td><td align="left" valign="top">5.57</td></tr></tbody></table><table-wrap-foot><fn id="table9fn1"><p><sup>a</sup><italic>r</italic> indicates the Pearson correlation coefficient; &#x03C1; indicates the Spearman rank correlation coefficient; <italic>&#x03B2;</italic> indicates the regression coefficient.</p></fn><fn id="table9fn2"><p><sup>b</sup>Not available.</p></fn></table-wrap-foot></table-wrap></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study found that the EDT system achieved generally positive usability outcomes among informal caregivers based on both subjective perceptions and objective behavioral metrics. SUS results suggested favorable perceived usability, and user activity logs reflected meaningful engagement with system features. The observed association between SUS and UES further indicates that behavioral metrics may complement self-reported usability measures in evaluating caregiver-facing digital health systems.</p></sec><sec id="s4-2"><title>Usability Evaluation Outcomes</title><p>The EDT system attained a mean SUS score of 80.45, exceeding the widely accepted threshold of 68 for above-average usability [<xref ref-type="bibr" rid="ref19">19</xref>]. A score above 80 is typically interpreted as excellent usability [<xref ref-type="bibr" rid="ref63">63</xref>]. In this sample, these results suggest that the participating informal caregivers perceived the EDT interface as relatively easy to learn and efficient to use. The composite UES derived from detailed activity logs was positively correlated with the SUS (Pearson <italic>r</italic>=0.626, Spearman &#x03C1;=0.552). The significant correlation between UES and SUS highlights the complementary nature of behavioral and perceptual usability measures. 
While the SUS captures caregivers&#x2019; subjective impressions of the system&#x2019;s ease of use and satisfaction, the UES quantifies the depth and quality of their actual interactions. The strength of the observed correlation between the UES and the SUS can be interpreted as moderate to strong, where the correlation between performance and satisfaction metrics generally ranges from 0.38 to 0.70 and often does not exceed 0.7 [<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref64">64</xref>].</p><p>Beyond this association, regression analysis demonstrated that UES was a meaningful predictor of the SUS, explaining 39.2% of its variance. In the regression model, the <italic>F</italic>-test result (<italic>F</italic><sub>1, 48</sub>=31.00, <italic>P</italic>&#x003C;.001) indicated that the model with UES as a predictor of SUS was statistically significant overall. The intercept (constant = 55.73) represents the predicted SUS value when UES equals zero; because zero engagement was not observed in the study data, this value should be interpreted as a model constant rather than a substantively meaningful estimate. Engagement score (<italic>&#x03B2;</italic>=52.94, <italic>P</italic>&#x003C;.001) indicates that for every 1-point increase in UES (on its 0&#x2010;1 scale), SUS is predicted to increase by about 53 points. The coefficient of determination (<italic>R</italic>&#x00B2;=0.392) indicated that 39.2% of the variance in SUS was explained by UES. Because the model included only 1 predictor, this value is also consistent with the squared Pearson correlation between UES and SUS. The adjusted <italic>R</italic><sup>2</sup> value of approximately 0.38 suggests a comparable level of explained variance after accounting for sample size. 
Although much of the remaining variance is likely attributable to other factors influencing perceived usability, these results support a meaningful association between behavioral engagement and perceived usability within this sample.</p><p>In human-computer interaction research, behavioral predictors typically explain only part of the variance in subjective satisfaction metrics. Studies have shown that behavioral log data account for 30%&#x2010;40% of the variance in perceived usability, with the remainder due to unobserved factors [<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref66">66</xref>]. This aligns with strong task performance metrics: task completion 94.08%, time on task 89.16 seconds, abandonment rate 2.66%, and retry rate 0.25%, as shown in <xref ref-type="table" rid="table5">Table 5</xref>, demonstrating that objective engagement correlates with perceived usability.</p><p>The clustering of engagement scores into high-, medium-, and low-tier groups (<xref ref-type="fig" rid="figure10">Figure 10</xref>) reveals how caregivers interact with the EDT system. Users in the high-engagement cluster achieved strong task performance and high SUS scores, reflecting meaningful interactions. The medium engagement group showed satisfactory engagement with lower SUS scores, whereas the low-engagement group displayed limited interaction and lower usability perception. This analysis shows that users experience the system differently, highlighting the need to tailor system design and support for different engagement profiles. Demographic checks showed no significant difference in SUS scores by age (ANOVA <italic>F</italic><sub>4, 45</sub>=0.399; <italic>P</italic>=.81, &#x03B7;&#x00B2;=0.034) or caregiving experience (ANOVA <italic>F</italic><sub>3, 46</sub>=1.58; <italic>P</italic>=.21, &#x03B7;&#x00B2;=0.093), indicating consistent perceived usability across the groups. 
The convergence of high perceived usability with high task performance provides evidence that the EDT system is usable and effective for caregivers. Higher SUS ratings correlated with more intensive interactions, demonstrating the system&#x2019;s support for meaningful use in caregiving contexts. These behavioral indicators in the composite UES strengthen the predictive relationship between the UES and the SUS, showing that engaged caregivers achieve higher task success and perceive better usability.</p></sec><sec id="s4-3"><title>Theoretical Implications</title><p>The results demonstrate the complementarity between subjective and objective measures. While the SUS provides standardized user perception data with benchmarking values [<xref ref-type="bibr" rid="ref19">19</xref>,<xref ref-type="bibr" rid="ref22">22</xref>], it cannot reveal how users succeed or struggle during interactions [<xref ref-type="bibr" rid="ref64">64</xref>]. By combining the SUS with UES behavioral analytics, our study showed that objective measures strengthen construct validity and highlight engagement heterogeneity that postuse scores may miss. In developing the UES, we refined the engagement score using foundational indicators of breadth, depth, and effectiveness of use, avoiding redundant measures, and ensuring interpretability. Equal weights were applied to the metrics, a defensible choice without prior evidence of differential importance. Future research could explore data-driven weighting strategies, such as principal component analysis, regression models, or SHAP analyses, using larger datasets [<xref ref-type="bibr" rid="ref67">67</xref>].</p><p>Another important implication concerns the demographic sensitivity of the SUS. The ANOVA analysis showed no significant differences in usability scores by age or caregiving experience, suggesting that the SUS may be relatively stable across these demographic groups within this sample. 
The positive association between SUS and UES indicates that perceived usability and behavioral engagement are related. However, the present findings primarily demonstrate convergence between these measures rather than fully establishing their empirical complementarity. Future work should also examine more directly how both measures may capture distinct usability patterns and subgroup needs.</p></sec><sec id="s4-4"><title>Practical Implications for Health Care Systems</title><p>The findings of this study have important implications for the use of DT systems in health care settings. First, the alignment between high SUS scores and favorable task performance metrics suggests that designers should prioritize core workflows that caregivers value most: real-time vital sign monitoring, health trend visualization, abnormal event alerts, and AI-based recommendations. Maintaining simplicity in these functions is essential for building caregiver trust and encouraging adoption. Second, the clustering analysis of the composite UES showed varied system engagement levels, with a small subgroup in the low engagement cluster. This finding indicates the need for an adaptive user interface. Designers should provide configurable interaction modes, progressive onboarding, and contextual help features to address the diverse needs and digital literacy levels of caregivers. Such adaptations can reduce the engagement barriers among different user groups. Third, given the central role of predictive modeling in EDT systems, such as Bi-LSTM for heart rate prediction and long short-term memory for sleep stage inference, AI-generated insights must be transparent and actionable. Caregivers must be able to distinguish between real-time data and predictions, with alerts that are accompanied by clear rationales. 
This enhances interpretability and reduces inappropriate decision-making in care settings.</p><p>Finally, this study emphasizes the need to support informal caregivers who frequently multitask and experience cognitive and emotional strain. EDT systems should adopt design strategies for rapid comprehension, including glanceable dashboards, consistent information hierarchies, and conservative notification policies to avoid alarm fatigue in users. This study demonstrates the value of behavioral analytics in pilot deployments, with system-generated logs supporting usability evaluation and providing feedback for refinement. Health care DT developers should integrate privacy-preserving analytics to monitor navigation issues and feature abandonment during real-world applications to guide design improvements and caregiver training. The results show that caregiver-facing DT systems must optimize core workflows while offering adaptability and transparency. These principles enable health care DT systems to support informal caregivers, enhance decision-making, and integrate digital health technologies into caregiving practices.</p></sec><sec id="s4-5"><title>Comparative Positioning and Methodological Contribution</title><p>To situate the usability of the EDT system within the broader digital health literature, we compared its SUS scores with those reported in prior studies on related technologies, as shown in <xref ref-type="table" rid="table10">Table 10</xref>. The EDT system achieved 80.45, which falls within the &#x201C;excellent&#x201D; range and exceeds the values reported for many comparable systems, such as VITAAL (58.3), Pocket Gait (59.7), and ED Health Information System (53.1). Some systems, such as the CHES eDiary (87.5), achieved similarly high SUS scores, although often in more narrowly defined use cases than the others. This benchmark highlights 2 important contributions to literature. 
First, the EDT system ranks among the higher-performing digital health technologies in terms of perceived usability, reinforcing its readiness for use in caregiver-facing applications. Second, unlike most prior studies that relied exclusively on the SUS or paired it with limited subjective feedback (eg, interviews and acceptability scales), our study integrated objective behavioral metrics derived from detailed user activity logs. This dual-method approach strengthens the robustness of the evaluation and provides a replicable methodological pathway for future assessments of DT technologies in health care.</p><table-wrap id="t10" position="float"><label>Table 10.</label><caption><p>Comparative System Usability Scale scores of related studies and the elderly digital twin system.</p></caption><table id="table10" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Study/System</td><td align="left" valign="bottom">SUS<sup><xref ref-type="table-fn" rid="table10fn1">a</xref></sup> score (reported)</td><td align="left" valign="bottom">Measures/Metrics used</td></tr></thead><tbody><tr><td align="left" valign="top">HELMA [<xref ref-type="bibr" rid="ref14">14</xref>]</td><td align="left" valign="top">72.2 (caregivers)</td><td align="left" valign="top">SUS + Partial usage logs</td></tr><tr><td align="left" valign="top">Engage [<xref ref-type="bibr" rid="ref13">13</xref>]</td><td align="left" valign="top">66.3 &#x2192; 82.6</td><td align="left" valign="top">SUS + NASA-TLX</td></tr><tr><td align="left" valign="top">VITAAL [<xref ref-type="bibr" rid="ref15">15</xref>]</td><td align="left" valign="top">58.3</td><td align="left" valign="top">SUS + Feedback sessions</td></tr><tr><td align="left" valign="top">Pocket Gait [<xref ref-type="bibr" rid="ref17">17</xref>]</td><td align="left" valign="top">59.7</td><td align="left" valign="top">SUS + Acceptability scale</td></tr><tr><td align="left" valign="top">CHES eDiary [<xref ref-type="bibr" 
rid="ref45">45</xref>]</td><td align="left" valign="top">87.5</td><td align="left" valign="top">SUS + Walkthrough</td></tr><tr><td align="left" valign="top">TMS [<xref ref-type="bibr" rid="ref16">16</xref>]</td><td align="left" valign="top">69.2</td><td align="left" valign="top">SUS</td></tr><tr><td align="left" valign="top">HeartAround [<xref ref-type="bibr" rid="ref46">46</xref>]</td><td align="left" valign="top">62.2 &#x2192; 78.8</td><td align="left" valign="top">SUS + Interview</td></tr><tr><td align="left" valign="top">ED Health Info System [<xref ref-type="bibr" rid="ref47">47</xref>]</td><td align="left" valign="top">53.1</td><td align="left" valign="top">SUS + Interview</td></tr><tr><td align="left" valign="top">Our Study (EDT System)</td><td align="left" valign="top">80.45</td><td align="left" valign="top">SUS + Activity log metrics (UES<sup><xref ref-type="table-fn" rid="table10fn2">b</xref></sup>, tasks)</td></tr></tbody></table><table-wrap-foot><fn id="table10fn1"><p><sup>a</sup>SUS: System Usability Scale.</p></fn><fn id="table10fn2"><p><sup>b</sup>UES: user engagement score.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s4-6"><title>Limitations</title><p>Despite these strengths, several limitations must be acknowledged in this study. First, the sample size (n=50) limits the generalizability of the findings, and future research should validate the results with larger and more diverse caregiver populations. Second, the evaluation was conducted in a single-system context (the EDT prototype), which constrains external validity; usability outcomes may differ when deployed in varied care environments or integrated with other health systems. Third, although the SUS is a widely validated tool [<xref ref-type="bibr" rid="ref63">63</xref>], it remains a subjective self-reported measure that can be influenced by user expectations, prior experience, or social desirability bias [<xref ref-type="bibr" rid="ref68">68</xref>]. 
Although we mitigated this limitation by complementing SUS with objective behavioral logs, reliance on a single subjective scale may not fully capture all dimensions of usability. Finally, the cross-sectional study design limits our ability to assess how engagement and usability perceptions evolve over time. Longitudinal studies are needed to capture the changes in caregiver interactions and satisfaction with sustained system use.</p><p>This study does not establish clinical validity or support the use of EDT as a diagnostic or treatment tool. The prototype was evaluated as a caregiver-oriented decision support and usability research system rather than as a regulated medical device, and the Fitbit Sense 2 used for sensing should be regarded as a consumer-grade wearable rather than a clinical reference device. In addition, the predictive components were evaluated only on the available study dataset, and no independent external sample validation was performed. Accordingly, the reported model performance metrics should be interpreted as preliminary indicators of technical feasibility rather than evidence of clinical-grade validity, external validity, or broader generalizability. Similarly, the LLM-generated outputs were intended to provide caregiver-friendly support, monitoring guidance, and follow-up suggestions rather than medical diagnosis or treatment advice. Furthermore, the composite engagement score was constructed using a pragmatic equal-weight additive approach, and formal testing of interdependence among its component metrics was not conducted.</p></sec><sec id="s4-7"><title>System Improvements and Future Work</title><p>This usability evaluation provided valuable lessons for refining the EDT. The system demonstrated excellent usability and high effectiveness, with a 94.08% task completion rate and low error rates. However, the findings reveal areas for enhancing system inclusivity and adoption. 
The small proportion of abandoned tasks (2.66%) and minimal retries (0.25 per task) indicated that certain interactions may challenge some users, particularly those in the low-engagement cluster identified in UES tiering. The average task time indicates overall efficiency but varies across engagement tiers. Medium- and low-engagement users required more time and retries, suggesting opportunities to streamline workflows. Simplifying navigation and reducing cognitive load can improve efficiency across different user profiles. Clustering analysis showed varied usability outcomes across users. Future development should address caregiver experience heterogeneity by tailoring features to different profiles, such as contextual prompts for low-engagement users and advanced features for high-engagement users. Future work should expand the evaluation to more diverse caregiver populations, examine patterns of engagement and usability, incorporate contextual factors such as digital literacy and caregiving intensity, and evaluate the EDT in more naturalistic home care settings using scenarios grounded in real caregiver workflows to strengthen ecological validity. Future research should also examine intermetric correlations, dimensional structure, and alternative weighting strategies to further validate the composite engagement score. In addition, independent external datasets, prospective evaluation, and real-world deployment testing are needed to establish the robustness and generalizability of the predictive components more rigorously. Together, these efforts will help validate our findings and guide further improvements to ensure that the EDT system remains usable and responsive to caregiving practices.</p></sec><sec id="s4-8"><title>Conclusions</title><p>This study evaluated the usability of the EDT system by combining subjective perceptions with objective behavioral data. 
The findings demonstrated excellent usability and strong task performance, with high completion rates and low error and abandonment rates. Correlation and regression analyses showed that the composite UES was not only positively associated with but also a significant predictor of usability, explaining 39.2% of the variance in SUS. Clustering further revealed differences in engagement tiers, underscoring that usability outcomes are not uniform across users. Taken together, these results highlight the value of integrating subjective and objective measures to capture a comprehensive picture of product usability. This study contributes methodologically by linking behavioral engagement metrics with perceived usability, particularly by identifying the strengths and areas for improvement in EDT systems. Future studies should validate these findings in larger and more diverse caregiver populations, explore longitudinal engagement patterns, and incorporate adaptive features to support users with varying engagement profiles.</p></sec></sec></body><back><ack><p>The authors would like to thank all study participants for their valuable time and insights during the usability testing sessions. The authors also extend special thanks to Miss Sutthikarn Chanthakup for her assistance as a local Thai research assistant, particularly in facilitating communication with Thai participants during data collection. This research was supported by the Petchra Pra Jom Klao Research Scholarship from King Mongkut&#x2019;s University of Technology Thonburi (KMUTT). The authors confirm that no generative artificial intelligence tools were used for writing, editing, data analysis, figure generation, or other content generation during the preparation of this manuscript. 
The authors take full responsibility for the accuracy, originality, and integrity of all content in the manuscript.</p></ack><notes><sec><title>Funding</title><p>No financial support or grants were received from any public, commercial, or not-for-profit entities for the research, authorship, or publication of this article.</p></sec><sec><title>Data Availability</title><p>The datasets generated and analyzed in this study are available in Zenodo [<xref ref-type="bibr" rid="ref69">69</xref>] and include anonymized data and supporting materials required to reproduce the study findings. Access to the elderly digital twin system link is available from the authors upon reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>ZM contributed to conceptualization, methodology, data collection, formal analysis, and writing &#x2013; original draft. PM participated in supervision, validation, and writing &#x2013; review &#x0026; editing. DP participated in supervision, methodology, and writing &#x2013; review &#x0026; editing. 
SY participated in supervision and writing &#x2013; review &#x0026; editing.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">Bi-LSTM</term><def><p>bidirectional long short-term memory</p></def></def-item><def-item><term id="abb3">CTR</term><def><p>click-to-task ratio</p></def></def-item><def-item><term id="abb4">DT</term><def><p>digital twin</p></def></def-item><def-item><term id="abb5">EDT</term><def><p>elderly digital twin</p></def></def-item><def-item><term id="abb6">FU</term><def><p>feature usage</p></def></def-item><def-item><term id="abb7">HRV</term><def><p>heart rate variability</p></def></def-item><def-item><term id="abb8">ISO</term><def><p>International Organization for Standardization</p></def></def-item><def-item><term id="abb9">LLM</term><def><p>large language model</p></def></def-item><def-item><term id="abb10">NASA-TLX</term><def><p>National Aeronautics and Space Administration&#x2014;Task Load Index</p></def></def-item><def-item><term id="abb11">NF</term><def><p>navigation frequency</p></def></def-item><def-item><term id="abb12">RR</term><def><p>retry rate</p></def></def-item><def-item><term id="abb13">SpO&#x2082;</term><def><p>peripheral oxygen saturation</p></def></def-item><def-item><term id="abb14">SUS</term><def><p>System Usability Scale</p></def></def-item><def-item><term id="abb15">TAR</term><def><p>task abandonment rate</p></def></def-item><def-item><term id="abb16">TC</term><def><p>task completion</p></def></def-item><def-item><term id="abb17">ToT</term><def><p>time on task</p></def></def-item><def-item><term id="abb18">UES</term><def><p>user engagement score</p></def></def-item><def-item><term id="abb19">UMUX</term><def><p>usability metric for user experience</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation 
citation-type="web"><article-title>Promoting health and well-being of older persons: WHO&#x2019;s support to ASEAN member states</article-title><source>World Health Organization</source><year>2025</year><access-date>2026-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/thailand/news/detail/25-02-2025-promoting-health-and-well-being-of-older-persons--who-s-support-to-asean-member-states">https://www.who.int/thailand/news/detail/25-02-2025-promoting-health-and-well-being-of-older-persons--who-s-support-to-asean-member-states</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hong</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>L</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>G</given-names> </name><name name-style="western"><surname>Guan</surname><given-names>B</given-names> </name><name name-style="western"><surname>Li</surname><given-names>C</given-names> </name><name name-style="western"><surname>Luo</surname><given-names>Y</given-names> </name></person-group><article-title>Response of global health towards the challenges presented by population aging</article-title><source>China CDC Wkly</source><year>2023</year><month>09</month><day>29</day><volume>5</volume><issue>39</issue><fpage>884</fpage><lpage>887</lpage><pub-id pub-id-type="doi">10.46234/ccdcw2023.168</pub-id><pub-id pub-id-type="medline">37814614</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khan</surname><given-names>HTA</given-names> </name><name name-style="western"><surname>Addo</surname><given-names>KM</given-names> </name><name name-style="western"><surname>Findlay</surname><given-names>H</given-names> 
</name></person-group><article-title>Public health challenges and responses to the growing ageing populations</article-title><source>Public Health Chall</source><year>2024</year><month>09</month><volume>3</volume><issue>3</issue><fpage>e213</fpage><pub-id pub-id-type="doi">10.1002/puh2.213</pub-id><pub-id pub-id-type="medline">40496520</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Katsoulakis</surname><given-names>E</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Digital twins for health: a scoping review</article-title><source>NPJ Digit Med</source><year>2024</year><month>03</month><day>22</day><volume>7</volume><issue>1</issue><fpage>77</fpage><pub-id pub-id-type="doi">10.1038/s41746-024-01073-0</pub-id><pub-id pub-id-type="medline">38519626</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Magwa</surname><given-names>P</given-names> </name></person-group><article-title>Leveraging digital twins for personalized medicine: A framework for predictive therapeutics</article-title><source>Clin Pharmacol Biopharm</source><year>2024</year><access-date>2026-05-25</access-date><volume>13</volume><issue>12</issue><comment><ext-link ext-link-type="uri" xlink:href="https://www.omicsonline.org/open-access-pdfs/leveraging-digital-twins-for-personalized-medicine-a-framework-for-predictive-therapeutics.pdf">https://www.omicsonline.org/open-access-pdfs/leveraging-digital-twins-for-personalized-medicine-a-framework-for-predictive-therapeutics.pdf</ext-link></comment><pub-id pub-id-type="doi">10.4172/2167-065X.1000527</pub-id></nlm-citation></ref><ref 
id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vall&#x00E9;e</surname><given-names>A</given-names> </name></person-group><article-title>Digital twin for healthcare systems</article-title><source>Front Digit Health</source><year>2023</year><volume>5</volume><fpage>1253050</fpage><pub-id pub-id-type="doi">10.3389/fdgth.2023.1253050</pub-id><pub-id pub-id-type="medline">37744683</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Leung</surname><given-names>JC</given-names> </name><name name-style="western"><surname>Chen</surname><given-names>M</given-names> </name><name name-style="western"><surname>Qiu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>BTH</given-names> </name><name name-style="western"><surname>Zeng</surname><given-names>Z</given-names> </name><etal/></person-group><article-title>An intelligent and privacy-preserving digital twin model for aging-in-place</article-title><comment>Preprint posted online on Apr 4, 2025</comment><pub-id pub-id-type="doi">10.48550/arXiv.2504.03798</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Qian</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhou</surname><given-names>H</given-names> </name></person-group><article-title>Application and research of digital twin technology in safety and health monitoring of the elderly in community</article-title><source>Zhongguo Yi Liao Qi Xie Za 
Zhi</source><year>2019</year><month>11</month><day>30</day><volume>43</volume><issue>6</issue><fpage>410</fpage><lpage>413</lpage><pub-id pub-id-type="doi">10.3969/j.issn.1671-7104.2019.06.005</pub-id><pub-id pub-id-type="medline">31854524</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Harding</surname><given-names>AJE</given-names> </name><name name-style="western"><surname>Doherty</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bavelaar</surname><given-names>L</given-names> </name><etal/></person-group><article-title>A family carer decision support intervention for people with advanced dementia residing in a nursing home: a study protocol for an international advance care planning intervention (mySupport study)</article-title><source>BMC Geriatr</source><year>2022</year><month>10</month><day>26</day><volume>22</volume><issue>1</issue><fpage>822</fpage><pub-id pub-id-type="doi">10.1186/s12877-022-03533-2</pub-id><pub-id pub-id-type="medline">36289458</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Magnusson</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Shwayder</surname><given-names>I</given-names> </name><name name-style="western"><surname>Murphy</surname><given-names>NJ</given-names> </name><name name-style="western"><surname>Ollerenshaw</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ebendick</surname><given-names>M</given-names> </name><name name-style="western"><surname>Auer-Bennett</surname><given-names>E</given-names> </name></person-group><article-title>Creation of a community-driven decision support tool for caregivers of children with developmental concerns</article-title><source>Am J Speech Lang 
Pathol</source><year>2022</year><month>05</month><day>10</day><volume>31</volume><issue>3</issue><fpage>1084</fpage><lpage>1094</lpage><pub-id pub-id-type="doi">10.1044/2021_AJSLP-21-00072</pub-id><pub-id pub-id-type="medline">34731583</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alwashmi</surname><given-names>MF</given-names> </name><name name-style="western"><surname>Hawboldt</surname><given-names>J</given-names> </name><name name-style="western"><surname>Davis</surname><given-names>E</given-names> </name><name name-style="western"><surname>Fetters</surname><given-names>MD</given-names> </name></person-group><article-title>The iterative convergent design for mobile health usability testing: mixed methods approach</article-title><source>JMIR Mhealth Uhealth</source><year>2019</year><month>04</month><day>26</day><volume>7</volume><issue>4</issue><fpage>e11656</fpage><pub-id pub-id-type="doi">10.2196/11656</pub-id><pub-id pub-id-type="medline">31025951</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ghorayeb</surname><given-names>A</given-names> </name><name name-style="western"><surname>Darbyshire</surname><given-names>JL</given-names> </name><name name-style="western"><surname>Wronikowska</surname><given-names>MW</given-names> </name><name name-style="western"><surname>Watkinson</surname><given-names>PJ</given-names> </name></person-group><article-title>Design and validation of a new Healthcare Systems Usability Scale (HSUS) for clinical decision support systems: a mixed-methods approach</article-title><source>BMJ Open</source><year>2023</year><month>01</month><day>30</day><volume>13</volume><issue>1</issue><fpage>e065323</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2022-065323</pub-id><pub-id 
pub-id-type="medline">36717136</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cornet</surname><given-names>VP</given-names> </name><name name-style="western"><surname>Daley</surname><given-names>CN</given-names> </name><name name-style="western"><surname>Srinivas</surname><given-names>P</given-names> </name><name name-style="western"><surname>Holden</surname><given-names>RJ</given-names> </name></person-group><article-title>User-centered evaluations with older adults: testing the usability of a mobile health system for heart failure self-management</article-title><source>Proc Hum Factors Ergon Soc Annu Meet</source><year>2017</year><month>09</month><volume>61</volume><issue>1</issue><fpage>6</fpage><lpage>10</lpage><pub-id pub-id-type="doi">10.1177/1541931213601497</pub-id><pub-id pub-id-type="medline">30930610</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Cossu-Ergecer</surname><given-names>F</given-names> </name><name name-style="western"><surname>Dekker</surname><given-names>M</given-names> </name><name name-style="western"><surname>van Beijnum</surname><given-names>BJF</given-names> </name><name name-style="western"><surname>Tabak</surname><given-names>M</given-names> </name></person-group><article-title>Usability of a new eHealth monitoring technology that reflects health care needs for older adults with cognitive impairments and their informal and formal caregivers</article-title><conf-name>11th International Conference on Health Informatics</conf-name><conf-date>Jan 19-21, 2018</conf-date><conf-loc>Funchal, Madeira, Portugal</conf-loc><fpage>197</fpage><lpage>207</lpage><pub-id pub-id-type="doi">10.5220/0006639301970207</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Thalmann</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ringli</surname><given-names>L</given-names> </name><name name-style="western"><surname>Adcock</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Usability study of a multicomponent exergame training for older adults with mobility limitations</article-title><source>Int J Environ Res Public Health</source><year>2021</year><month>12</month><day>20</day><volume>18</volume><issue>24</issue><fpage>13422</fpage><pub-id pub-id-type="doi">10.3390/ijerph182413422</pub-id><pub-id pub-id-type="medline">34949028</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hochwarter</surname><given-names>S</given-names> </name><name name-style="western"><surname>Gutheil</surname><given-names>J</given-names> </name><name name-style="western"><surname>Stampfer</surname><given-names>P</given-names> </name><name name-style="western"><surname>Truskaller</surname><given-names>T</given-names> </name><name name-style="western"><surname>Deutsch</surname><given-names>M</given-names> </name><name name-style="western"><surname>Feichtner</surname><given-names>F</given-names> </name></person-group><article-title>One system, many professions: a System Usability Scale evaluation of a multi-professional therapy and monitoring system</article-title><source>Stud Health Technol Inform</source><year>2025</year><month>05</month><day>15</day><volume>327</volume><fpage>308</fpage><lpage>312</lpage><pub-id pub-id-type="doi">10.3233/SHTI250334</pub-id><pub-id pub-id-type="medline">40380445</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Zhong</surname><given-names>R</given-names> </name><name name-style="western"><surname>Rau</surname><given-names>PLP</given-names> </name></person-group><article-title>A mobile phone-based gait assessment app for the elderly: development and evaluation</article-title><source>JMIR Mhealth Uhealth</source><year>2020</year><month>02</month><day>29</day><volume>8</volume><issue>2</issue><fpage>e14453</fpage><pub-id pub-id-type="doi">10.2196/14453</pub-id><pub-id pub-id-type="medline">32452821</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Momand</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Mongkolnam</surname><given-names>P</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>JH</given-names> </name><name name-style="western"><surname>Charoenkitkarn</surname><given-names>N</given-names> </name><name name-style="western"><surname>Pal</surname><given-names>D</given-names> </name></person-group><article-title>Building digital twins for elderly care: an end-to-end framework from data acquisition to modeling</article-title><source>IEEE Access</source><year>2025</year><volume>13</volume><fpage>169415</fpage><lpage>169445</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2025.3607603</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bangor</surname><given-names>A</given-names> </name><name name-style="western"><surname>Kortum</surname><given-names>PT</given-names> </name><name name-style="western"><surname>Miller</surname><given-names>JT</given-names> </name></person-group><article-title>An empirical evaluation of the System Usability Scale</article-title><source>Int J Hum Comput 
Interact</source><year>2008</year><month>07</month><day>29</day><volume>24</volume><issue>6</issue><fpage>574</fpage><lpage>594</lpage><pub-id pub-id-type="doi">10.1080/10447310802205776</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Deshmukh</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Chalmeta</surname><given-names>R</given-names> </name></person-group><article-title>Validation of system usability scale as a usability metric to evaluate voice user interfaces</article-title><source>PeerJ Comput Sci</source><year>2024</year><volume>10</volume><fpage>e1918</fpage><pub-id pub-id-type="doi">10.7717/peerj-cs.1918</pub-id><pub-id pub-id-type="medline">38435614</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Khan</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Hickie</surname><given-names>IB</given-names> </name><name name-style="western"><surname>Loblay</surname><given-names>V</given-names> </name><etal/></person-group><article-title>Psychometric evaluation of the System Usability Scale in the context of a childrearing app co-designed for low- and middle-income countries</article-title><source>Digit Health</source><year>2025</year><month>05</month><volume>11</volume><fpage>20552076251335413</fpage><pub-id pub-id-type="doi">10.1177/20552076251335413</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lewis</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Sauro</surname><given-names>J</given-names> </name></person-group><article-title>Item benchmarks for the System Usability 
Scale</article-title><source>J Usability Stud</source><year>2018</year><access-date>2026-05-25</access-date><volume>13</volume><issue>3</issue><fpage>158</fpage><lpage>167</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/abs/10.5555/3294033.3294037">https://dl.acm.org/doi/abs/10.5555/3294033.3294037</ext-link></comment></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lewis</surname><given-names>JR</given-names> </name></person-group><article-title>Measuring perceived usability: the CSUQ, SUS, and UMUX</article-title><source>Int J Hum Comput Interact</source><year>2018</year><month>12</month><day>2</day><volume>34</volume><issue>12</issue><fpage>1148</fpage><lpage>1156</lpage><pub-id pub-id-type="doi">10.1080/10447318.2017.1418805</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Laubheimer</surname><given-names>P</given-names> </name></person-group><article-title>Beyond the NPS: measuring perceived usability with the SUS, NASA-TLX, and the single ease question after tasks and usability tests</article-title><source>Nielsen Norman Group</source><year>2018</year><access-date>2026-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nngroup.com/articles/measuring-perceived-usability">https://www.nngroup.com/articles/measuring-perceived-usability</ext-link></comment></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Takahashi</surname><given-names>L</given-names> </name><name name-style="western"><surname>Nebe</surname><given-names>K</given-names> </name></person-group><article-title>Observed differences between lab and online tests using the AttrakDiff 
Semantic Differential Scale</article-title><source>J Usability Stud</source><year>2019</year><access-date>2026-05-25</access-date><volume>14</volume><issue>2</issue><fpage>65</fpage><lpage>75</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://dl.acm.org/doi/abs/10.5555/3532689.3532691">https://dl.acm.org/doi/abs/10.5555/3532689.3532691</ext-link></comment></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Robertson</surname><given-names>IW</given-names> </name></person-group><source>Subjective Usability Evaluation: A Comparison of Four Methods</source><year>2018</year><access-date>2026-05-25</access-date><publisher-name>Rice University</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://hdl.handle.net/1911/105826">https://hdl.handle.net/1911/105826</ext-link></comment></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Sauro</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kindlund</surname><given-names>E</given-names> </name></person-group><person-group person-group-type="editor"><name name-style="western"><surname>Sauro</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kindlund</surname><given-names>E</given-names> </name></person-group><article-title>A method to standardize usability metrics into a single score</article-title><conf-name>CHI &#x2019;05: Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</conf-name><conf-date>Apr 2-7, 2005</conf-date><pub-id pub-id-type="doi">10.1145/1054972.1055028</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Latkin</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Edwards</surname><given-names>C</given-names> </name><name name-style="western"><surname>Davey-Rothwell</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Tobin</surname><given-names>KE</given-names> </name></person-group><article-title>The relationship between social desirability bias and self-reports of health, substance use, and social network factors among urban substance users in Baltimore, Maryland</article-title><source>Addict Behav</source><year>2017</year><month>10</month><volume>73</volume><fpage>133</fpage><lpage>136</lpage><pub-id pub-id-type="doi">10.1016/j.addbeh.2017.05.005</pub-id><pub-id pub-id-type="medline">28511097</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Strba</surname><given-names>M</given-names> </name></person-group><article-title>Usability testing metrics</article-title><source>UXtweak</source><year>2024</year><access-date>2026-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.uxtweak.com/usability-testing/metrics">https://www.uxtweak.com/usability-testing/metrics</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Hariyanti</surname><given-names>NKD</given-names> </name><name name-style="western"><surname>Sudhana</surname><given-names>IFP</given-names> </name><name name-style="western"><surname>Sanjaya</surname><given-names>IGN</given-names> </name><name name-style="western"><surname>Elfarosa</surname><given-names>KV</given-names> </name></person-group><article-title>Implementation of usability testing in measuring the effectiveness and efficiency of mobile 
application</article-title><conf-name>Proceedings of the 5th International Conference on Applied Science and Technology on Engineering Science (iCAST-ES 2022)</conf-name><conf-date>Oct 21-23, 2022</conf-date><pub-id pub-id-type="doi">10.5220/0011892900003575</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Nielsen</surname><given-names>J</given-names> </name><name name-style="western"><surname>Budiu</surname><given-names>R</given-names> </name></person-group><article-title>Success rate: the simplest usability metric</article-title><source>Nielsen Norman Group</source><year>2021</year><access-date>2026-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.nngroup.com/articles/success-rate-the-simplest-usability-metric">https://www.nngroup.com/articles/success-rate-the-simplest-usability-metric</ext-link></comment></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Zhang</surname><given-names>X</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>S</given-names> </name><name name-style="western"><surname>Wilson</surname><given-names>C</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>H</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>BY</given-names> </name></person-group><article-title>Clickstream User Behavior Models</article-title><source>ACM Trans Web</source><year>2017</year><month>11</month><day>30</day><volume>11</volume><issue>4</issue><fpage>1</fpage><lpage>37</lpage><pub-id pub-id-type="doi">10.1145/3068332</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation 
citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Gerken</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bak</surname><given-names>P</given-names> </name><name name-style="western"><surname>Jetter</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Klinkhammer</surname><given-names>D</given-names> </name><name name-style="western"><surname>Reiterer</surname><given-names>H</given-names> </name></person-group><article-title>How to use interaction logs effectively for usability evaluation</article-title><year>2008</year><access-date>2025-08-25</access-date><conf-name>CHI 2008 Workshop BELIV &#x2019;08: Beyond time and errors&#x2014;novel evaluation methods for information visualization</conf-name><conf-date>Apr 2008</conf-date><comment><ext-link ext-link-type="uri" xlink:href="http://nbn-resolving.de/urn:nbn:de:bsz:352-opus-52435">http://nbn-resolving.de/urn:nbn:de:bsz:352-opus-52435</ext-link></comment></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Dumais</surname><given-names>S</given-names> </name><name name-style="western"><surname>Jeffries</surname><given-names>R</given-names> </name><name name-style="western"><surname>Russell</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Tang</surname><given-names>D</given-names> </name><name name-style="western"><surname>Teevan</surname><given-names>J</given-names> </name></person-group><article-title>Understanding user behavior through log data and analysis</article-title><source>Ways of Knowing in HCI</source><year>2014</year><publisher-name>Springer Science &#x0026; Business</publisher-name><pub-id pub-id-type="doi">10.1007/978-1-4939-0378-8_14</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Roberts</surname><given-names>MJ</given-names> </name></person-group><article-title>Objective and subjective methods for evaluating the usability of schematic maps: the case against informal expert assessments</article-title><source>Cartogr J</source><year>2023</year><month>10</month><day>2</day><volume>60</volume><issue>4</issue><fpage>308</fpage><lpage>325</lpage><pub-id pub-id-type="doi">10.1080/00087041.2023.2246742</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gao</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kortum</surname><given-names>P</given-names> </name></person-group><article-title>The relationship between subjective and objective usability metrics for home healthcare devices</article-title><source>Proc Hum Factors Ergon Soc Annu Meet</source><year>2015</year><month>09</month><volume>59</volume><issue>1</issue><fpage>1001</fpage><lpage>1005</lpage><pub-id pub-id-type="doi">10.1177/1541931215591286</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mann</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Chokshi</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Kushniruk</surname><given-names>A</given-names> </name></person-group><article-title>Bridging the gap between academic research and pragmatic needs in usability: a hybrid approach to usability evaluation of health care information systems</article-title><source>JMIR Hum Factors</source><year>2018</year><month>11</month><day>28</day><volume>5</volume><issue>4</issue><fpage>e10721</fpage><pub-id pub-id-type="doi">10.2196/10721</pub-id><pub-id 
pub-id-type="medline">30487119</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Callejo</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mac&#x00ED;as</surname><given-names>JA</given-names> </name></person-group><article-title>Enhancing tree testing analysis to improve the usability evaluation of websites</article-title><source>Behav Inf Technol</source><year>2026</year><month>04</month><day>3</day><volume>45</volume><issue>6</issue><fpage>1117</fpage><lpage>1135</lpage><pub-id pub-id-type="doi">10.1080/0144929X.2025.2546971</pub-id></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Feehan</surname><given-names>LM</given-names> </name><name name-style="western"><surname>Geldman</surname><given-names>J</given-names> </name><name name-style="western"><surname>Sayre</surname><given-names>EC</given-names> </name><etal/></person-group><article-title>Accuracy of Fitbit devices: systematic review and narrative syntheses of quantitative data</article-title><source>JMIR Mhealth Uhealth</source><year>2018</year><month>08</month><day>9</day><volume>6</volume><issue>8</issue><fpage>e10527</fpage><pub-id pub-id-type="doi">10.2196/10527</pub-id><pub-id pub-id-type="medline">30093371</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Haghayegh</surname><given-names>S</given-names> </name><name name-style="western"><surname>Khoshnevis</surname><given-names>S</given-names> </name><name name-style="western"><surname>Smolensky</surname><given-names>MH</given-names> </name><name name-style="western"><surname>Diller</surname><given-names>KR</given-names> </name><name 
name-style="western"><surname>Castriotta</surname><given-names>RJ</given-names> </name></person-group><article-title>Accuracy of wristband Fitbit models in assessing sleep: systematic review and meta-analysis</article-title><source>J Med Internet Res</source><year>2019</year><month>11</month><day>28</day><volume>21</volume><issue>11</issue><fpage>e16273</fpage><pub-id pub-id-type="doi">10.2196/16273</pub-id><pub-id pub-id-type="medline">31778122</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lee</surname><given-names>T</given-names> </name><name name-style="western"><surname>Cho</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Cha</surname><given-names>KS</given-names> </name><etal/></person-group><article-title>Accuracy of 11 wearable, nearable, and airable consumer sleep trackers: prospective multicenter validation study</article-title><source>JMIR Mhealth Uhealth</source><year>2023</year><month>11</month><day>2</day><volume>11</volume><issue>1</issue><fpage>e50983</fpage><pub-id pub-id-type="doi">10.2196/50983</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hermans</surname><given-names>F</given-names> </name><name name-style="western"><surname>Arents</surname><given-names>E</given-names> </name><name name-style="western"><surname>Blondeel</surname><given-names>A</given-names> </name><etal/></person-group><article-title>Validity of a consumer-based wearable to measure clinical parameters in patients with chronic obstructive pulmonary disease and healthy controls: observational study</article-title><source>JMIR Mhealth Uhealth</source><year>2024</year><month>11</month><day>6</day><volume>12</volume><issue>1</issue><fpage>e56027</fpage><pub-id 
pub-id-type="doi">10.2196/56027</pub-id></nlm-citation></ref><ref id="ref43"><label>43</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Caunca</surname><given-names>MR</given-names> </name><name name-style="western"><surname>Simonetto</surname><given-names>M</given-names> </name><name name-style="western"><surname>Hartley</surname><given-names>G</given-names> </name><name name-style="western"><surname>Wright</surname><given-names>CB</given-names> </name><name name-style="western"><surname>Czaja</surname><given-names>SJ</given-names> </name></person-group><article-title>Design and usability testing of the stroke caregiver support system: a mobile-friendly website to reduce stroke caregiver burden</article-title><source>Rehabil Nurs</source><year>2020</year><volume>45</volume><issue>3</issue><fpage>166</fpage><lpage>177</lpage><pub-id pub-id-type="doi">10.1097/RNJ.0000000000000196</pub-id><pub-id pub-id-type="medline">30418319</pub-id></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Abbate</surname><given-names>S</given-names> </name><name name-style="western"><surname>Avvenuti</surname><given-names>M</given-names> </name><name name-style="western"><surname>Light</surname><given-names>J</given-names> </name></person-group><article-title>Usability study of a wireless monitoring system among Alzheimer&#x2019;s disease elderly population</article-title><source>Int J Telemed Appl</source><year>2014</year><volume>2014</volume><fpage>617495</fpage><pub-id pub-id-type="doi">10.1155/2014/617495</pub-id><pub-id pub-id-type="medline">24963289</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Lehmann</surname><given-names>J</given-names> </name><name 
name-style="western"><surname>Schreyer</surname><given-names>I</given-names> </name><name name-style="western"><surname>Riedl</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Usability evaluation of the Computer-Based Health Evaluation System (CHES) eDiary for patients with faecal incontinence: a pilot study</article-title><source>BMC Med Inform Decis Mak</source><year>2022</year><month>03</month><day>28</day><volume>22</volume><issue>1</issue><fpage>81</fpage><pub-id pub-id-type="doi">10.1186/s12911-022-01818-5</pub-id><pub-id pub-id-type="medline">35346170</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Panagopoulos</surname><given-names>C</given-names> </name><name name-style="western"><surname>Menychtas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tsanakas</surname><given-names>P</given-names> </name><name name-style="western"><surname>Maglogiannis</surname><given-names>I</given-names> </name></person-group><article-title>Increasing usability of homecare applications for older adults: a case study</article-title><source>Designs</source><year>2019</year><volume>3</volume><issue>2</issue><fpage>23</fpage><pub-id pub-id-type="doi">10.3390/designs3020023</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>&#x00D8;stervang</surname><given-names>C</given-names> </name><name name-style="western"><surname>Jensen</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Coyne</surname><given-names>E</given-names> </name><name name-style="western"><surname>Dieperink</surname><given-names>KB</given-names> </name><name name-style="western"><surname>Lassen</surname><given-names>A</given-names> 
</name></person-group><article-title>Usability and evaluation of a health information system in the emergency department: mixed methods study</article-title><source>JMIR Hum Factors</source><year>2024</year><month>02</month><day>21</day><volume>11</volume><fpage>e48445</fpage><pub-id pub-id-type="doi">10.2196/48445</pub-id><pub-id pub-id-type="medline">38381502</pub-id></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Paulissen</surname><given-names>JMJ</given-names> </name><name name-style="western"><surname>Zegers</surname><given-names>CML</given-names> </name><name name-style="western"><surname>Nijsten</surname><given-names>IR</given-names> </name><etal/></person-group><article-title>Performance and usability evaluation of a mobile health data capture application in clinical cancer trials follow-up</article-title><source>Tech Innov Patient Support Radiat Oncol</source><year>2022</year><month>12</month><volume>24</volume><fpage>107</fpage><lpage>112</lpage><pub-id pub-id-type="doi">10.1016/j.tipsro.2022.10.005</pub-id><pub-id pub-id-type="medline">36387779</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Borsci</surname><given-names>S</given-names> </name><name name-style="western"><surname>Federici</surname><given-names>S</given-names> </name><name name-style="western"><surname>Lauriola</surname><given-names>M</given-names> </name></person-group><article-title>On the dimensionality of the System Usability Scale: a test of alternative measurement models</article-title><source>Cogn Process</source><year>2009</year><month>08</month><volume>10</volume><issue>3</issue><fpage>193</fpage><lpage>197</lpage><pub-id pub-id-type="doi">10.1007/s10339-009-0268-9</pub-id><pub-id 
pub-id-type="medline">19565283</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lewis</surname><given-names>JR</given-names> </name><name name-style="western"><surname>Sauro</surname><given-names>J</given-names> </name></person-group><article-title>The factor structure of the System Usability Scale</article-title><year>2009</year><conf-name>Proceedings of the 1st International Conference on Human Centered Design: Held as Part of HCI International 2009</conf-name><conf-date>Jul 19-24, 2009</conf-date><conf-loc>San Diego, California, United States</conf-loc><publisher-name>Springer</publisher-name><pub-id pub-id-type="doi">10.1007/978-3-642-02806-9_12</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Tan</surname><given-names>H</given-names> </name><name name-style="western"><surname>Cao</surname><given-names>G</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>Y</given-names> </name></person-group><article-title>Enhancing user engagement through adaptive UI/UX design: A study on personalized mobile app interfaces</article-title><source>World J Innov Mod Technol</source><year>2024</year><volume>7</volume><issue>5</issue><fpage>1</fpage><lpage>21</lpage><pub-id pub-id-type="doi">10.53469/wjimt.2024.07(05).01</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Wibawa</surname><given-names>AP</given-names> </name><name name-style="western"><surname>Manik</surname><given-names>LP</given-names> </name><name name-style="western"><surname>Pranolo</surname><given-names>A</given-names> 
</name><name name-style="western"><surname>Drezewski</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hernandez</surname><given-names>L</given-names> </name><name name-style="western"><surname>Ismail</surname><given-names>AR</given-names> </name><etal/></person-group><article-title>Exploring usage-based and usability metrics for user experience for sustainable e-learning systems</article-title><year>2024</year><conf-name>International Conference on Computer Science, Electronics, and Information (ICCSEI 2023)</conf-name><conf-date>Mar 17-19, 2023</conf-date><pub-id pub-id-type="doi">10.1051/e3sconf/202450102003</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Trukenbrod</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Backhaus</surname><given-names>N</given-names> </name><name name-style="western"><surname>Thomaschke</surname><given-names>R</given-names> </name></person-group><article-title>Measuring subjectively experienced time in usability and user experience testing scenarios</article-title><source>Int J Hum Comput Stud</source><year>2020</year><month>06</month><volume>138</volume><fpage>102399</fpage><pub-id pub-id-type="doi">10.1016/j.ijhcs.2020.102399</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yang</surname><given-names>J</given-names> </name><name name-style="western"><surname>Abraham</surname><given-names>A</given-names> </name></person-group><article-title>Analyzing the features, usability, and performance of deploying a containerized mobile web application on serverless cloud platforms</article-title><source>Future Internet</source><year>2024</year><volume>16</volume><issue>12</issue><fpage>475</fpage><pub-id 
pub-id-type="doi">10.3390/fi16120475</pub-id></nlm-citation></ref><ref id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Debora</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kharisma</surname><given-names>NN</given-names> </name><name name-style="western"><surname>Rifaldi</surname><given-names>W</given-names> </name><name name-style="western"><surname>Nugraha</surname><given-names>U</given-names> </name></person-group><article-title>UI/UX transformation of XYZ retail information system through user-centered design approach</article-title><source>Jurnal Sistem Informasi dan Teknologi Informasi [J Inform Syst Inform Technol]</source><year>2024</year><volume>2</volume><issue>2</issue><pub-id pub-id-type="doi">10.33197/justinfo.v2i2.2539</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="thesis"><person-group person-group-type="author"><name name-style="western"><surname>Henriksson</surname><given-names>E</given-names> </name><name name-style="western"><surname>Lundstr&#x00F6;m</surname><given-names>M</given-names> </name></person-group><article-title>Navigation systems&#x2019; impact on usability in mobile applications: a study on mobile newspaper applications</article-title><year>2021</year><publisher-name>J&#x00F6;nk&#x00F6;ping University</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://urn.kb.se/resolve?urn=urn:nbn:se:hj:diva-53474">https://urn.kb.se/resolve?urn=urn:nbn:se:hj:diva-53474</ext-link></comment></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Weingarden</surname><given-names>H</given-names> </name><name name-style="western"><surname>Garriga Calleja</surname><given-names>R</given-names> </name><name 
name-style="western"><surname>Greenberg</surname><given-names>JL</given-names> </name><etal/></person-group><article-title>Characterizing observed and effective behavioral engagement with smartphone cognitive behavioral therapy for body dysmorphic disorder: a methods roadmap and use case</article-title><source>Internet Interv</source><year>2023</year><month>04</month><volume>32</volume><fpage>100615</fpage><pub-id pub-id-type="doi">10.1016/j.invent.2023.100615</pub-id><pub-id pub-id-type="medline">36969390</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Lalmas</surname><given-names>M</given-names> </name><name name-style="western"><surname>O&#x2019;Brien</surname><given-names>H</given-names> </name><name name-style="western"><surname>Yom-Tov</surname><given-names>E</given-names> </name></person-group><source>Measuring User Engagement</source><year>2022</year><publisher-name>Springer Nature</publisher-name><pub-id pub-id-type="other">3031022890</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bobko</surname><given-names>P</given-names> </name><name name-style="western"><surname>Roth</surname><given-names>PL</given-names> </name><name name-style="western"><surname>Buster</surname><given-names>MA</given-names> </name></person-group><article-title>The usefulness of unit weights in creating composite scores</article-title><source>Organ Res Methods</source><year>2007</year><month>10</month><volume>10</volume><issue>4</issue><fpage>689</fpage><lpage>709</lpage><pub-id pub-id-type="doi">10.1177/1094428106294734</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Wehbe</surname><given-names>C</given-names> </name><name name-style="western"><surname>Baroud</surname><given-names>H</given-names> </name></person-group><article-title>Limitations and considerations of using composite indicators to measure vulnerability to natural hazards</article-title><source>Sci Rep</source><year>2024</year><month>08</month><day>20</day><volume>14</volume><issue>1</issue><fpage>19333</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-68060-z</pub-id><pub-id pub-id-type="medline">39164315</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alabbas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Alomar</surname><given-names>K</given-names> </name></person-group><article-title>A weighted composite metric for evaluating user experience in educational chatbots: balancing usability, engagement, and effectiveness</article-title><source>Future Internet</source><year>2025</year><volume>17</volume><issue>2</issue><fpage>64</fpage><pub-id pub-id-type="doi">10.3390/fi17020064</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tavakol</surname><given-names>M</given-names> </name><name name-style="western"><surname>Dennick</surname><given-names>R</given-names> </name></person-group><article-title>Making sense of Cronbach&#x2019;s alpha</article-title><source>Int J Med Educ</source><year>2011</year><month>06</month><day>27</day><volume>2</volume><fpage>53</fpage><lpage>55</lpage><pub-id pub-id-type="doi">10.5116/ijme.4dfb.8dfd</pub-id><pub-id pub-id-type="medline">28029643</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Lewis</surname><given-names>JR</given-names> </name></person-group><article-title>The System Usability Scale: past, present, and future</article-title><source>Int J Hum Comput Interact</source><year>2018</year><month>07</month><day>3</day><volume>34</volume><issue>7</issue><fpage>577</fpage><lpage>590</lpage><pub-id pub-id-type="doi">10.1080/10447318.2018.1455307</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Hornb&#x00E6;k</surname><given-names>K</given-names> </name></person-group><article-title>Current practice in measuring usability: Challenges to usability studies and research</article-title><source>Int J Hum Comput Stud</source><year>2006</year><month>02</month><volume>64</volume><issue>2</issue><fpage>79</fpage><lpage>102</lpage><pub-id pub-id-type="doi">10.1016/j.ijhcs.2005.06.002</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Egorow</surname><given-names>O</given-names> </name><name name-style="western"><surname>Siegert</surname><given-names>I</given-names> </name><name name-style="western"><surname>Wendemuth</surname><given-names>A</given-names> </name></person-group><article-title>Prediction of user satisfaction in naturalistic human-computer interaction</article-title><source>Kognitive Systeme</source><year>2017</year><issue>1</issue><pub-id pub-id-type="doi">10.17185/duepublico/44534</pub-id></nlm-citation></ref><ref id="ref66"><label>66</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Fennell</surname><given-names>PG</given-names> </name><name name-style="western"><surname>Zuo</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Lerman</surname><given-names>K</given-names> </name></person-group><article-title>Predicting and explaining behavioral data with structured feature space decomposition</article-title><source>EPJ Data Sci</source><year>2019</year><month>12</month><volume>8</volume><issue>1</issue><pub-id pub-id-type="doi">10.1140/epjds/s13688-019-0201-0</pub-id></nlm-citation></ref><ref id="ref67"><label>67</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Alenazi</surname><given-names>SA</given-names> </name></person-group><article-title>Predictive modelling of omni-channel customer behavior using big data analytics for retail marketing</article-title><source>Int J Innov Res Sci Stud</source><year>2025</year><volume>8</volume><issue>5</issue><fpage>1350</fpage><lpage>1359</lpage><pub-id pub-id-type="doi">10.53894/ijirss.v8i5.9134</pub-id></nlm-citation></ref><ref id="ref68"><label>68</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Orn</surname><given-names>A</given-names> </name></person-group><article-title>Pros and cons of the system usability scale (SUS)</article-title><source>Research Collective</source><year>2017</year><access-date>2026-05-13</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://research-collective.com/pros-and-cons-of-the-system-usability-scale-sus">https://research-collective.com/pros-and-cons-of-the-system-usability-scale-sus</ext-link></comment></nlm-citation></ref><ref id="ref69"><label>69</label><nlm-citation citation-type="web"><person-group person-group-type="author"><name name-style="western"><surname>Momand</surname><given-names>Z</given-names> </name><name 
name-style="western"><surname>Mongkolnam</surname><given-names>P</given-names> </name><name name-style="western"><surname>Chan</surname><given-names>J</given-names> </name><name name-style="western"><surname>Charoenkitkarn</surname><given-names>N</given-names> </name><name name-style="western"><surname>Pal</surname><given-names>D</given-names> </name></person-group><article-title>Longitudinal wearable physiological dataset of elderly individuals</article-title><source>Zenodo</source><access-date>2026-05-25</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://zenodo.org/records/18745170">https://zenodo.org/records/18745170</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Screenshots of the elderly digital twin system functions, interfaces, and key caregiver-facing modules.</p><media xlink:href="aging_v9i1e91873_app1.pdf" xlink:title="PDF File, 1473 KB"/></supplementary-material></app-group></back></article>