<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Aging</journal-id><journal-id journal-id-type="publisher-id">aging</journal-id><journal-id journal-id-type="index">31</journal-id><journal-title>JMIR Aging</journal-title><abbrev-journal-title>JMIR Aging</abbrev-journal-title><issn pub-type="epub">2561-7605</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e77017</article-id><article-id pub-id-type="doi">10.2196/77017</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Machine Learning&#x2013;Derived Cardiovascular Aging Phenotypes From Cardiac Function and Stroke Risk in the UK Biobank: Cohort Study</article-title></title-group><contrib-group><contrib contrib-type="author"><name name-style="western"><surname>Yuan</surname><given-names>Kang</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Kong</surname><given-names>Deyan</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Zhong</surname><given-names>Jinghui</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Xie</surname><given-names>Mengdi</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Liu</surname><given-names>Rui</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Sun</surname><given-names>Wen</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Liu</surname><given-names>Xinfeng</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Neurology, Affiliated Jinling Hospital, Medical School of Nanjing University</institution><addr-line>305 Zhongshan East Road, Xuanwu District</addr-line><addr-line>Nanjing</addr-line><addr-line>Jiangsu Province</addr-line><country>China</country></aff><aff id="aff2"><institution>Department of Neurology, The Second Affiliated Hospital of Guangxi Medical University</institution><addr-line>Nanning</addr-line><addr-line>Guangxi</addr-line><country>China</country></aff><aff id="aff3"><institution>Department of Neurology, Centre for Leading Medicine and Advanced Technologies of IHM, The First Affiliated Hospital of USTC, Division of Life Sciences and Medicine, University of Science and Technology of China</institution><addr-line>Hefei</addr-line><addr-line>Anhui</addr-line><country>China</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Wang</surname><given-names>Jinjiao</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Yang</surname><given-names>Chao</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Dall&#x2019;Olio</surname><given-names>Lorenzo</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Xinfeng Liu, PhD, Department of Neurology, Affiliated Jinling Hospital, Medical School of Nanjing University, 305 Zhongshan East Road, Xuanwu District, Nanjing, Jiangsu Province, 210002, China, 86 2584801861, 86 2584805169; <email>xfliu2@vip.163.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>27</day><month>4</month><year>2026</year></pub-date><volume>9</volume><elocation-id>e77017</elocation-id><history><date date-type="received"><day>06</day><month>05</month><year>2025</year></date><date date-type="rev-recd"><day>09</day><month>03</month><year>2026</year></date><date date-type="accepted"><day>24</day><month>03</month><year>2026</year></date></history><copyright-statement>&#x00A9; Kang Yuan, Deyan Kong, Jinghui Zhong, Mengdi Xie, Rui Liu, Wen Sun, Xinfeng Liu. Originally published in JMIR Aging (<ext-link ext-link-type="uri" xlink:href="https://aging.jmir.org">https://aging.jmir.org</ext-link>), 27.4.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Aging, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://aging.jmir.org">https://aging.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://aging.jmir.org/2026/1/e77017"/><abstract><sec><title>Background</title><p>Cardiovascular magnetic resonance (CMR) is widely used across various cardiac conditions and systematically assesses cardiac anatomical structures and functional dynamics. Machine learning (ML) can accurately predict outcomes and understand the inherent features of clinical data.</p></sec><sec><title>Objective</title><p>This study aimed to derive CMR phenotypes related to cardiovascular aging, investigate the relationship between these phenotypes and stroke risk, and relearn these phenotypes using supervised ML.</p></sec><sec sec-type="methods"><title>Methods</title><p>We enrolled 36,467 participants without stroke and extracted CMR parameters from the UK Biobank, with follow-up data extending until September 30, 2023. Using the generative topographic mapping technique, we identified latent grid nodes among participants and then derived phenotypes through agglomerative hierarchical clustering. We used supervised ML models to predict cardiac function phenotypes and used Cox proportional hazards models to assess the association between these phenotypes and long-term stroke risk.</p></sec><sec sec-type="results"><title>Results</title><p>We enrolled 36,467 participants in the study. The mean age was 54.9 (SD 7.5) years, with 17,442 (47.8%) male participants. During a mean follow-up time of 14.7 (SD 1.1) years, 500 (1.4%) participants developed stroke and 664 (1.8%) participants died, respectively. After generative topographic mapping modeling, we identified 2 distinct phenotypes: phenotype 1, characterized by adverse cardiac function and an accumulation of cardiovascular risk factors, reflecting cardiovascular aging; and phenotype 2, associated with a lower risk of stroke (hazard ratio 0.695, 95% CI 0.559-0.864; <italic>P</italic>=.001), which remained significant after accounting for competing mortality (hazard ratio 0.578, 95% CI 0.484-0.691; <italic>P</italic>&#x003C;.001). We selected the random forest model as the optimal model for the phenotypes, demonstrating high accuracy (area under the curve 0.914, 95% CI 0.911-0.918 for training and 0.867, 95% CI 0.858-0.876 for validation) and calibration ability (Brier score 0.111, 95% CI 0.109-0.113 for training and 0.132, 95% CI 0.127-0.137 for validation).</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>By integrating unsupervised and supervised ML methods, we identified cardiovascular aging&#x2013;related phenotypes that demonstrate robust predictive ability for incident stroke, which may have the potential to improve preventive and therapeutic strategies for high-risk populations.</p></sec></abstract><kwd-group><kwd>stroke</kwd><kwd>generative topographic mapping</kwd><kwd>UK Biobank</kwd><kwd>machine learning</kwd><kwd>cardiac function</kwd><kwd>aging</kwd><kwd>phenotypes</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Stroke is a major cause of mortality and morbidity worldwide [<xref ref-type="bibr" rid="ref1">1</xref>]. Aging is associated with progressive structural and functional deterioration of the cardiovascular system [<xref ref-type="bibr" rid="ref2">2</xref>]. Several conditions associated with cardiovascular aging [<xref ref-type="bibr" rid="ref3">3</xref>,<xref ref-type="bibr" rid="ref4">4</xref>], including atrial fibrillation, heart failure, and myocardial infarction, are recognized as important risk factors for stroke [<xref ref-type="bibr" rid="ref5">5</xref>-<xref ref-type="bibr" rid="ref8">8</xref>]. Cardiovascular magnetic resonance (CMR) enables systematic assessment of cardiac structural and functional remodeling and has been reported to be associated with the aging process [<xref ref-type="bibr" rid="ref9">9</xref>]. Previous studies have shown that atrial mechanical dysfunction and left ventricular (LV) structural abnormalities assessed by CMR are associated with stroke events [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. However, CMR metrics are relatively complex, and extracting phenotypes from these metrics may provide insight into their relationship with cardiovascular aging and help clarify their association with stroke risk.</p><p>The application of artificial intelligence in clinical practice for disease prediction and detection has grown tremendously in recent years [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. Supervised machine learning (ML) can accurately predict clinical outcomes, while unsupervised ML can identify the inherent features of data without requiring labeled outcomes [<xref ref-type="bibr" rid="ref14">14</xref>]. Previous studies have used unsupervised ML models to delineate prognostically distinct clusters using variables related to LV diastolic function derived from transthoracic echocardiography [<xref ref-type="bibr" rid="ref15">15</xref>]. Additionally, the hierarchical k-means clustering algorithm has also been effective in distinguishing potential embolic source groups in cryptogenic stroke [<xref ref-type="bibr" rid="ref16">16</xref>]. Generative topographic mapping (GTM) is a probabilistic model used for dimensionality reduction and data visualization, exhibiting superiority over the self-organizing map algorithm by explicitly modeling probability distributions [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>]. GTM can reduce data dimensionality to a latent space and reveal the underlying structure with robustness across diverse sources [<xref ref-type="bibr" rid="ref19">19</xref>]. However, previous studies applying GTM to derive phenotypes have been limited, with applications reported in general and critical care populations [<xref ref-type="bibr" rid="ref20">20</xref>].</p><p>Therefore, the aim of this study was to use the GTM model to identify distinct cardiac function phenotypes related to cardiovascular aging, examine their association with long-term stroke risk, and develop supervised ML models to predict these phenotypes using data from a prospective longitudinal cohort.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Population</title><p>The UK Biobank is a large, population-based prospective cohort study comprising more than 500,000 participants aged 49 to 69 years, enrolled from 22 assessment centers in the United Kingdom between 2006 and 2010. Details of the UK Biobank protocols are accessible online [<xref ref-type="bibr" rid="ref21">21</xref>]. Participants diagnosed with stroke at baseline (n=7780, 1.5%), lacking follow-up information (n=20,251, 4%), or without CMR data (n=437,713, 87.2%) were excluded, resulting in a final cohort of 36,467 (7.3%) participants.</p><p>We included the following CMR measures in the study: LV stroke volume (LVSV), LV myocardial mass (LVMM), LV end-diastolic volume (LVEDV), LV end-systolic volume (LVESV), LV ejection fraction (LVEF), LV global longitudinal strain (LVGLS), left atrial (LA) maximum volume (LAMV), and LA ejection fraction (LAEF) (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><p>Stroke diagnosis was ascertained through linkage to self-reported medical conditions, hospital inpatient data, and death register records based on <italic>International Classification of Diseases</italic> codes, with the earliest recorded date of outcome provided in Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The follow-up time was defined as the interval from the date of recruitment to the occurrence of stroke, all-cause mortality, loss to follow-up, or September 30, 2023, whichever came first. Details of covariates were shown in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. This study was reported according to the transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD) guidelines (<xref ref-type="supplementary-material" rid="app2">Checklist 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Cardiovascular aging phenotypes and stroke. LA: left atrial; LV: left ventricular.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e77017_fig01.png"/></fig></sec><sec id="s2-2"><title>GTM Modeling and Phenotypes</title><p>Inspired by the algorithm introduced by Bellfield et al [<xref ref-type="bibr" rid="ref20">20</xref>], we used a Gaussian mixture model to train the GTM model and visualize the distribution of data in the latent space. GTM uses a soft assignment method to estimate the probability of each participant being assigned to a cluster. The high-dimensional data were then visualized in a 2D latent space. After preprocessing the dataset, we used the <italic>ugtm</italic> Python (Python Software Foundation) package for GTM modeling and applied 10-fold cross-validation with the expectation-maximization algorithm to optimize the parameters. After GTM modeling, the generated latent space illustrated the distribution of participants in each cluster, with darker colors indicating higher densities. The modeling parameters (cardiac function variables) demonstrated the impact of cardiac function on each latent grid node in the GTM model. We aggregated the latent grid nodes by calculating the Euclidean distances between their modeling parameters and applied agglomerative hierarchical clustering using the Ward minimum variance method to derive phenotypes [<xref ref-type="bibr" rid="ref22">22</xref>]. The characteristics of the phenotypes were compared to evaluate the distribution of risk factors for cardiovascular aging.</p></sec><sec id="s2-3"><title>Phenotypes and Stroke Risk</title><p>We used Cox proportional hazards models to evaluate the association between cardiac function phenotypes and long-term stroke risk, reporting results as hazard ratios (HRs) with 95% CIs. In multivariable analyses, model 1 was an unadjusted model; model 2 was adjusted for age at recruitment, sex, Townsend deprivation index at recruitment, smoking status, alcohol intake frequency, systolic blood pressure, diastolic blood pressure, and BMI; and model 3 was additionally adjusted for atrial fibrillation, type 2 diabetes, coronary heart disease, heart failure, antihypertensive drugs, and statins. In sensitivity analyses, we explored the association of cardiac function phenotypes with the risk of different stroke types. Additionally, we performed a competing risk analysis for stroke risk using the Fine and Gray method, accounting for mortality as the competing event.</p></sec><sec id="s2-4"><title>Supervised ML Frameworks</title><p>Following the categorization of participants into different phenotypes through the GTM approach, we deployed several supervised ML models to predict cardiac function phenotypes. Hyperparameters for each model are detailed in Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Hyperparameter optimization was conducted using grid search and Bayesian optimization. Discriminatory ability was evaluated using the receiver operating characteristic curve. Calibration performance was assessed using the calibration curve. We selected the best-performing method as the final algorithm for developing a phenotype prediction model. We constructed a website using the Flask framework and the DeepSeek-R1 API (application programming interface). The predicted probabilities and individualized metrics were sent to the DeepSeek-R1 model to generate a detailed analysis of health status and provide professional recommendations. Detailed descriptions of the methods are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-5"><title>Ethical Considerations</title><p>The ethical framework of the UK Biobank was approved by the North West Multi-centre Research Ethics Committee (11/NW/0382). All participants provided informed consent through electronic signature at enrollment.</p></sec><sec id="s2-6"><title>Statistical Analysis</title><p>Normally distributed continuous data are presented as mean (SD), and group comparisons were performed using 2-tailed <italic>t</italic> tests. Categorical data were presented as frequency (percentage), and group comparisons were conducted using chi-square tests. To account for multiple comparisons, <italic>P</italic> values were adjusted using the false discovery rate method. Statistical tests were conducted with R software (version 4.2.1; R Foundation for Statistical Computing), and a 2-sided <italic>P</italic> value &#x003C;.05 was considered statistically significant.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Study Population</title><p>The study design is shown in <xref ref-type="fig" rid="figure2">Figure 2</xref>. Of the 36,467 participants included in the study (<xref ref-type="fig" rid="figure2">Figure 2</xref>), the mean age was 54.9 (SD 7.5) years, with 17,442 (47.8%) male participants. In total, 14,373 (39.5%) of participants were current or former smokers, 8180 (22.4%) had daily or almost daily alcohol intake, 1047 (2.9%) had type 2 diabetes, 345 (0.9%) had atrial fibrillation, and 48 (0.1%) had heart failure at baseline. During a mean follow-up time of 14.7 (SD 1.1) years, 500 (1.4%) and 664 (1.8%) participants developed stroke and died, respectively (<xref ref-type="table" rid="table1">Table 1</xref>).</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Flowchart illustrating the study design. CMR: cardiovascular magnetic resonance.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e77017_fig02.png"/></fig><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Characteristics of the participants included in the study.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Characteristics</td><td align="left" valign="bottom">Total (n=36,467)</td><td align="left" valign="bottom">Phenotype 1 (n=10,749)</td><td align="left" valign="bottom">Phenotype 2 (n=25,718)</td><td align="left" valign="bottom">Chi square (<italic>df</italic>) or t test (<italic>df</italic>)</td><td align="left" valign="bottom"><italic>P</italic> value</td><td align="left" valign="bottom">Adjusted <italic>P</italic> value<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td></tr></thead><tbody><tr><td align="left" valign="top">Age (years), mean (SE)</td><td align="left" valign="top">54.9 (0.0)</td><td align="left" valign="top">54.4 (0.1)</td><td align="left" valign="top">55 (0.0)</td><td align="left" valign="top">&#x2212;6.74 (19,563.5)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Male, n (%)</td><td align="left" valign="top">17,442 (47.8)</td><td align="left" valign="top">9333 (86.8)</td><td align="left" valign="top">8109 (31.5)</td><td align="left" valign="top">9287 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top" colspan="4">Ethnicity, n (%)</td><td align="left" valign="top">78.9 (4)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Asian</td><td align="left" valign="top">367 (1.0)</td><td align="left" valign="top">45 (0.4)</td><td align="left" valign="top">322 (1.3)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Black</td><td align="left" valign="top">219 (0.6)</td><td align="left" valign="top">76 (0.7)</td><td align="left" valign="top">143 (0.6)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Chinese</td><td align="left" valign="top">102 (0.3)</td><td align="left" valign="top">9 (0.1)</td><td align="left" valign="top">93 (0.4)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Mixed</td><td align="left" valign="top">162 (0.4)</td><td align="left" valign="top">40 (0.4)</td><td align="left" valign="top">122 (0.5)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>White<sup><xref ref-type="table-fn" rid="table1fn4">d</xref></sup></td><td align="left" valign="top">35,342 (97.7)</td><td align="left" valign="top">10,503 (98.4)</td><td align="left" valign="top">24,839 (97.3)</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">Townsend deprivation index, mean (SE)</td><td align="left" valign="top">&#x2212;1.9 (0.0)</td><td align="left" valign="top">&#x2212;2 (0.0)</td><td align="left" valign="top">&#x2212;1.9 (0.0)</td><td align="left" valign="top">&#x2212;2.39 ( 20,325.8)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top">.02</td><td align="left" valign="top">.02</td></tr><tr><td align="left" valign="top" colspan="4">Overall health rating, n (%)</td><td align="left" valign="top">35.6 (3)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Poor</td><td align="left" valign="top">629 (1.7)</td><td align="left" valign="top">199 (1.9)</td><td align="left" valign="top">430 (1.7)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Fair</td><td align="left" valign="top">5123 (14.1)</td><td align="left" valign="top">1683 (15.7)</td><td align="left" valign="top">3440 (13.4)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Good</td><td align="left" valign="top">22,137 (60.8)</td><td align="left" valign="top">6359 (59.2)</td><td align="left" valign="top">15,778 (61.5)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Excellent</td><td align="left" valign="top">8503 (23.4)</td><td align="left" valign="top">2492 (23.2)</td><td align="left" valign="top">6011 (23.4)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top" colspan="4">Smoking status, n (%)</td><td align="left" valign="top">88.8 (2)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Current</td><td align="left" valign="top">2297 (6.3)</td><td align="left" valign="top">771 (7.2)</td><td align="left" valign="top">1526 (5.9)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Previous</td><td align="left" valign="top">12,076 (33.2)</td><td align="left" valign="top">3859 (36.0)</td><td align="left" valign="top">8217 (32.0)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Never</td><td align="left" valign="top">22,007 (60.5)</td><td align="left" valign="top">6089 (56.8)</td><td align="left" valign="top">15,918 (62.0)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top" colspan="4">Alcohol intake frequency, n (%)</td><td align="left" valign="top">415 (5)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Daily or almost daily</td><td align="left" valign="top">8180 (22.4)</td><td align="left" valign="top">2800 (26.1)</td><td align="left" valign="top">5380 (20.9)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;3 or 4 times a week</td><td align="left" valign="top">10,190 (28.0)</td><td align="left" valign="top">3339 (31.1)</td><td align="left" valign="top">6851 (26.7)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Once or twice a week</td><td align="left" valign="top">9389 (25.8)</td><td align="left" valign="top">2712 (25.2)</td><td align="left" valign="top">6677 (26.0)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;1-3 times a month</td><td align="left" valign="top">3963 (10.9)</td><td align="left" valign="top">946 (8.8)</td><td align="left" valign="top">3017 (11.7)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Special occasions only</td><td align="left" valign="top">2997 (8.2)</td><td align="left" valign="top">554 (5.2)</td><td align="left" valign="top">2443 (9.5)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Never</td><td align="left" valign="top">1728 (4.7)</td><td align="left" valign="top">393 (3.7)</td><td align="left" valign="top">1335 (5.2)</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top" colspan="7">Comorbidity, n (%)</td></tr><tr><td align="left" valign="top">&#x2003;Dementia</td><td align="left" valign="top">8 (0.0)</td><td align="left" valign="top">2 (0.0)</td><td align="left" valign="top">6 (0.0)</td><td align="left" valign="top">0.001 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">.99</td><td align="left" valign="top">.99</td></tr><tr><td align="left" valign="top">&#x2003;Major adverse cardiac events</td><td align="left" valign="top">857 (2.4)</td><td align="left" valign="top">432 (4.0)</td><td align="left" valign="top">425 (1.7)</td><td align="left" valign="top">184 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Type 2 diabetes</td><td align="left" valign="top">1047 (2.9)</td><td align="left" valign="top">368 (3.4)</td><td align="left" valign="top">679 (2.6)</td><td align="left" valign="top">16.4 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Liver disease</td><td align="left" valign="top">416 (1.1)</td><td align="left" valign="top">118 (1.1)</td><td align="left" valign="top">298 (1.2)</td><td align="left" valign="top">0.199 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">.66</td><td align="left" valign="top">.73</td></tr><tr><td align="left" valign="top">&#x2003;Renal disease</td><td align="left" valign="top">446 (1.2)</td><td align="left" valign="top">132 (1.2)</td><td align="left" valign="top">314 (1.2)</td><td align="left" valign="top">0.001 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">.99</td><td align="left" valign="top">.99</td></tr><tr><td align="left" valign="top">&#x2003;Atrial fibrillation</td><td align="left" valign="top">345 (0.9)</td><td align="left" valign="top">212 (2.0)</td><td align="left" valign="top">133 (0.5)</td><td align="left" valign="top">170 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Heart failure</td><td align="left" valign="top">48 (0.1)</td><td align="left" valign="top">35 (0.3)</td><td align="left" valign="top">13 (0.1)</td><td align="left" valign="top">41.6 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Coronary heart disease</td><td align="left" valign="top">1090 (3.0)</td><td align="left" valign="top">528 (4.9)</td><td align="left" valign="top">562 (2.2)</td><td align="left" valign="top">193 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Venous thrombosis</td><td align="left" valign="top">471 (1.3)</td><td align="left" valign="top">141 (1.3)</td><td align="left" valign="top">330 (1.3)</td><td align="left" valign="top">0.029 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">.87</td><td align="left" valign="top">.91</td></tr><tr><td align="left" valign="top">&#x2003;Abdominal aortic aneurysm</td><td align="left" valign="top">5 (0.0)</td><td align="left" valign="top">3 (0.0)</td><td align="left" valign="top">2 (0.0)</td><td align="left" valign="top">1.01 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">.31</td><td align="left" valign="top">.39</td></tr><tr><td align="left" valign="top">&#x2003;Peripheral arterial disease</td><td align="left" valign="top">255 (0.7)</td><td align="left" valign="top">68 (0.6)</td><td align="left" valign="top">187 (0.7)</td><td align="left" valign="top">0.844 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top">.36</td><td align="left" valign="top">.44</td></tr><tr><td align="left" valign="top" colspan="5">Cardiac function, mean (SE)<sup>c</sup></td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Left ventricular stroke volume (mL)</td><td align="left" valign="top">87.5 (0.1)</td><td align="left" valign="top">104 (0.2)</td><td align="left" valign="top">80.6 (0.1)</td><td align="left" valign="top">113 (15,816.1)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Left ventricular myocardial mass (g)</td><td align="left" valign="top">86.1 (0.1)</td><td align="left" valign="top">109.2 (0.2)</td><td align="left" valign="top">76.4 (0.1)</td><td align="left" valign="top">161 (17,230.0)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Left ventricular end-diastolic volume (mL)</td><td align="left" valign="top">147.9 (0.2)</td><td align="left" valign="top">184.7 (0.3)</td><td align="left" valign="top">132.5 (0.1)</td><td align="left" valign="top">171 (16,189.1)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Left ventricular end-systolic volume (mL)</td><td align="left" valign="top">60.5 (0.1)</td><td align="left" valign="top">80.7 (0.2)</td><td align="left" valign="top">52 (0.1)</td><td align="left" valign="top">149 (14,438.1)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Left ventricular ejection fraction (%)</td><td align="left" valign="top">59.5 (0.0)</td><td align="left" valign="top">56.3 (0.1)</td><td align="left" valign="top">60.9 (0.0)</td><td align="left" valign="top">&#x2212;64.2 (17,086.9)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Left ventricular longitudinal strain global (%)</td><td align="left" valign="top">&#x2212;18.5 (0.0)</td><td align="left" valign="top">&#x2212;17.3 (0.0)</td><td align="left" valign="top">&#x2212;19 (0.0)</td><td align="left" valign="top">55 (19,909.5)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Left atrial maximum volume (mL)</td><td align="left" valign="top">72.8 (0.1)</td><td align="left" valign="top">92.6 (0.2)</td><td align="left" valign="top">64.4 (0.1)</td><td align="left" valign="top">109 (15,314.3)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top">&#x2003;Left atrial ejection fraction (%)</td><td align="left" valign="top">61.2 (0)</td><td align="left" valign="top">56.5 (0.1)</td><td align="left" valign="top">63.1 (0.1)</td><td align="left" valign="top">&#x2212;59.8 (17,184.7)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top" colspan="5">Outcomes</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">&#x2003;</td></tr><tr><td align="left" valign="top">&#x2003;Follow-up time (y), mean (SE)</td><td align="left" valign="top">14.7 (0.0)</td><td align="left" valign="top">14.6 (0.0)</td><td align="left" valign="top">14.7 (0.0)</td><td align="left" valign="top">&#x2212;3.05 (19,080.5)<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top">.003</td></tr><tr><td align="left" valign="top">&#x2003;Stroke, n (%)</td><td align="left" valign="top">500 (1.4)</td><td align="left" valign="top">209 (1.9)</td><td align="left" valign="top">291 (1.1)</td><td align="left" valign="top">36.4 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">&#x2003;Mortality, n (%)</td><td align="left" valign="top">664 (1.8)</td><td align="left" valign="top">265 (2.5)</td><td align="left" valign="top">399 (1.6)</td><td align="left" valign="top">34.9 (1)<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup><italic>P</italic> values were adjusted by false discovery rate.</p></fn><fn id="table1fn2"><p><sup>b</sup><italic>t</italic> test.</p></fn><fn id="table1fn3"><p><sup>c</sup>Chi-square test.</p></fn><fn id="table1fn4"><p><sup>d</sup>Missing values for this row: n=275 missing for the Total column, n=76 missing for the Phenotype 1 column, and n=199 missing for the Phenotype 2 column.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>GTM Modeling and Cardiac Aging Phenotypes</title><p><xref ref-type="fig" rid="figure3">Figure 3</xref> illustrates the latent space generated by the GTM model. The number of participants in clusters is represented using the &#x201C;viridis&#x201D; color scheme and visualized as circles, where a deeper blue hue and larger circle diameter indicate a higher number of participants. LVSV, LVMM, LVEDV, LVESV, LVEF, LVGLS, LAMV, and LAEF are aligned point-to-point with their latent space in a light teal blue scheme. In the dendrogram plot, 2 cardiac function phenotypes are identified, clearly separating the dataset into 2 major branches at a relatively large linkage distance. Figure S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> illustrates that stroke diagnoses among participants were mainly distributed in the area of phenotype 1.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Derived phenotypes of cardiac function. (A) Latent space showing the distribution of participants; (B) latent space displaying the distribution of cardiac function markers derived from cardiovascular magnetic resonance; (C) dendrogram using Ward linkage and Euclidean distance to identify 2 cardiac function phenotypes; and (D) phenotypes and latent grid nodes of cardiac function. LA: left atrial; LV: left ventricular.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e77017_fig03.png"/></fig><p>To further characterize the phenotype patterns, we compared the distributions of investigatory variables and visualized them on the latent space with the light orange color scheme (Figures S2-S7 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Significant differences were observed between the 2 cardiac function phenotypes across demographic characteristics, cardiovascular risk factors, and cardiac function parameters. Participants in phenotype 1 exhibited larger cardiac chamber volumes and greater myocardial mass, with higher LVEF and LAEF but lower LVSV, LVMM, LVEDV, LVESV, LVGLS, and LAMV compared with phenotype 2 (all <italic>P</italic>&#x003C;.001). In addition, phenotype 1 demonstrated a higher burden of cardiovascular risk factors and comorbidities, including a greater prevalence of major adverse cardiac events, atrial fibrillation, heart failure, coronary heart disease, and type 2 diabetes (<italic>P</italic>&#x003C;.001). Participants in phenotype 1 also had higher blood pressure, arterial stiffness index, and more adverse metabolic profiles. Taken together, these structural, functional, and clinical differences suggest that phenotype 1 represents a cardiovascular aging&#x2013;related phenotype, characterized by cardiac remodeling, increased cardiovascular risk burden, and elevated incidence of stroke and mortality (<xref ref-type="table" rid="table1">Table 1</xref> and Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-3"><title>Phenotypes and Stroke Risk</title><p>Multivariable modeling identified that cardiovascular aging phenotypes were associated with the long-term risk of stroke and mortality. Compared with phenotype 1, phenotype 2 was significantly associated with a decreased risk of stroke in the unadjusted model (HR 0.579, 95% CI 0.484-0.691; <italic>P</italic>&#x003C;.001); model 2 (HR 0.671, 95% CI 0.541-0.833; <italic>P</italic>&#x003C;.001); and model 3 (HR 0.695, 95% CI 0.559-0.864; <italic>P</italic>=.001; <xref ref-type="table" rid="table2">Table 2</xref>).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Association between cardiovascular aging phenotypes and long-term risk of stroke and mortality.</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Outcome (phenotype 2 vs phenotype 1)</td><td align="left" valign="bottom" colspan="2">Stroke</td><td align="left" valign="bottom" colspan="3">Mortality</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="top">HR<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup> (95% CI)</td><td align="left" valign="top"><italic>P</italic> value</td><td align="left" valign="top">HR (95% CI)</td><td align="left" valign="top" colspan="2"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Model 1<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup></td><td align="left" valign="top">0.579 (0.484-0.691)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0.625 (0.535-0.730)</td><td align="left" valign="top" colspan="2">&#x003C;.001</td></tr><tr><td align="left" valign="top">Model 2<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top">0.671 (0.541-0.833)</td><td align="left" valign="top">&#x003C;.001</td><td align="left" valign="top">0.760 (0.632-0.913)</td><td align="left" valign="top" colspan="2">.003</td></tr><tr><td align="left" valign="top">Model 3<sup><xref ref-type="table-fn" rid="table2fn4">d</xref></sup></td><td align="left" valign="top">0.695 (0.559-0.864)</td><td align="left" valign="top">.001</td><td align="left" valign="top">0.772 (0.641-0.929)</td><td align="left" valign="top" colspan="2">.006</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>HR: hazard ratio.</p></fn><fn id="table2fn2"><p><sup>b</sup>Model 1 was unadjusted.</p></fn><fn id="table2fn3"><p><sup>c</sup>Model 2 was adjusted for age at recruitment, sex, Townsend deprivation index at recruitment, smoking status, alcohol intake frequency, systolic blood pressure, diastolic blood pressure, and BMI.</p></fn><fn id="table2fn4"><p><sup>d</sup>Model 3 was additionally adjusted for atrial fibrillation, type 2 diabetes, coronary heart disease, heart failure, antihypertensive drugs, and statins.</p></fn></table-wrap-foot></table-wrap><p>Kaplan-Meier survival curves revealed that the phenotype 1 group had a higher risk of stroke (<italic>P</italic>&#x003C;.001; <xref ref-type="fig" rid="figure4">Figure 4</xref>).</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Kaplan-Meier survival curves of stroke-free probability by phenotype.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e77017_fig04.png"/></fig><p>Regarding stroke subtypes, cardiac function phenotypes were associated with cerebral infarction and other nontraumatic intracranial hemorrhage (all <italic>P</italic>&#x003C;.05; Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). When mortality was considered as a competing risk, phenotype 2 remained significantly associated with stroke risk (HR 0.578, 95% CI 0.484-0.691; <italic>P</italic>&#x003C;.001; Figure S8 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s3-4"><title>Supervised ML</title><p>Basal metabolic rate, sex, testosterone, standing height, weight, forced vital capacity, waist circumference, creatinine, forced expiratory volume in 1 second, and urate were included in the ML models (Table S6 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). By integrating the accuracy in the training and validation sets, we selected the random forest model as the optimal model based on its excellent accuracy (area under the curve 0.914, 95% CI 0.911-0.918 for training and 0.867, 95% CI 0.858-0.876 for validation; and accuracy 0.837, 95% CI 0.833-0.841 for training and 0.805, 95% CI 0.804-0.806 for validation) without overfitting the training set (<xref ref-type="fig" rid="figure5">Figure 5</xref>). Calibration plots exhibited that the random forest model had good performance in the calibration quality (Brier score 0.111, 95% CI 0.109-0.113 for training and 0.132, 95% CI 0.127-0.137 for validation; <xref ref-type="table" rid="table3">Table 3</xref> and Tables S7 and S8 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). We drew a feature importance plot to better visualize the contributions of the predictors to the predictive power of the random forest model (Figure S9 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Machine learning for phenotypes. ANN: artificial neural network; AUC: area under the curve; KNN: k-nearest neighbors; LGBM: light gradient boosting machine; LR: logistic regression; RF: random forest; SVM: support vector machine; XGB: extreme gradient boosting (XGBoost).</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="aging_v9i1e77017_fig05.png"/></fig><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Model evaluation and validation.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Models</td><td align="left" valign="bottom" colspan="2">Training set</td><td align="left" valign="bottom" colspan="2">Validation set</td></tr><tr><td align="left" valign="bottom"/><td align="left" valign="top">Accuracy (95% CI)</td><td align="left" valign="top">Brier score (95% CI)</td><td align="left" valign="top">Accuracy (95% CI)</td><td align="left" valign="top">Brier score (95% CI)</td></tr></thead><tbody><tr><td align="left" valign="top">K-nearest neighbor</td><td align="left" valign="top">1.000 (1.000-1.000)</td><td align="left" valign="top">0.000 (0.000-0.000)</td><td align="left" valign="top">0.800 (0.800-0.800)</td><td align="left" valign="top">0.134 (0.130-0.139)</td></tr><tr><td align="left" valign="top">Logistic regression</td><td align="left" valign="top">0.797 (0.793-0.802)</td><td align="left" valign="top">0.136 (0.134-0.139)</td><td align="left" valign="top">0.802 (0.802-0.802)</td><td align="left" valign="top">0.132 (0.127-0.137)</td></tr><tr><td align="left" valign="top">Support vector machine</td><td align="left" valign="top">0.795 (0.791-0.800)</td><td align="left" valign="top">0.137 (0.135-0.140)</td><td align="left" valign="top">0.802 (0.802-0.802)</td><td align="left" valign="top">0.133 (0.128-0.138)</td></tr><tr><td align="left" valign="top">Random forest</td><td align="left" valign="top">0.837 (0.833-0.841)</td><td align="left" valign="top">0.111 (0.109-0.113)</td><td align="left" valign="top">0.805 (0.804-0.806)</td><td align="left" valign="top">0.132 (0.127-0.137)</td></tr><tr><td align="left" valign="top">Light gradient boosting machine</td><td align="left" valign="top">0.810 (0.805-0.814)</td><td align="left" valign="top">0.126 (0.124-0.128)</td><td align="left" valign="top">0.805 (0.805-0.805)</td><td align="left" valign="top">0.132 (0.128-0.137)</td></tr><tr><td align="left" valign="top">Extreme Gradient Boosting</td><td align="left" valign="top">0.799 (0.795-0.804)</td><td align="left" valign="top">0.134 (0.132-0.137)</td><td align="left" valign="top">0.804 (0.804-0.804)</td><td align="left" valign="top">0.132 (0.127-0.137)</td></tr><tr><td align="left" valign="top">Artificial neural networks</td><td align="left" valign="top">0.797 (0.793-0.802)</td><td align="left" valign="top">0.136 (0.133-0.138)</td><td align="left" valign="top">0.803 (0.803-0.804)</td><td align="left" valign="top">0.132 (0.127-0.136)</td></tr></tbody></table></table-wrap><p>After entering the participant information, the local model calculated the corresponding phenotype, and the DeepSeek-R1 model provided an analysis of the participant&#x2019;s health status along with recommendations for potential clinical application (Figure S10 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>In this study, we identified distinct cardiac function phenotypes related to cardiovascular aging using the GTM model based on CMR parameters. These phenotypes were significantly associated with long-term stroke risk and could be reliably predicted by supervised ML models.</p><p>CMR is important for evaluating cardiovascular pathologies and for assessing the etiology and prognosis of patients with stroke. A previous study demonstrated that cardiovascular aging is associated with reduced LV volumes and increased LV concentricity on CMR, with notable sex-specific differences in systolic cardiac function [<xref ref-type="bibr" rid="ref9">9</xref>]. CMR also exhibited high sensitivity in detecting intraventricular thrombi and thrombi within the LA appendage [<xref ref-type="bibr" rid="ref23">23</xref>]. Additionally, CMR imaging could affect the management of acute stroke by detecting aortic plaques, cardiac structural abnormalities, and intracardiac thrombi in patients with stroke [<xref ref-type="bibr" rid="ref24">24</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. However, CMR metrics represented multidimensional data with complex interrelations, potentially involving collinearity and interaction effects. Using unsupervised ML may improve the ability to reveal the inherent structure of the data and achieve more accurate classification.</p><p>GTM incorporated probability distribution functions to refine the self-organizing map algorithms and mitigated their inherent limitations, such as convergence issues, insufficient neighborhood preservation, and the absence of a distinct objective function. Moreover, GTM was capable of visually representing phenotypes through latent spaces [<xref ref-type="bibr" rid="ref17">17</xref>]. Sattarov et al [<xref ref-type="bibr" rid="ref26">26</xref>] applied GTM to explore the latent space of Simplified Molecular Input Line Entry System&#x2013;based autoencoders for generating targeted molecular libraries and visualized the autoencoder latent space on a 2D topographic map. These findings indicated a promising application of GTM in structure-based affinity assessments. However, unsupervised ML faces challenges related to limited interpretability and scalability, making the derived phenotypes and their clinical relevance difficult to translate into real-world medical practice. Therefore, we innovatively applied supervised ML to relearn the phenotype labels obtained from GTM, constructing a random forest model that accurately predicted the 2 distinct phenotypes. Given the high cost and inconvenience of CMR scans for patients with stroke [<xref ref-type="bibr" rid="ref27">27</xref>], using clinical variables allowed for a reduction in model application requirements while preserving accuracy, making the classification model more suitable for clinical use.</p><p>The phenotypes derived from CMR metrics may reflect distinct patterns of cardiac structural and functional remodeling associated with cardiovascular aging. Key variables contributing to phenotype differentiation, including LVMM and concentric geometry, have been linked to vascular aging markers, supporting the connection between cardiovascular aging and cardiac structural changes [<xref ref-type="bibr" rid="ref28">28</xref>]. LA enlargement and functional impairment are also recognized markers of cardiovascular aging and are related to chronic diastolic dysfunction and atrial fibrillation [<xref ref-type="bibr" rid="ref29">29</xref>]. In addition, accelerated cardiovascular aging driven by cumulative risk factors such as hypertension, obesity, diabetes, and coronary artery disease may further promote cardiac remodeling, consistent with the differing comorbidity profiles observed between the phenotypes in our study [<xref ref-type="bibr" rid="ref30">30</xref>]. Notably, the cardiovascular aging&#x2013;related phenotype in our study was characterized by LV and LA abnormalities indicative of volume or pressure overload and myocardial dysfunction. These alterations have been associated with increased risks of cardioembolic stroke and subclinical cerebral infarction [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. Therefore, the CMR-derived phenotypes may capture different stages of cardiovascular aging and help explain the heterogeneity of cardiac remodeling and its potential contribution to long-term stroke risk.</p><p>In our study, supervised ML models identified several clinical parameters as predictors for cardiac function phenotypes. Notably, basal metabolic rate is the energy required to maintain essential functions in a healthy state. Prior research indicated that basal metabolic rate was independently linked to heart failure, atrial fibrillation, and flutter and acted as a risk factor for cardiovascular mortality [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. Furthermore, a pooled analysis of 8 cohorts showed that obstructive and restrictive physiology were associated with incident heart failure with reduced or preserved ejection fraction [<xref ref-type="bibr" rid="ref35">35</xref>]. Moreover, a distinctive J-shaped curve was noted between BMI and waist circumference and the risk of heart failure [<xref ref-type="bibr" rid="ref36">36</xref>]. Additionally, renal impairment in chronic heart failure was typically linked to decreased cardiac output and subsequent renal hypoperfusion, and targeting volume overload may improve outcomes in cardiac dysfunction [<xref ref-type="bibr" rid="ref37">37</xref>]. These findings suggested that the ML model could reflect systemic metabolic, cardiopulmonary, and renal alterations that may explain the clinical characteristics of the identified cardiac function phenotypes.</p><p>To the best of our knowledge, this was the first study to use GTM for clustering CMR parameters and to identify cardiovascular aging phenotypes associated with long-term stroke risk. However, there were several limitations to our study. First, the CMR parameters extracted from the UK Biobank were collected according to the cohort&#x2019;s standardized protocols. Because the CMR examination protocol may differ in other studies, this should be considered when applying our model to other cohorts. Second, while trained on the UK Biobank&#x2019;s large sample, the model&#x2019;s applicability to other cohorts may be limited by environmental, genetic, and cultural variations. Third, given the predominantly White and healthy population in the UK Biobank, selection and health biases may be inevitable. The generalizability of our findings to ancestrally diverse individuals will assist in determining whether more appropriate and ethnically relevant decisions are needed.</p></sec><sec id="s4-2"><title>Conclusions</title><p>In conclusion, we used GTM to identify cardiac function phenotypes based on CMR parameters. The identified phenotypes were significantly associated with stroke risk, with the high-risk phenotype characterized by impaired cardiac function and features related to cardiovascular aging. Furthermore, we relearned phenotype labels using supervised ML models, enabling phenotype prediction from clinical variables. These models may facilitate the identification of individuals at higher risk and support the development of preventive and therapeutic strategies. Further studies are warranted to explore the potential mechanisms linking cardiovascular aging, cardiac phenotypic heterogeneity, and stroke risk.</p></sec></sec></body><back><ack><p>The authors thank the UK Biobank participants. This study was conducted using the UK Biobank resource (application number 106487).</p></ack><notes><sec><title>Funding</title><p>The project was supported by the Program for Innovative Research Team of the First Affiliated Hospital of University of Science and Technology of China (2023IHM01050), the National Natural Science Foundation of China (NSFC-82471341 and NSFC-U22A20341), the Guangxi Natural Science Foundation (2025GXNSFAA069341), and the Joint Project on Regional High-Incidence Diseases Research of the Guangxi Natural Science Foundation (2023GXNSFAA026197).</p></sec><sec><title>Data Availability</title><p>All data used in this study were accessed from the publicly available UK Biobank resource (application number 106487). Data from this study cannot be shared with other investigators. The source code for the analyses and the established machine learning models is available on GitHub [<xref ref-type="bibr" rid="ref38">38</xref>].</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: KY, MX, WS</p><p>Data curation: JZ</p><p>Formal analysis: JZ</p><p>Funding acquisition: XL</p><p>Investigation: JZ</p><p>Project administration: WS</p><p>Software: JZ</p><p>Supervision: WS</p><p>Writing&#x2014;original draft: KY, DK</p><p>Writing&#x2014;review and editing: RL, WS, XL</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">API</term><def><p>application programming interface</p></def></def-item><def-item><term id="abb2">CMR</term><def><p>cardiovascular magnetic resonance</p></def></def-item><def-item><term id="abb3">GTM</term><def><p>generative topographic mapping</p></def></def-item><def-item><term id="abb4">HR</term><def><p>hazard ratio</p></def></def-item><def-item><term id="abb5">LA</term><def><p>left atrial</p></def></def-item><def-item><term id="abb6">LAEF</term><def><p>left atrial ejection fraction</p></def></def-item><def-item><term id="abb7">LAMV</term><def><p>left atrial maximum volume</p></def></def-item><def-item><term id="abb8">LV</term><def><p>left ventricular</p></def></def-item><def-item><term id="abb9">LVEDV</term><def><p>left ventricular end-diastolic volume</p></def></def-item><def-item><term id="abb10">LVEF</term><def><p>left ventricular ejection fraction</p></def></def-item><def-item><term id="abb11">LVESV</term><def><p>left ventricular end-systolic volume</p></def></def-item><def-item><term id="abb12">LVGLS</term><def><p>left ventricular global longitudinal strain</p></def></def-item><def-item><term id="abb13">LVMM</term><def><p>left ventricular myocardial mass</p></def></def-item><def-item><term id="abb14">LVSV</term><def><p>left ventricular stroke volume</p></def></def-item><def-item><term id="abb15">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb16">TRIPOD</term><def><p>transparent reporting of a multivariable prediction model for individual prognosis or diagnosis</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><collab>GBD 2019 Stroke Collaborators</collab></person-group><article-title>Global, regional, and national burden of stroke and its risk factors, 1990-2019: a systematic analysis for the Global Burden of Disease Study 2019</article-title><source>Lancet Neurol</source><year>2021</year><month>10</month><volume>20</volume><issue>10</issue><fpage>795</fpage><lpage>820</lpage><pub-id pub-id-type="doi">10.1016/S1474-4422(21)00252-0</pub-id><pub-id pub-id-type="medline">34487721</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vakka</surname><given-names>A</given-names> </name><name name-style="western"><surname>Warren</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Drosatos</surname><given-names>K</given-names> </name></person-group><article-title>Cardiovascular aging: from cellular and molecular changes to therapeutic interventions</article-title><source>J Cardiovasc Aging</source><year>2023</year><volume>3</volume><issue>3</issue><fpage>23</fpage><pub-id pub-id-type="doi">10.20517/jca.2023.09</pub-id><pub-id pub-id-type="medline">37274126</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rim</surname><given-names>D</given-names> </name><name name-style="western"><surname>Henderson</surname><given-names>LA</given-names> </name><name name-style="western"><surname>Macefield</surname><given-names>VG</given-names> </name></person-group><article-title>Brain and cardiovascular-related changes are associated with aging, hypertension, and atrial fibrillation</article-title><source>Clin Auton Res</source><year>2022</year><month>12</month><volume>32</volume><issue>6</issue><fpage>409</fpage><lpage>422</lpage><pub-id pub-id-type="doi">10.1007/s10286-022-00907-9</pub-id><pub-id pub-id-type="medline">36409380</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Subramanian</surname><given-names>V</given-names> </name><name name-style="western"><surname>Tucker</surname><given-names>WJ</given-names> </name><name name-style="western"><surname>Peters</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Upadhya</surname><given-names>B</given-names> </name><name name-style="western"><surname>Kitzman</surname><given-names>DW</given-names> </name><name name-style="western"><surname>Pandey</surname><given-names>A</given-names> </name></person-group><article-title>Cardiovascular aging and exercise: implications for heart failure prevention and management</article-title><source>Circ Res</source><year>2025</year><month>07</month><day>7</day><volume>137</volume><issue>2</issue><fpage>205</fpage><lpage>230</lpage><pub-id pub-id-type="doi">10.1161/CIRCRESAHA.125.325531</pub-id><pub-id pub-id-type="medline">40608862</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Polymeris</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Meinel</surname><given-names>TR</given-names> </name><name name-style="western"><surname>Oehler</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Aetiology, secondary prevention strategies and outcomes of ischaemic stroke despite oral anticoagulant therapy in patients with atrial fibrillation</article-title><source>J Neurol Neurosurg Psychiatry</source><year>2022</year><month>06</month><volume>93</volume><issue>6</issue><fpage>588</fpage><lpage>598</lpage><pub-id pub-id-type="doi">10.1136/jnnp-2021-328391</pub-id><pub-id pub-id-type="medline">35396339</pub-id></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Doehner</surname><given-names>W</given-names> </name><name name-style="western"><surname>B&#x00F6;hm</surname><given-names>M</given-names> </name><name name-style="western"><surname>Boriani</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Interaction of heart failure and stroke: a clinical consensus statement of the ESC Council on Stroke, the Heart Failure Association (HFA) and the ESC Working Group on Thrombosis</article-title><source>Eur J Heart Fail</source><year>2023</year><month>12</month><volume>25</volume><issue>12</issue><fpage>2107</fpage><lpage>2129</lpage><pub-id pub-id-type="doi">10.1002/ejhf.3071</pub-id><pub-id pub-id-type="medline">37905380</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dutta</surname><given-names>P</given-names> </name><name name-style="western"><surname>Courties</surname><given-names>G</given-names> </name><name name-style="western"><surname>Wei</surname><given-names>Y</given-names> </name><etal/></person-group><article-title>Myocardial infarction accelerates atherosclerosis</article-title><source>Nature</source><year>2012</year><month>07</month><day>19</day><volume>487</volume><issue>7407</issue><fpage>325</fpage><lpage>329</lpage><pub-id pub-id-type="doi">10.1038/nature11260</pub-id><pub-id pub-id-type="medline">22763456</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Mayfield</surname><given-names>JJ</given-names> </name><name name-style="western"><surname>Otto</surname><given-names>CM</given-names> </name></person-group><article-title>Stroke and noninfective native valvular disease</article-title><source>Curr Cardiol Rep</source><year>2023</year><month>05</month><volume>25</volume><issue>5</issue><fpage>333</fpage><lpage>348</lpage><pub-id pub-id-type="doi">10.1007/s11886-023-01855-0</pub-id><pub-id pub-id-type="medline">36971961</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Grassow</surname><given-names>L</given-names> </name><name name-style="western"><surname>Gr&#x00F6;schel</surname><given-names>J</given-names> </name><name name-style="western"><surname>Saad</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Sex-specific structural and functional cardiac remodeling during healthy aging assessed by cardiovascular magnetic resonance</article-title><source>Clin Res Cardiol</source><year>2025</year><month>12</month><volume>114</volume><issue>12</issue><fpage>1619</fpage><lpage>1630</lpage><pub-id pub-id-type="doi">10.1007/s00392-024-02430-5</pub-id><pub-id pub-id-type="medline">38466347</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Maheshwari</surname><given-names>A</given-names> </name><name name-style="western"><surname>Norby</surname><given-names>FL</given-names> </name><name name-style="western"><surname>Inciardi</surname><given-names>RM</given-names> </name><etal/></person-group><article-title>Left atrial mechanical dysfunction and the risk for ischemic stroke in people without prevalent atrial fibrillation or stroke: a prospective cohort study</article-title><source>Ann Intern Med</source><year>2023</year><month>01</month><volume>176</volume><issue>1</issue><fpage>39</fpage><lpage>48</lpage><pub-id pub-id-type="doi">10.7326/M22-1638</pub-id><pub-id pub-id-type="medline">36534978</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tsao</surname><given-names>CW</given-names> </name><name name-style="western"><surname>Gona</surname><given-names>PN</given-names> </name><name name-style="western"><surname>Salton</surname><given-names>CJ</given-names> </name><etal/></person-group><article-title>Left ventricular structure and risk of cardiovascular events: a Framingham Heart Study cardiac magnetic resonance study</article-title><source>J Am Heart Assoc</source><year>2015</year><month>09</month><day>15</day><volume>4</volume><issue>9</issue><fpage>e002188</fpage><pub-id pub-id-type="doi">10.1161/JAHA.115.002188</pub-id><pub-id pub-id-type="medline">26374295</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Narang</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bae</surname><given-names>R</given-names> </name><name name-style="western"><surname>Hong</surname><given-names>H</given-names> </name><etal/></person-group><article-title>Utility of a deep-learning algorithm to guide novices to acquire echocardiograms for limited diagnostic use</article-title><source>JAMA Cardiol</source><year>2021</year><month>06</month><day>1</day><volume>6</volume><issue>6</issue><fpage>624</fpage><lpage>632</lpage><pub-id pub-id-type="doi">10.1001/jamacardio.2021.0185</pub-id><pub-id pub-id-type="medline">33599681</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kusunose</surname><given-names>K</given-names> </name><name name-style="western"><surname>Haga</surname><given-names>A</given-names> </name><name name-style="western"><surname>Abe</surname><given-names>T</given-names> </name><name name-style="western"><surname>Sata</surname><given-names>M</given-names> </name></person-group><article-title>Utilization of artificial intelligence in echocardiography</article-title><source>Circ J</source><year>2019</year><month>07</month><day>25</day><volume>83</volume><issue>8</issue><fpage>1623</fpage><lpage>1629</lpage><pub-id pub-id-type="doi">10.1253/circj.CJ-19-0420</pub-id><pub-id pub-id-type="medline">31257314</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Verbeeck</surname><given-names>N</given-names> </name><name name-style="western"><surname>Caprioli</surname><given-names>RM</given-names> </name><name name-style="western"><surname>Van de Plas</surname><given-names>R</given-names> </name></person-group><article-title>Unsupervised machine learning for exploratory data analysis in imaging mass spectrometry</article-title><source>Mass Spectrom Rev</source><year>2020</year><month>05</month><volume>39</volume><issue>3</issue><fpage>245</fpage><lpage>291</lpage><pub-id pub-id-type="doi">10.1002/mas.21602</pub-id><pub-id pub-id-type="medline">31602691</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chao</surname><given-names>CJ</given-names> </name><name name-style="western"><surname>Kato</surname><given-names>N</given-names> </name><name name-style="western"><surname>Scott</surname><given-names>CG</given-names> </name><etal/></person-group><article-title>Unsupervised machine learning for assessment of left ventricular diastolic function and risk stratification</article-title><source>J Am Soc Echocardiogr</source><year>2022</year><month>12</month><volume>35</volume><issue>12</issue><fpage>1214</fpage><lpage>1225.e8</lpage><pub-id pub-id-type="doi">10.1016/j.echo.2022.06.013</pub-id><pub-id pub-id-type="medline">35840082</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ntaios</surname><given-names>G</given-names> </name><name name-style="western"><surname>Weng</surname><given-names>SF</given-names> </name><name name-style="western"><surname>Perlepe</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Data&#x2010;driven machine&#x2010;learning analysis of potential embolic sources in embolic stroke of undetermined source</article-title><source>Eur J Neurol</source><year>2021</year><month>01</month><volume>28</volume><issue>1</issue><fpage>192</fpage><lpage>201</lpage><pub-id pub-id-type="doi">10.1111/ene.14524</pub-id><pub-id pub-id-type="medline">32918305</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kireeva</surname><given-names>N</given-names> </name><name name-style="western"><surname>Baskin</surname><given-names>II</given-names> </name><name name-style="western"><surname>Gaspar</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Horvath</surname><given-names>D</given-names> </name><name name-style="western"><surname>Marcou</surname><given-names>G</given-names> </name><name name-style="western"><surname>Varnek</surname><given-names>A</given-names> </name></person-group><article-title>Generative topographic mapping (GTM): universal tool for data visualization, structure-activity modeling and dataset comparison</article-title><source>Mol Inform</source><year>2012</year><month>04</month><volume>31</volume><issue>3-4</issue><fpage>301</fpage><lpage>312</lpage><pub-id pub-id-type="doi">10.1002/minf.201100163</pub-id><pub-id pub-id-type="medline">27477099</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Olier</surname><given-names>I</given-names> </name><name name-style="western"><surname>Vellido</surname><given-names>A</given-names> </name></person-group><article-title>Advances in clustering and visualization of time series using GTM through time</article-title><source>Neural Netw</source><year>2008</year><month>09</month><volume>21</volume><issue>7</issue><fpage>904</fpage><lpage>913</lpage><pub-id pub-id-type="doi">10.1016/j.neunet.2008.05.013</pub-id><pub-id pub-id-type="medline">18653311</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ezugwu</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Shukla</surname><given-names>AK</given-names> </name><name name-style="western"><surname>Agbaje</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Oyelade</surname><given-names>ON</given-names> </name><name name-style="western"><surname>Jos&#x00E9;-Garc&#x00ED;a</surname><given-names>A</given-names> </name><name name-style="western"><surname>Agushaka</surname><given-names>JO</given-names> </name></person-group><article-title>Automatic clustering algorithms: a systematic review and bibliometric analysis of relevant literature</article-title><source>Neural Comput Appl</source><year>2021</year><month>06</month><volume>33</volume><fpage>6247</fpage><lpage>6306</lpage><pub-id pub-id-type="doi">10.1007/s00521-020-05395-4</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bellfield</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Olier</surname><given-names>I</given-names> </name><name name-style="western"><surname>Lotto</surname><given-names>R</given-names> </name><etal/></person-group><article-title>AI-based derivation of atrial fibrillation phenotypes in the general and critical care populations</article-title><source>EBioMedicine</source><year>2024</year><month>09</month><volume>107</volume><fpage>105280</fpage><pub-id pub-id-type="doi">10.1016/j.ebiom.2024.105280</pub-id><pub-id pub-id-type="medline">39153412</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="web"><article-title>Health research data for the world</article-title><source>UK Biobank</source><access-date>2026-04-04</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.ukbiobank.ac.uk">https://www.ukbiobank.ac.uk</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Vellido</surname><given-names>A</given-names> </name><name name-style="western"><surname>Lisboa</surname><given-names>P</given-names> </name><name name-style="western"><surname>Meehan</surname><given-names>K</given-names> </name></person-group><article-title>The generative topographic mapping as a principal model for data visualization and market segmentation: an electronic commerce case study</article-title><source>Int J Comput Syst Signals</source><year>2000</year><access-date>2026-04-04</access-date><volume>1</volume><issue>2</issue><fpage>119</fpage><lpage>138</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://www.researchgate.net/publication/224881827_The_generative_topographic_mapping_as_a_principal_model_for_data_visualization_and_market_segmentation_An_electronic_commerce_case_study">https://www.researchgate.net/publication/224881827_The_generative_topographic_mapping_as_a_principal_model_for_data_visualization_and_market_segmentation_An_electronic_commerce_case_study</ext-link></comment></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Takasugi</surname><given-names>J</given-names> </name><name name-style="western"><surname>Yamagami</surname><given-names>H</given-names> </name><name name-style="western"><surname>Noguchi</surname><given-names>T</given-names> </name><etal/></person-group><article-title>Detection of left ventricular thrombus by cardiac magnetic resonance in embolic stroke of undetermined source</article-title><source>Stroke</source><year>2017</year><month>09</month><volume>48</volume><issue>9</issue><fpage>2434</fpage><lpage>2440</lpage><pub-id pub-id-type="doi">10.1161/STROKEAHA.117.018263</pub-id><pub-id pub-id-type="medline">28818863</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Siebermair</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kholmovski</surname><given-names>EG</given-names> </name><name name-style="western"><surname>Marrouche</surname><given-names>N</given-names> </name></person-group><article-title>Assessment of left atrial fibrosis by late gadolinium enhancement magnetic resonance imaging: methodology and clinical implications</article-title><source>JACC Clin Electrophysiol</source><year>2017</year><month>08</month><volume>3</volume><issue>8</issue><fpage>791</fpage><lpage>802</lpage><pub-id pub-id-type="doi">10.1016/j.jacep.2017.07.004</pub-id><pub-id pub-id-type="medline">29759774</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fonseca</surname><given-names>AC</given-names> </name><name name-style="western"><surname>Alves</surname><given-names>P</given-names> </name><name name-style="western"><surname>In&#x00E1;cio</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Patients with undetermined stroke have increased atrial fibrosis: a cardiac magnetic resonance imaging study</article-title><source>Stroke</source><year>2018</year><month>03</month><volume>49</volume><issue>3</issue><fpage>734</fpage><lpage>737</lpage><pub-id pub-id-type="doi">10.1161/STROKEAHA.117.019641</pub-id><pub-id pub-id-type="medline">29371431</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sattarov</surname><given-names>B</given-names> </name><name name-style="western"><surname>Baskin</surname><given-names>II</given-names> </name><name name-style="western"><surname>Horvath</surname><given-names>D</given-names> </name><name name-style="western"><surname>Marcou</surname><given-names>G</given-names> </name><name name-style="western"><surname>Bjerrum</surname><given-names>EJ</given-names> </name><name name-style="western"><surname>Varnek</surname><given-names>A</given-names> </name></person-group><article-title>De novo molecular design by combining deep autoencoder recurrent neural networks with generative topographic mapping</article-title><source>J Chem Inf Model</source><year>2019</year><month>03</month><day>25</day><volume>59</volume><issue>3</issue><fpage>1182</fpage><lpage>1196</lpage><pub-id pub-id-type="doi">10.1021/acs.jcim.8b00751</pub-id><pub-id pub-id-type="medline">30785751</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Meinel</surname><given-names>TR</given-names> </name><name name-style="western"><surname>Eggimann</surname><given-names>A</given-names> </name><name name-style="western"><surname>Brignoli</surname><given-names>K</given-names> </name><etal/></person-group><article-title>Cardiovascular MRI compared to echocardiography to identify cardioaortic sources of ischemic stroke: a systematic review and meta-analysis</article-title><source>Front Neurol</source><year>2021</year><volume>12</volume><fpage>699838</fpage><pub-id pub-id-type="doi">10.3389/fneur.2021.699838</pub-id><pub-id pub-id-type="medline">34393979</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>T</given-names> </name><name name-style="western"><surname>Zeng</surname><given-names>J</given-names> </name><name name-style="western"><surname>Zhao</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Relationship between vascular aging and left ventricular geometry in patients with obstructive sleep apnea hypopnea syndrome-related hypertension</article-title><source>Sci Rep</source><year>2025</year><volume>15</volume><issue>1</issue><fpage>6191</fpage><pub-id pub-id-type="doi">10.1038/s41598-025-89964-4</pub-id><pub-id pub-id-type="medline">39979427</pub-id></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Fang</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Raza</surname><given-names>U</given-names> </name><name name-style="western"><surname>Song</surname><given-names>J</given-names> </name><etal/></person-group><article-title>Systemic aging fuels heart failure: molecular mechanisms and therapeutic avenues</article-title><source>ESC Heart Fail</source><year>2025</year><month>04</month><volume>12</volume><issue>2</issue><fpage>1059</fpage><lpage>1080</lpage><pub-id pub-id-type="doi">10.1002/ehf2.14947</pub-id><pub-id pub-id-type="medline">39034866</pub-id></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Triposkiadis</surname><given-names>F</given-names> </name><name name-style="western"><surname>Xanthopoulos</surname><given-names>A</given-names> </name><name name-style="western"><surname>Parissis</surname><given-names>J</given-names> </name><name name-style="western"><surname>Butler</surname><given-names>J</given-names> </name><name name-style="western"><surname>Farmakis</surname><given-names>D</given-names> </name></person-group><article-title>Pathogenesis of chronic heart failure: cardiovascular aging, risk factors, comorbidities, and disease modifiers</article-title><source>Heart Fail Rev</source><year>2022</year><month>01</month><volume>27</volume><issue>1</issue><fpage>337</fpage><lpage>344</lpage><pub-id pub-id-type="doi">10.1007/s10741-020-09987-z</pub-id><pub-id pub-id-type="medline">32524327</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kamel</surname><given-names>H</given-names> </name><name name-style="western"><surname>Okin</surname><given-names>PM</given-names> </name><name name-style="western"><surname>Merkler</surname><given-names>AE</given-names> </name><etal/></person-group><article-title>Relationship between left atrial volume and ischemic stroke subtype</article-title><source>Ann Clin Transl Neurol</source><year>2019</year><month>08</month><volume>6</volume><issue>8</issue><fpage>1480</fpage><lpage>1486</lpage><pub-id pub-id-type="doi">10.1002/acn3.50841</pub-id><pub-id pub-id-type="medline">31402612</pub-id></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Shaikh</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>B</given-names> </name><name name-style="western"><surname>Ahmed</surname><given-names>M</given-names> </name><etal/></person-group><article-title>Left atrial volumes and associated stroke subtypes</article-title><source>BMC Neurol</source><year>2013</year><month>10</month><day>18</day><volume>13</volume><fpage>149</fpage><pub-id pub-id-type="doi">10.1186/1471-2377-13-149</pub-id><pub-id pub-id-type="medline">24139054</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhao</surname><given-names>P</given-names> </name><name name-style="western"><surname>Han</surname><given-names>F</given-names> </name><name name-style="western"><surname>Liang</surname><given-names>X</given-names> </name><etal/></person-group><article-title>Causal effects of basal metabolic rate on cardiovascular disease: a bidirectional Mendelian randomization study</article-title><source>J Am Heart Assoc</source><year>2024</year><month>01</month><day>2</day><volume>13</volume><issue>1</issue><fpage>e031447</fpage><pub-id pub-id-type="doi">10.1161/JAHA.123.031447</pub-id><pub-id pub-id-type="medline">38156559</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ruggiero</surname><given-names>C</given-names> </name><name name-style="western"><surname>Metter</surname><given-names>EJ</given-names> </name><name name-style="western"><surname>Melenovsky</surname><given-names>V</given-names> </name><etal/></person-group><article-title>High basal metabolic rate is a risk factor for mortality: the Baltimore Longitudinal Study of Aging</article-title><source>J Gerontol A Biol Sci Med Sci</source><year>2008</year><month>07</month><volume>63</volume><issue>7</issue><fpage>698</fpage><lpage>706</lpage><pub-id pub-id-type="doi">10.1093/gerona/63.7.698</pub-id><pub-id pub-id-type="medline">18693224</pub-id></nlm-citation></ref><ref id="ref35"><label>35</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eckhardt</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Balte</surname><given-names>PP</given-names> </name><name name-style="western"><surname>Barr</surname><given-names>RG</given-names> </name><etal/></person-group><article-title>Lung function impairment and risk of incident heart failure: the NHLBI Pooled Cohorts Study</article-title><source>Eur Heart J</source><year>2022</year><month>06</month><day>14</day><volume>43</volume><issue>23</issue><fpage>2196</fpage><lpage>2208</lpage><pub-id pub-id-type="doi">10.1093/eurheartj/ehac205</pub-id><pub-id pub-id-type="medline">35467708</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhou</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Chai</surname><given-names>X</given-names> </name><name name-style="western"><surname>Yang</surname><given-names>G</given-names> </name><name name-style="western"><surname>Sun</surname><given-names>X</given-names> </name><name name-style="western"><surname>Xing</surname><given-names>Z</given-names> </name></person-group><article-title>Changes in body mass index and waist circumference and heart failure in type 2 diabetes mellitus</article-title><source>Front Endocrinol (Lausanne)</source><year>2023</year><volume>14</volume><fpage>1305839</fpage><pub-id pub-id-type="doi">10.3389/fendo.2023.1305839</pub-id><pub-id pub-id-type="medline">38179309</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sinkeler</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Damman</surname><given-names>K</given-names> </name><name name-style="western"><surname>van Veldhuisen</surname><given-names>DJ</given-names> </name><name name-style="western"><surname>Hillege</surname><given-names>H</given-names> </name><name name-style="western"><surname>Navis</surname><given-names>G</given-names> </name></person-group><article-title>A re-appraisal of volume status and renal function impairment in chronic heart failure: combined effects of pre-renal failure and venous congestion on renal function</article-title><source>Heart Fail Rev</source><year>2012</year><month>03</month><volume>17</volume><issue>2</issue><fpage>263</fpage><lpage>270</lpage><pub-id pub-id-type="doi">10.1007/s10741-011-9233-7</pub-id><pub-id pub-id-type="medline">21365244</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="web"><article-title>Qianwg/ml_stroke</article-title><source>GitHub</source><access-date>2025-05-25</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://github.com/qianwg/ML_Stroke">https://github.com/qianwg/ML_Stroke</ext-link></comment></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Additional methods and results detailing cardiovascular magnetic resonance analysis, generative topographic mapping for cardiac phenotyping, and machine learning frameworks for stroke risk prediction. Includes comprehensive methodology, participant characteristics, and model validation metrics using UK Biobank data.</p><media xlink:href="aging_v9i1e77017_app1.docx" xlink:title="DOCX File, 8399 KB"/></supplementary-material><supplementary-material id="app2"><label>Checklist 1</label><p>TRIPOD checklist.</p><media xlink:href="aging_v9i1e77017_app2.pdf" xlink:title="PDF File, 681 KB"/></supplementary-material></app-group></back></article>