<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JA</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Aging</journal-id>
      <journal-title>JMIR Aging</journal-title>
      <issn pub-type="epub">2561-7605</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v8i1e65178</article-id>
      <article-id pub-id-type="pmid"/>
      <article-id pub-id-type="doi">10.2196/65178</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Unsupervised Deep Learning of Electronic Health Records to Characterize Heterogeneity Across Alzheimer Disease and Related Dementias: Cross-Sectional Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Liu</surname>
            <given-names>Darren</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Zapata</surname>
            <given-names>Ruben</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chrimes</surname>
            <given-names>Dillon</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chaturvedi</surname>
            <given-names>Akhil</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>West</surname>
            <given-names>Matthew</given-names>
          </name>
          <degrees>MPhys, SM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0006-5455-8693</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Cheng</surname>
            <given-names>You</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-3141-0104</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>He</surname>
            <given-names>Yingnan</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0009-0003-6082-3893</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author">
          <name name-style="western">
            <surname>Leng</surname>
            <given-names>Yu</given-names>
          </name>
          <degrees>SM</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7039-4127</ext-link>
        </contrib>
        <contrib id="contrib5" contrib-type="author">
          <name name-style="western">
            <surname>Magdamo</surname>
            <given-names>Colin</given-names>
          </name>
          <degrees>BS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-8965-4630</ext-link>
        </contrib>
        <contrib id="contrib6" contrib-type="author">
          <name name-style="western">
            <surname>Hyman</surname>
            <given-names>Bradley T</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-7959-9401</ext-link>
        </contrib>
        <contrib id="contrib7" contrib-type="author">
          <name name-style="western">
            <surname>Dickson</surname>
            <given-names>John R</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0135-7928</ext-link>
        </contrib>
        <contrib id="contrib8" contrib-type="author">
          <name name-style="western">
            <surname>Serrano-Pozo</surname>
            <given-names>Alberto</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-0899-7530</ext-link>
        </contrib>
        <contrib id="contrib9" contrib-type="author">
          <name name-style="western">
            <surname>Blacker</surname>
            <given-names>Deborah</given-names>
          </name>
          <degrees>MD, PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6107-7376</ext-link>
        </contrib>
        <contrib id="contrib10" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Das</surname>
            <given-names>Sudeshna</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Massachusetts General Hospital</institution>
            <addr-line>65 Landsdowne Street</addr-line>
            <addr-line>Cambridge, MA, 02139</addr-line>
            <country>United States</country>
            <phone>1 617 768 8254</phone>
            <email>sdas5@mgh.harvard.edu</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9486-6811</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Massachusetts General Hospital</institution>
        <addr-line>Cambridge, MA</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Sudeshna Das <email>sdas5@mgh.harvard.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2025</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>31</day>
        <month>3</month>
        <year>2025</year>
      </pub-date>
      <volume>8</volume>
      <elocation-id>e65178</elocation-id>
      <history>
        <date date-type="received">
          <day>7</day>
          <month>8</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>29</day>
          <month>1</month>
          <year>2025</year>
        </date>
        <date date-type="rev-recd">
          <day>19</day>
          <month>2</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>10</day>
          <month>3</month>
          <year>2025</year>
        </date>
      </history>
      <copyright-statement>©Matthew West, You Cheng, Yingnan He, Yu Leng, Colin Magdamo, Bradley T Hyman, John R Dickson, Alberto Serrano-Pozo, Deborah Blacker, Sudeshna Das. Originally published in JMIR Aging (https://aging.jmir.org), 31.03.2025.</copyright-statement>
      <copyright-year>2025</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Aging, is properly cited. The complete bibliographic information, a link to the original publication on https://aging.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://aging.jmir.org/2025/1/e65178" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Alzheimer disease and related dementias (ADRD) exhibit prominent heterogeneity. Identifying clinically meaningful ADRD subtypes is essential for tailoring treatments to specific patient phenotypes.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to use unsupervised learning techniques on electronic health records (EHRs) from memory clinic patients to identify ADRD subtypes.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We used pretrained embeddings of non-ADRD diagnosis codes (<italic>International Classification of Diseases, Ninth Revision</italic>) and large language model (LLM)–derived embeddings of clinical notes from patient EHRs. Hierarchical clustering of these embeddings was used to identify ADRD subtypes. Clusters were characterized regarding their demographic and clinical features.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We analyzed a cohort of 3454 patients with ADRD from a memory clinic at Massachusetts General Hospital, each with a specialist diagnosis. Clustering pretrained embeddings of the non-ADRD diagnosis codes in patient EHRs revealed the following 3 patient subtypes: one with skin conditions, another with psychiatric disorders and an earlier age of onset, and a third with diabetes complications. Similarly, using LLM-derived embeddings of clinical notes, we identified 3 subtypes of patients as follows: one with psychiatric manifestations and higher prevalence of female participants (prevalence ratio: 1.59), another with cardiovascular and motor problems and higher prevalence of male participants (prevalence ratio: 1.75), and a third one with geriatric health disorders. Notably, we observed significant overlap between clusters from both data modalities (<italic>χ</italic><sup>2</sup><sub>4</sub>=89.4; <italic>P</italic>&lt;.001).</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>By integrating <italic>International Classification of Diseases, Ninth Revision</italic> codes and LLM-derived embeddings, our analysis delineated 2 distinct ADRD subtypes with sex-specific comorbid and clinical presentations, offering insights for potential precision medicine approaches.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>Alzheimer disease and related dementias</kwd>
        <kwd>electronic health records</kwd>
        <kwd>large language models</kwd>
        <kwd>clustering</kwd>
        <kwd>unsupervised learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Alzheimer disease (AD) is a neurodegenerative condition which affects more than 55 million people globally [<xref ref-type="bibr" rid="ref1">1</xref>], and it is the seventh leading cause of death in the United States [<xref ref-type="bibr" rid="ref2">2</xref>]. Despite its substantial public health burden, AD remains poorly understood, with limited treatment options available. AD and related dementias (ADRD) is an umbrella term that refers to multiple dementing illnesses, including AD, frontotemporal dementia (FTD), Lewy body dementia (LBD), and vascular dementia. AD is the most prevalent, accounting for around 60% to 80% of all dementia [<xref ref-type="bibr" rid="ref2">2</xref>]. While these diseases have distinct clinical and neuropathological criteria, there is substantial overlap in both clinical presentation and autopsy findings at the individual patient level. For example, AD is clinically characterized by an amnestic-predominant dementia and neuropathologically defined by the build-up of amyloid beta (Aβ) plaques and neurofibrillary tangles formed by hyperphosphorylated tau protein [<xref ref-type="bibr" rid="ref3">3</xref>]; however, these lesions are frequently accompanied by cerebrovascular disease (CVD) [<xref ref-type="bibr" rid="ref4">4</xref>] or Lewy body pathology [<xref ref-type="bibr" rid="ref5">5</xref>], which can influence clinical presentation. Likewise, LBD is defined by Lewy bodies but is also associated with plaques and tangles [<xref ref-type="bibr" rid="ref6">6</xref>], which may accelerate the rate of cognitive decline [<xref ref-type="bibr" rid="ref7">7</xref>]. This clinical and neuropathological heterogeneity limits our ability to target disease-modifying drugs to each specific neuropathological lesion. The so-called <italic>amyloid hypothesis</italic> has prevailed as the leading explanation of AD disease etiology, where it is held that Aβ toxicity leads to tau hyperphosphorylation, synaptic dysfunction, and neurodegeneration [<xref ref-type="bibr" rid="ref8">8</xref>]. However, treatments targeting this hypothesis only show limited efficacy, which may stem in part from the clinical and neuropathological comorbidities [<xref ref-type="bibr" rid="ref9">9</xref>], highlighting the need for a tailored approach to identify potential subtypes of disease and develop more effective targeted treatments.</p>
        <p>Previous approaches to AD subtyping have focused on RNA expression, as well as brain imaging and cognitive assessments. Neff et al [<xref ref-type="bibr" rid="ref10">10</xref>] identified 5 molecular subtypes of AD using RNA-sequencing signatures, characterized by different dysregulated pathways related to tau-mediated neurodegeneration, Aβ neuroinflammation, synaptic signaling, immune activity, mitochondria organization, and myelination. The Subtype and Stage Inference algorithm, applied to magnetic resonance imaging and positron emission tomography imaging data, identified distinct AD trajectories based on the rate and sequence of brain atrophy [<xref ref-type="bibr" rid="ref11">11</xref>] and tau deposition [<xref ref-type="bibr" rid="ref12">12</xref>]. Cognitive subtypes have also been identified based on memory, visuospatial and linguistic capabilities, and executive function [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref15">15</xref>]. These studies were limited to research cohorts with specific selection criteria, and it is unclear whether these subtypes can be extended to larger samples.</p>
        <p>In contrast, real-world data, such as, electronic health records (EHRs), provide readily accessible large observational datasets and have been used for clustering AD or ADRD subtypes [<xref ref-type="bibr" rid="ref16">16</xref>]. Unsupervised learning approaches on EHR datasets have revealed latent structure in conditions, such as autism [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>] and Parkinson disease [<xref ref-type="bibr" rid="ref19">19</xref>]. For AD subtyping, EHR-based approaches have used the <italic>International Classification of Diseases</italic> (<italic>ICD</italic>) or similar diagnostic codes, showing varying success depending on the methodology and population. Xu et al [<xref ref-type="bibr" rid="ref20">20</xref>] used hierarchical clustering on EHR data from patients with AD, identifying subtypes related to CVD, mental illness, age of onset, and sensory problems. Alexander et al [<xref ref-type="bibr" rid="ref21">21</xref>] found the following 5 patient subtypes: mental health, nontypical AD, typical AD, CVD, and men with cancer. They later identified a consistent subtype with early-onset AD, predominantly female participants, with a faster rate of progression using various machine learning methods [<xref ref-type="bibr" rid="ref22">22</xref>]. Landi et al [<xref ref-type="bibr" rid="ref23">23</xref>] used unsupervised deep learning to encode EHRs with temporal information, identifying early-onset AD, later-onset AD with mild comorbidities, and typical-onset AD with moderate symptoms. He et al [<xref ref-type="bibr" rid="ref24">24</xref>] applied spectral clustering to EHRs of patients with AD, discerning 4 subtypes with significant demographic, mortality, and medication use differences. Tang et al [<xref ref-type="bibr" rid="ref25">25</xref>] analyzed comorbidity patterns in EHRs of patients with AD, revealing sex-dependent variations. In another study, Tang et al [<xref ref-type="bibr" rid="ref26">26</xref>] used EHRs with knowledge networks to predict AD onset and identify sex-specific genetic markers. These studies collectively highlight the varied methodologies and results in EHR-based research, emphasizing the complexity and potential of these approaches for a deeper understanding of AD.</p>
        <p>However, none of these prior studies leveraged the richer representation of EHR data by embedding full sequences of clinical text. Transformers have emerged as state-of-the-art architecture for language modeling and are broadly characterized by the concept of attention [<xref ref-type="bibr" rid="ref27">27</xref>]. Attention, named for its similarity to cognitive attention, enables the sharing of contextual information among word representations without directly encoding their sequence. The transformer used in this work is a version of the Bidirectional Encoder Representations from Transformers (BERT) architecture [<xref ref-type="bibr" rid="ref28">28</xref>]. This architecture consists of an encoder which can be fine-tuned on downstream applications and domains. Specifically, we use Clinical BERT [<xref ref-type="bibr" rid="ref29">29</xref>], which is pretrained on a large corpus of clinical notes from the critical care database Medical Information Mart for Intensive Care (MIMIC) [<xref ref-type="bibr" rid="ref30">30</xref>].</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>In this work, we used both pretrained embeddings of <italic>ICD-9</italic> code diagnostic data and transformer-derived embeddings of clinical notes. This dual approach addresses the limitations of previous studies by incorporating structured <italic>ICD</italic> codes, which allow us to study subtypes of patients with similar <italic>ICD</italic> codes (non-ADRD diagnosis in charts), and unstructured clinical notes, which capture detailed clinical history and manifestations provided by specialists. By combining these 2 modalities, we aimed to enhance the clustering of patient ADRD subtypes.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Cohort Selection Process</title>
        <p>Patients were selected from the Massachusetts General Hospital (MGH) EHR database. The selection criteria included patients who had at least 2 MGH memory clinic visits (either an in-person office visit or a video telemedicine visit) from August 2015 to June 2022, were aged &gt;50 years at their first visit, and had progress notes of substantial length (≥512 characters). These criteria were chosen due to the richness of the notes for the clustering analysis and the high quality of the ADRD diagnosis from specialists. From the identified patient cohort, 2 datasets were extracted as follows: one containing structured diagnostic <italic>ICD</italic> code data from the patients’ entire medical history and another consisting of unstructured clinical notes authored by memory clinic specialists, limited to the most recent visit. We chose only the most recent visit note because it typically consolidates the patient’s prior history, thereby reducing redundancy and providing a focused, up-to-date clinical snapshot. In addition, the dataset was filtered to exclude patients who did not have ADRD diagnoses (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>), as well as those who lacked non-ADRD <italic>ICD</italic> codes (ie, patients who only had ADRD <italic>ICD</italic> codes were excluded).</p>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was approved by the Mass General Brigham Institutional Review Board (protocol 2015P001915), which granted a waiver of informed consent for secondary analysis of electronic health data. No participant compensation was provided. Electronic health data was queried from Epic and securely stored on servers within the Mass General Brigham firewall. Access was restricted to authorized study personnel, in full compliance with institutional privacy and data security policies.</p>
      </sec>
      <sec>
        <title>Embedding Methodology</title>
        <sec>
          <title>ICD Codes</title>
          <p>Before clustering, it was necessary to derive a patient-level representation that encoded information relevant to phenotype in a single vector. While some prior work has relied on one-hot encoding (where categorical data are converted into binary vectors) of clinical data to represent patient phenotype, we leverage existing pretrained embeddings that capture relevant biomedical semantics in their latent representations of clinical concepts. In particular, we use a set of 300-dimensional embeddings for <italic>ICD-9</italic> codes, derived from prior work by Choi et al [<xref ref-type="bibr" rid="ref31">31</xref>].</p>
          <p>For a count-based encoded representation of <italic>m ICD-9</italic> codes across our cohort, <italic>P</italic> <italic>∈</italic> R<sup>3454</sup><italic><sup>×m</sup></italic>, and an embedding matrix, <italic>E∈</italic>R<italic><sup>m×</sup></italic><sup>300</sup>, our design matrix for clustering, <italic>X</italic> <italic>∈</italic> R<sup>3454</sup><italic><sup>×</sup></italic><sup>300</sup>, is given by the following matrix multiplication: <italic>X = P · E.</italic></p>
          <p>This matrix multiplication sums the non-ADRD <italic>ICD</italic> embeddings across a patient record, and the resultant embedding is directly affected by the number of times each code appears in a patient’s history. ADRD codes were dropped from the matrix <italic>P</italic> to not confound clustering based on structured ADRD phenotype. A schematic depicting the <italic>ICD</italic> representation pipeline is provided in <xref rid="figure1" ref-type="fig">Figure 1</xref>A.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Visualization of the clustering pipeline for (A) International Classification of Diseases (ICD) codes and (B) notes. For each subfigure, the workflow goes from left to right. BERT: Bidirectional Encoder Representations from Transformers.</p>
            </caption>
            <graphic xlink:href="aging_v8i1e65178_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Clinical Notes</title>
          <p>Clinical notes were encoded using Clinical BERT before clustering. To derive patient-level representations of clinic notes, several preprocessing steps were undertaken. First, unwanted delimiter characters were stripped from patient notes, and notes were chunked into contiguous sections of up to 1024 characters. This resulted in a distribution of token numbers of ∼200 to 300 per note following BERT’s WordPiece encoding of input sequences. After passing through the transformer encoding, we took the final layer representation averaged over the 12 attention heads, such that each note was represented by a matrix of dimension (768, n), corresponding to each of the n input tokens having a 768-dimensional contextual vector representing it. Following this encoding, the representation was averaged over the token dimension to arrive at a single 768-dimensional vector for the whole note. This was explored using both simple averaging (arithmetic mean) over the token dimension, as well as attention-weighted averaging based on row-wise entropy of the final layer attention matrix. Attention-weighted averaging was used in patient representations due to the resultant lower inertia and increased silhouette score on average. A schematic depicting the note representation pipeline is provided in <xref rid="figure1" ref-type="fig">Figure 1</xref>B.</p>
        </sec>
      </sec>
      <sec>
        <title>Attention-Weighted Averaging</title>
        <p>For a given input sequence of length <italic>n</italic>, the final layer representation in a transformer model has an associated self-attention matrix, <italic>A</italic> <italic>∈</italic> R<italic><sup>n×</sup></italic><sup>n</sup>. For BERT-based models, <italic>n</italic> is <italic>≤</italic>512 due to the constraint on the length of the context window. To provide weights for averaging the embedding, <italic>E</italic> <italic>∈</italic> R<sup>768</sup><italic><sup>×n</sup></italic>, over the token dimension, we compute the row-wise differential entropy of the attention matrix, given in equation (1). Differential entropy is the continuous analog of Shannon entropy, which is usually only defined for discrete random variables [<xref ref-type="bibr" rid="ref32">32</xref>]. In particular, the method described in Ebrahimi et al [<xref ref-type="bibr" rid="ref33">33</xref>] is used to approximate the differential entropy, implemented in the Python (Python Software Foundation) library <italic>SciPy version 1.7.3</italic> [<xref ref-type="bibr" rid="ref34">34</xref>], as the closed-form expression for the attention distribution for a given row <italic>f</italic> (<italic>x</italic>) is not known analytically from the values of attention sampled. The differential entropy for a row <italic>i</italic> is given by</p>
        <disp-formula>
          <graphic xlink:href="aging_v8i1e65178_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          
        </disp-formula>
        <p>and the corresponding vector <italic>h</italic> <italic>∈</italic> R<italic><sup>n×</sup></italic><sup>1</sup> corresponds to the entropy across every row. From the row-wise entropy, this vector is softmaxed to obtain the corresponding weights, <italic>w ∈</italic> R<italic><sup>n×</sup></italic><sup>1</sup>, as follows:</p>
        <disp-formula>
          <graphic xlink:href="aging_v8i1e65178_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          
        </disp-formula>
        <p>The resultant embedding for a note sequence, <italic>N</italic> <italic>∈</italic> R<sup>768</sup><italic><sup>×1</sup></italic>, is then given by the matrix multiplication as follows:</p>
        <disp-formula>
          <graphic xlink:href="aging_v8i1e65178_fig9.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          
        </disp-formula>
        <p>and the final patient-level representation is the simple average over all note fragments for a given patient, for their most recent encounter. A visualization of attention matrices with varying row-wise entropy and thus varying weighting per token is provided in Figures S1 and S2 in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
      </sec>
      <sec>
        <title>Hierarchical Clustering</title>
        <p>Clustering analysis was performed on <italic>ICD-9</italic> embeddings and clinical text representations to identify ADRD subtypes. We selected hierarchical agglomerative clustering with Ward linkage due to its ability to capture the hierarchical structure of clinical data, as seen in <italic>ICD-9</italic> codes (eg, metabolic disorders branching into type 1 and type 2 diabetes) and clinical notes (eg, cognitive impairment branching into memory loss and aphasia). Cluster quality was evaluated using elbow plots and silhouette scores, with implementation via <italic>Scikit-learn v1.0.1</italic> [<xref ref-type="bibr" rid="ref35">35</xref>].</p>
      </sec>
      <sec>
        <title>Optimal Transport</title>
        <p>To address provider-specific effects in embeddings of clinical notes, we first applied Uniform Manifold Approximation and Projection (UMAP) to reduce the dimensionality of the data and then applied the earth mover distance transport approach using the Python <italic>Optimal Transport</italic> package [<xref ref-type="bibr" rid="ref36">36</xref>]. <italic>Optimal Transport</italic> provides a mathematical framework to minimize the cost of transforming one distribution into another, which can address the problem of domain adaptation [<xref ref-type="bibr" rid="ref37">37</xref>]. Domain adaptation involves adjusting data from different sources to make their data distributions more comparable, ensuring that models trained on these data perform well across various settings. In this context, the earth mover distance method was used to align the embeddings from various providers to a standard reference. This alignment ensured that the subsequent clustering analysis was less skewed by provider-related differences, allowing a more accurate interpretation of the underlying phenotypic variation.</p>
      </sec>
      <sec>
        <title>Enrichment Analysis: ICD Clusters</title>
        <p><italic>ICD</italic> clusters were phenotypically characterized by testing for enrichment of <italic>ICD-9</italic> codes within each cluster. For each cluster, a 2×2 contingency table was generated for each <italic>ICD-9</italic> diagnosis code, comparing counts of patients with that code within cluster to counts of patients with that same code in other clusters. A chi-square test for enrichment was performed; the prevalence ratio (PR), calculated as the prevalence of each code in one cluster divided by its prevalence in the rest, was calculated to measure the strength of the association. A Bonferroni correction was applied to the resultant <italic>P</italic> values to correct for multiple comparisons, and <italic>ICD</italic> codes in each cluster were ranked by corrected <italic>P</italic> value to characterize the most significant enrichments. All <italic>P</italic> values in this investigation were two-sided, with a postcorrected α of 0.05 to determine significance. The top-10 significant diagnoses with the highest PR were extracted from each cluster for interpretation. If a cluster lacked significant diagnoses, the top diagnoses with the highest PR among the nonsignificant ones were selected. The enrichment analyses were conducted in Python version 3.8.15.</p>
      </sec>
      <sec>
        <title>Topic Modeling: Note Clusters</title>
        <p>We used BERTopic [<xref ref-type="bibr" rid="ref38">38</xref>], using the Python package <italic>BERTopic</italic> v0.16.0, to identify representative topics and key terms within each note cluster. Embeddings obtained through optimal transport were directly used for clustering and topic assignment, bypassing the need for additional embedding and dimensionality reduction steps. Before conducting cluster-based term frequency–inverse document frequency (TF-IDF) for topic assignment, the clinical text was preprocessed using a vectorizer to remove stop words and exclude common terms that appeared too frequently across most notes. Furthermore, to fine-tune and enhance the word representation of topics, we applied the KeyBERTInspired model, which extracts keywords by leveraging embeddings and cosine similarity to find the words with the closest semantic relationship to the note texts, thereby making them more representative of the topics. Following the extraction of representative terms within each cluster, we used GPT-4 (OpenAI) [<xref ref-type="bibr" rid="ref39">39</xref>], a state-of-the-art large language model (LLM), to enhance interpretability. GPT-4 summarized the representative words provided by BERTopic into coherent themes with greater clinical significance, such as specific medical conditions, treatments, and medications. The PR, calculated as the prevalence of each word in one cluster divided by its prevalence in the rest, was calculated to measure the strength of the semantic relationship. The BERTopic modeling and analyses were conducted in Python version 3.9.6.</p>
      </sec>
      <sec>
        <title>ADRD Diagnosis Categorization</title>
        <p>The categorization of ADRD diagnoses was conducted using an extensive list of diagnostic names based on disease etiology. This list was meticulously reviewed for each unique diagnosis name recorded for the MGH memory clinic patients in the EHR system. The ADRD diagnoses categories included AD; dementia unspecified; FTD; LBD; vascular cognitive impairment (VCI); and others, such as posterior cortical atrophy (PCA), progressive supranuclear palsy, corticobasal degeneration, and primary progressive aphasia. An expert behavioral neurologist (JRD) provided critical input during this process, helping to develop a comprehensive mapping list that correlates specific diagnosis names with their corresponding ADRD categories. The application of this mapping to the data was performed using R version 4.3.2 (R Foundation for Statistical Computing). The full list of diagnosis names corresponding to ADRD diagnosis categories is provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
      </sec>
      <sec>
        <title>Cluster Characterizations</title>
        <p>To assess associations between clusters and sex, as well as ADRD diagnoses, we used the chi-square test. For each cluster, a 2×2 contingency table was generated for each variable, comparing the counts of patients with the characteristic within the cluster to those in other clusters. The PR, defined as the prevalence of a characteristic in one cluster divided by its prevalence in the remaining clusters, was calculated to measure the strength of the association: 1 indicates no difference in prevalence between the 2 groups, &gt;1 indicates higher prevalence in the first group, and &lt;1 indicates lower prevalence in the first group. In addition, to examine variations in the age of onset across clusters, we initially conducted a Kruskal-Wallis Rank Sum Test using the <italic>stats</italic> package from R. <italic>η</italic><sup>2</sup> (calculated by subtracting the number of groups from the Kruskal-Wallis H statistic plus one, and then dividing this result by the total number of observations minus the number of groups) based on the H statistic was reported as the effect size: values closer to 0 indicate a smaller effect and values closer to 1 indicate a larger effect. Following significant findings, further post hoc analyses using the Dunn test were performed to delineate differences between groups. The <italic>P</italic> values were adjusted for multiple comparisons using the Benjamini-Hochberg method to control the false discovery rate (FDR). Age-of-onset data were rigorously annotated by human experts reviewing clinical notes; where notes did not specify an exact age of onset, the age at the first clinical visit within the memory clinic was used as an approximation. Finally, we conducted a chi-square test between <italic>ICD</italic> clusters and note clusters to test whether patient cluster assignment was consistent across note and <italic>ICD</italic> representations. If the contingency table was larger than 2×2, Cramér V (calculated as the square root of the chi-square statistic divided by the product of the sample size and the minimum dimension minus one) was reported as the effect size: 0 indicates no association and 1 indicates a strong association. Standardized residuals (standardized differences between the observed count and the expected count) were reported for each cell: values close to 0 indicate the observed count is close to the expected count, positive values indicate the observed count is higher than expected, and negative values indicate the observed count is lower than expected. All statistical analyses were conducted in R version 4.3.2.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Study Population</title>
        <p>Our final study population consisted of 3454 patients from the MGH tertiary care memory clinic with clinical notes and <italic>ICD</italic> codes in the EHR system. The average age of onset for patients was 72.1 (SD 9.5) years, with 1678 (48.58%) being female. The majority were White (n=3059, 88.56%), followed by Asian (n=90, 2.61%), Black or African American (n=77, 2.23%), American Indian or Alaska Native (n=4, 0.12%), and Native Hawaiian or Other Pacific Islander (n=1, 0.03%). In addition, 103 (2.98%) identified as belonging to other races, and race data were not available for 120 (3.47%) patients. Regarding ethnicity, 3020 (87.43%) identified as non-Hispanic, 106 (3.07%) as Hispanic, and ethnicity data were not available for 328 (9.5%) patients. AD was the most prevalent diagnosis, affecting 1317 (38.13%) patients, followed by dementia unspecified, which accounted for 1101 (31.88%) patients. Each encounter recorded only one diagnosis name, and only the most recent encounter was used. The patient selection details are illustrated in <xref rid="figure2" ref-type="fig">Figure 2</xref>. The demographic and ADRD diagnosis breakdowns are provided in <xref ref-type="table" rid="table1">Table 1</xref> and ADRD categorization details are provided in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>CONSORT (Consolidated Standards of Reporting Trials) diagram illustrating the selection of patients from the Massachusetts General Hospital (MGH) electronic health record (EHR) system. ADRD: Alzheimer disease and related dementias; Dx: diagnosis; ICD: International Classification of Diseases.</p>
          </caption>
          <graphic xlink:href="aging_v8i1e65178_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>Summary statistics of the final study population.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="190"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="130"/>
            <col width="0"/>
            <col width="110"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="100"/>
            <col width="0"/>
            <col width="100"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Characteristics</td>
                <td colspan="2">Total (N=3454)</td>
                <td colspan="2">AD<sup>a</sup> (n=1317)</td>
                <td colspan="2">Dementia unspecified (n=1101)</td>
                <td colspan="2">FTD<sup>b</sup> (n=190)</td>
                <td colspan="2">LBD<sup>c</sup> (n=261)</td>
                <td colspan="2">VCI<sup>d</sup> (n=96)</td>
                <td>Other<sup>e</sup> (n=489)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Age of onset<sup>f</sup> (y), mean (SD)</td>
                <td colspan="2">72.1 (9.5)</td>
                <td colspan="2">74.6 (7.8)</td>
                <td colspan="2">73.3 (9.7)</td>
                <td colspan="2">63.8 (8.2)</td>
                <td colspan="2">71.4 (7.7)</td>
                <td colspan="2">76 (7.7)</td>
                <td>65.1 (9.4)</td>
              </tr>
              <tr valign="top">
                <td colspan="16">
                  <bold>Sex, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">1678 (48.58)</td>
                <td colspan="2">717 (54.44)</td>
                <td colspan="2">538 (48.86)</td>
                <td colspan="2">78 (41.1)</td>
                <td colspan="2">64 (24.5)</td>
                <td colspan="2">41 (43)</td>
                <td colspan="2">240 (49.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">1776 (51.42)</td>
                <td colspan="2">600 (45.56)</td>
                <td colspan="2">563 (51.14)</td>
                <td colspan="2">112 (58.9)</td>
                <td colspan="2">197 (75.5)</td>
                <td colspan="2">55 (57)</td>
                <td colspan="2">249 (50.9)</td>
              </tr>
              <tr valign="top">
                <td colspan="16">
                  <bold>Race, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td colspan="2">3059 (88.56)</td>
                <td colspan="2">1149 (87.24)</td>
                <td colspan="2">988 (89.74)</td>
                <td colspan="2">168 (88.4)</td>
                <td colspan="2">227 (87.0)</td>
                <td colspan="2">80 (83)</td>
                <td colspan="2">447 (91.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Black or African American</td>
                <td colspan="2">77 (2.23)</td>
                <td colspan="2">27 (2.05)</td>
                <td colspan="2">22 (2.00)</td>
                <td colspan="2">6 (3.2)</td>
                <td colspan="2">4 (1.5)</td>
                <td colspan="2">9 (9)</td>
                <td colspan="2">9 (1.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td colspan="2">90 (2.61)</td>
                <td colspan="2">34 (2.58)</td>
                <td colspan="2">31 (2.82)</td>
                <td colspan="2">6 (3.2)</td>
                <td colspan="2">14 (5.4)</td>
                <td colspan="2">1 (1)</td>
                <td colspan="2">4 (0.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>American Indian or Alaska Native</td>
                <td colspan="2">4 (0.12)</td>
                <td colspan="2">2 (0.15)</td>
                <td colspan="2">1 (0.09)</td>
                <td colspan="2">0 (0.0)</td>
                <td colspan="2">0 (0.0)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">1 (0.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Native Hawaiian or Other Pacific Islander</td>
                <td colspan="2">1 (0.03)</td>
                <td colspan="2">1 (0.08)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">0 (0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td colspan="2">103 (2.98)</td>
                <td colspan="2">52 (3.95)</td>
                <td colspan="2">32 (2.91)</td>
                <td colspan="2">2 (1.1)</td>
                <td colspan="2">2 (0.8)</td>
                <td colspan="2">3 (3)</td>
                <td colspan="2">12 (2.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unavailable</td>
                <td colspan="2">120 (3.47)</td>
                <td colspan="2">52 (3.95)</td>
                <td colspan="2">27 (2.45)</td>
                <td colspan="2">8 (4.2)</td>
                <td colspan="2">14 (5.4)</td>
                <td colspan="2">3 (3)</td>
                <td colspan="2">16 (3.3)</td>
              </tr>
              <tr valign="top">
                <td colspan="16">
                  <bold>Ethnicity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Not Hispanic or Latino</td>
                <td colspan="2">3020 (87.43)</td>
                <td colspan="2">1133 (86.03)</td>
                <td colspan="2">987 (89.65)</td>
                <td colspan="2">161 (84.7)</td>
                <td colspan="2">228 (87.4)</td>
                <td colspan="2">83 (87)</td>
                <td colspan="2">428 (87.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic or Latino</td>
                <td colspan="2">106 (3.07)</td>
                <td colspan="2">53 (4.02)</td>
                <td colspan="2">37 (3.36)</td>
                <td colspan="2">2 (1.1)</td>
                <td colspan="2">3 (1.1)</td>
                <td colspan="2">3 (3)</td>
                <td colspan="2">8 (1.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unavailable</td>
                <td colspan="2">328 (9.50)</td>
                <td colspan="2">131 (9.95)</td>
                <td colspan="2">77 (6.99)</td>
                <td colspan="2">27 (14.2)</td>
                <td colspan="2">30 (11.5)</td>
                <td colspan="2">10 (10)</td>
                <td colspan="2">53 (10.8)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table1fn1">
              <p><sup>a</sup>AD: Alzheimer disease.</p>
            </fn>
            <fn id="table1fn2">
              <p><sup>b</sup>FTD: frontotemporal dementia.</p>
            </fn>
            <fn id="table1fn3">
              <p><sup>c</sup>LBD: Lewy body dementia.</p>
            </fn>
            <fn id="table1fn4">
              <p><sup>d</sup>VCI: vascular cognitive impairment.</p>
            </fn>
            <fn id="table1fn5">
              <p><sup>e</sup>Includes posterior cortical atrophy, progressive supranuclear palsy, corticobasal degeneration, and primary progressive aphasia.</p>
            </fn>
            <fn id="table1fn6">
              <p><sup>f</sup>Age of onset was manually annotated by experts viewing clinical notes; for notes without age of onset, we approximated with the age of first encounter.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>ICD Clustering</title>
        <p>To investigate the clinical heterogeneity within ADRD, we clustered the embeddings of non-ADRD <italic>ICD</italic> codes assigned to this tertiary care sample from the MGH ADRD cohort. We hypothesized that this approach would reveal distinct clinical subtypes based on clinical comorbidities, which were associated with demographics (ie, age of onset and sex). The hierarchical agglomerative clustering method revealed 3 distinct clusters in the embeddings of non-ADRD <italic>ICD</italic> codes, as determined by the silhouette score. <xref rid="figure3" ref-type="fig">Figure 3</xref>A depicts a heatmap of enriched <italic>ICD</italic> codes across each cluster, and a 2D UMAP projection of these <italic>ICD</italic> code embeddings, colored by cluster, is displayed in <xref rid="figure4" ref-type="fig">Figure 4</xref>A. The distribution of patients across the clusters was as follows: cluster 1 included 1501 (43.46%) patients, cluster 2 included 1597 (46.24%) patients, and cluster 3 included 356 (10.31%) patients. Detailed summary statistics for these clusters are presented in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
        <fig id="figure3" position="float">
          <label>Figure 3</label>
          <caption>
            <p>Heatmap of enrichment in International Classification of Diseases (ICD) clusters and topics in note clusters. (A) This heatmap displays the enrichment of ICD-9 codes across ICD embedding clusters. Cluster 1 is primarily dominated by skin-related and certain cardiovascular conditions. Cluster 2 is marked by its exclusive and high prevalence ratios (PR) in psychiatric and behavioral conditions. Cluster 3 shows a diverse set of conditions with a significant prevalence of respiratory, pain-related, and complicated diabetic mellitus. (B) This heatmap displays representative words for each note cluster identified through topic modeling. Cluster 1 is primarily dominated by psychiatric manifestations and medications. Cluster 2 highlights cardiovascular, motor, and sensory issues. Cluster 3 covers a variety of symptoms and conditions, including autoimmune issues, behavioral and movement disorders, sleep disturbances, etc. In both (A) and (B), the color intensity of each code or word-cluster pairing reflects the PR (prevalence of code or word in observed group divided by prevalence in other groups) associated with that code or word. Words colored as exclusive were only present in one cluster.</p>
          </caption>
          <graphic xlink:href="aging_v8i1e65178_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure4" position="float">
          <label>Figure 4</label>
          <caption>
            <p>Clustering of International Classification of Diseases (ICD) embeddings and their demographic and diagnostic associations. (A) Uniform Manifold Approximation and Projection (UMAP) visualization of ICD embeddings were characterized by 3 clusters: cluster 1 includes 1501 (43.5%) patients, cluster 2 comprises 1597 (46.2%) patients, and cluster 3 contains 356 (10.3%) patients. (B) Bar plot showing prevalence for sex by cluster, significance based on a chi-square test. Notably, cluster 3 has a significantly higher proportion of female participants compared to male participants (P<sub>FDR</sub>=.009). (C) Violin plot illustrating the distribution of age of onset across clusters. Each violin plot shows the kernel density estimate of the data, with the center line representing the median age of onset. Box plot elements are overlaid, where the box limits indicate the upper and lower quartiles, and the whiskers extend to 1.5 times the IQR. Individual points are hidden for clarity. Significant differences are observed, with cluster 2 showing the earliest average age of onset at 69.8 (SD 9.6) years, and cluster 3 the latest at 75.5 (SD 8.1) years (<italic>P</italic>&lt;.001). (D) Heatmap showing prevalence ratio for Alzheimer disease and related dementias (ADRD) diagnoses across clusters, significance derived from a chi-squared test. Clinical diagnoses include Alzheimer disease (AD); dementia unspecified; frontotemporal dementia (FTD); Lewy body dementia (LBD); vascular cognitive impairment (VCI); and others such as posterior cortical atrophy (PCA), progressive supranuclear palsy (PSP), corticobasal degeneration (CBD), and primary progressive aphasia (PPA). Significant distribution variations are evident across clusters. The circle size, color, and number indicate the magnitude of the prevalence ratio. Blue indicates underrepresentation while red indicates overrepresentation. <italic>P</italic> values were corrected with false discovery rate adjustments.</p>
          </caption>
          <graphic xlink:href="aging_v8i1e65178_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <p>We examined differences in non-ADRD <italic>ICD</italic> code frequency across patient <italic>ICD</italic> embedding clusters (<xref rid="figure3" ref-type="fig">Figure 3</xref>A). In cluster 1, diagnoses, such as seborrheic keratoses (<italic>χ</italic><sup>2</sup><sub>1</sub>=243.15; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=3.32), actinic keratosis (<italic>χ</italic><sup>2</sup><sub>1</sub>=236.53; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=3.91), pure hypercholesterolemia (<italic>χ</italic><sup>2</sup><sub>1</sub>=199.13; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=2.71), history of basal cell cancer (<italic>χ</italic><sup>2</sup><sub>1</sub>=196.22; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=4.45), and nevus (<italic>χ</italic><sup>2</sup><sub>1</sub>=184.53; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=4.23), show notably high PRs. These diagnoses largely fall into skin-related disorders (such as various types of skin cancer and keratoses). Cluster 2 appears to be unique, with top PRs noted only for clinical signs, such as disinhibition behavior (<italic>χ</italic><sup>2</sup><sub>1</sub>=1.14; <italic>P</italic><sub>FDR</sub>=.99; PR=4.65), alexia (<italic>χ</italic><sup>2</sup><sub>1</sub>=0.426; <italic>P</italic><sub>FDR</sub>=.99; PR=3.49), and orofacial dyskinesia (<italic>χ</italic><sup>2</sup><sub>1</sub>=0.017; <italic>P</italic><sub>FDR</sub>=.99; PR=2.33), suggesting behavioral and psychiatric manifestations which are consistent with the FTD enrichment and earlier onset noted above. Notably, although these diagnoses did not reach significance in cluster 2, they were absent in the other clusters. Moreover, many diagnoses in cluster 2 were marked with a lack of PR, indicating a lower relevance of these diagnoses compared to clusters 1 or 3. Cluster 3 exhibited significant increases in diagnoses from a variety of categories, including respiratory issues (eg, cough: <italic>χ</italic><sup>2</sup><sub>1</sub>=339.47; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=3.77 and shortness of breath: <italic>χ</italic><sup>2</sup><sub>1</sub>=306.60; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=6.03), chronic pain (<italic>χ</italic><sup>2</sup><sub>1</sub>=460.55; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=4.80), musculoskeletal problems (eg, bilateral low back pain without sciatica: <italic>χ</italic><sup>2</sup><sub>1</sub>=456.91; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=4.80 and foot pain: <italic>χ</italic><sup>2</sup><sub>1</sub>=372.91; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=3.86), and complications of diabetes mellitus. Notably, diabetes mellitus (type 2 with autonomic neuropathy: <italic>χ</italic><sup>2</sup><sub>1</sub>=322.98; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=11.60 and insulin-dependent diabetes: <italic>χ</italic><sup>2</sup><sub>1</sub>=308.96; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=11.30) had exceptionally high PRs, suggesting a very strong association with these severe diabetes conditions in cluster 3.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Summary statistics of International Classification of Diseases clusters.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="0"/>
            <col width="370"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Characteristics</td>
                <td>Total (N=3454)</td>
                <td>Cluster 1 (n=1501)</td>
                <td>Cluster 2 (n=1597)</td>
                <td>Cluster 3 (n=356)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Age of onset<sup>a</sup> (y), mean (SD)</td>
                <td>72.1 (9.5)</td>
                <td>73.6 (9.1)</td>
                <td>69.8 (9.6)</td>
                <td>75.5 (8.1)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Sex, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Female</td>
                <td>1678 (48.58)</td>
                <td>709 (47.24)</td>
                <td>769 (48.15)</td>
                <td>200 (56.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Male</td>
                <td>1776 (51.42)</td>
                <td>792 (52.76)</td>
                <td>828 (51.85)</td>
                <td>156 (43.8)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Race, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">White</td>
                <td>3059 (88.56)</td>
                <td>1335 (88.94)</td>
                <td>1421 (88.98)</td>
                <td>303 (85.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Black or African American</td>
                <td>77 (2.23)</td>
                <td>37 (2.47)</td>
                <td>25 (1.57)</td>
                <td>15 (4.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Asian</td>
                <td>90 (2.61)</td>
                <td>40 (2.66)</td>
                <td>40 (2.5)</td>
                <td>10 (2.8)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">American Indian or Alaska Native</td>
                <td>4 (0.12)</td>
                <td>0 (0)</td>
                <td>2 (0.13)</td>
                <td>2 (0.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Native Hawaiian or Other Pacific Islander</td>
                <td>1 (0.03)</td>
                <td>0 (0)</td>
                <td>1 (0.06)</td>
                <td>0 (0)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Other</td>
                <td>103 (2.98)</td>
                <td>51 (3.4)</td>
                <td>34 (2.13)</td>
                <td>18 (5.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Unavailable</td>
                <td>120 (3.47)</td>
                <td>38 (2.53)</td>
                <td>74 (4.63)</td>
                <td>8 (2.2)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>Ethnicity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Not Hispanic or Latino</td>
                <td>3020 (87.43)</td>
                <td>1358 (90.47)</td>
                <td>1326 (83.03)</td>
                <td>336 (94.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Hispanic or Latino</td>
                <td>106 (3.07)</td>
                <td>45 (3)</td>
                <td>42 (2.63)</td>
                <td>19 (5.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Unavailable</td>
                <td>328 (9.5)</td>
                <td>98 (6.53)</td>
                <td>229 (14.34)</td>
                <td>1 (0.3)</td>
              </tr>
              <tr valign="top">
                <td colspan="7">
                  <bold>ADRD Dx<sup>b</sup>, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">AD<sup>c</sup></td>
                <td>1317 (38.13)</td>
                <td>584 (38.91)</td>
                <td>636 (39.82)</td>
                <td>97 (27.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Dementia unspecified</td>
                <td>1101 (31.88)</td>
                <td>540 (35.98)</td>
                <td>388 (24.3)</td>
                <td>173 (48.6)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">FTD<sup>d</sup></td>
                <td>190 (5.5)</td>
                <td>64 (4.26)</td>
                <td>121 (7.58)</td>
                <td>5 (1.4)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">LBD<sup>e</sup></td>
                <td>261 (7.56)</td>
                <td>111 (7.4)</td>
                <td>127 (7.95)</td>
                <td>23 (6.5)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">
                  <break/>
                </td>
                <td>VCI<sup>f</sup></td>
                <td>96 (2.78)</td>
                <td>44 (2.93)</td>
                <td>33 (2.07)</td>
                <td>19 (5.3)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="2">Other<sup>g</sup></td>
                <td>489 (14.16)</td>
                <td>158 (10.53)</td>
                <td>292 (18.28)</td>
                <td>39 (11)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table2fn1">
              <p><sup>a</sup>Age of onset was manually annotated by experts viewing clinical notes; for notes without age of onset, we approximated with the age of first encounter.</p>
            </fn>
            <fn id="table2fn2">
              <p><sup>b</sup>Dx: diagnosis.</p>
            </fn>
            <fn id="table2fn3">
              <p><sup>c</sup>AD: Alzheimer disease.</p>
            </fn>
            <fn id="table2fn4">
              <p><sup>d</sup>FTD: frontotemporal dementia.</p>
            </fn>
            <fn id="table2fn5">
              <p><sup>e</sup>LBD: Lewy body dementia.</p>
            </fn>
            <fn id="table2fn6">
              <p><sup>f</sup>VCI: vascular cognitive impairment.</p>
            </fn>
            <fn id="table2fn7">
              <p><sup>g</sup>Includes posterior cortical atrophy, progressive supranuclear palsy, corticobasal degeneration, and primary progressive aphasia.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>Furthermore, statistical analyses revealed significant associations between ICD cluster membership, demographic variables, and diagnostic categories. Cluster 3 had an overrepresentation of female participants relative to clusters 1 and 2 (<italic>χ</italic><sup>2</sup><sub>1</sub>=8.8; <italic>P</italic><sub>FDR</sub>=.009; PR=1.178); however, clusters 1 and 2 showed no significant differences in sex distribution (cluster 1: <italic>χ</italic><sup>2</sup><sub>1</sub>=1.8; <italic>P</italic><sub>FDR</sub>=.26 and cluster 2: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.2; <italic>P</italic><sub>FDR</sub>=.66; <xref rid="figure4" ref-type="fig">Figure 4</xref>B). In addition, the age of onset varied significantly among the ICD clusters (Kruskal-Wallis <italic>χ</italic><sup>2</sup><sub>2</sub>=182.6; <italic>P</italic><sub>FDR</sub>&lt;.001, <italic>η</italic><sup>2</sup>=0.052). Cluster 2, with a mean age of onset of 69.8 (SD 9.6) years, had a significantly earlier age of onset compared with clusters 1 (<italic>Z</italic>=10.13; <italic>P</italic><sub>FDR</sub>&lt;.001) and 3 (<italic>Z</italic>=−8.83; <italic>P</italic><sub>FDR</sub>&lt;.001). Moreover, cluster 1 (mean 73.6, SD 9.1 years) had an earlier onset than cluster 3 (mean 75.5, SD 8.1 years; <italic>Z</italic>=−2.61; <italic>P</italic><sub>FDR</sub>=.009; <xref rid="figure4" ref-type="fig">Figure 4</xref>C). Cluster 1 was significantly enriched by dementia unspecified (<italic>χ</italic><sup>2</sup><sub>1</sub>=20.2; 𝑃<sub>FDR</sub>&lt;.001; PR<italic>=</italic>1.252); cluster 2 was significantly enriched by FTD (<italic>χ</italic><sup>2</sup><sub>1</sub>=23.9; 𝑃<sub>FDR</sub>&lt;.001; PR<italic>=</italic>2.039) and other rare ADRDs (<italic>χ</italic><sup>2</sup><sub>1</sub>=41; 𝑃<sub>FDR</sub> &lt;.001; PR<italic>=</italic>1.724); and cluster 3 was significantly enriched by VCI (<italic>χ</italic><sup>2</sup><sub>1</sub>=8.6; 𝑃<sub>FDR</sub>=.007; PR<italic>=</italic>2.147) and dementia unspecified (<italic>χ</italic><sup>2</sup><sub>1</sub>=50.2; 𝑃<sub>FDR</sub>&lt;.001; PR<italic>=</italic>1.622). In contrast, no cluster was significantly enriched by AD, though AD was significantly underrepresented in cluster 3 (cluster 1: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.6; 𝑃<sub>FDR</sub>=.53; cluster 2: <italic>χ</italic><sup>2</sup><sub>1</sub>=3.5; 𝑃<sub>FDR</sub>=.09; and cluster 3: <italic>χ</italic><sup>2</sup><sub>1</sub>=19.4; 𝑃<sub>FDR</sub>&lt;.001; <xref rid="figure4" ref-type="fig">Figure 4</xref>D) or LBD (cluster 1: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.1; 𝑃<sub>FDR</sub>=.80; cluster 2: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.5; 𝑃<sub>FDR</sub>=.53; and cluster 3: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.5; 𝑃<sub>FDR</sub>=.53; <xref rid="figure4" ref-type="fig">Figure 4</xref>D). Additional visualizations of the UMAP projections colored by sex, age of onset, and ADRD diagnoses are available in Figures S3A, S3B, and S3C, respectively, in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
      </sec>
      <sec>
        <title>Note Clustering</title>
        <p>Initially, a provider effect was detected in the UMAP projection of note embeddings from the latest clinical notes of 3454 patients (Figure S4A in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). To address this, we used an optimal transport method, aligning the embeddings from all providers to the 2D embedding of a selected reference provider (Figure S4B in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>). Following this alignment, hierarchical agglomerative clustering was applied to the adjusted note embeddings, revealing 3 distinct clusters, as determined by the silhouette score. The adjusted UMAP projection, color coded by cluster, is presented in <xref rid="figure5" ref-type="fig">Figure 5</xref>A. The patient distribution within these clusters was as follows: cluster 1 included 1280 (37.06%) patients, cluster 2 included 1161 (33.61%) patients, and cluster 3 included 1013 (29.33%) patients. Detailed summary statistics for each cluster are outlined in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
        <fig id="figure5" position="float">
          <label>Figure 5</label>
          <caption>
            <p>Clustering of note embeddings and their demographic and Alzheimer disease and related dementias (ADRD) diagnosis associations. (A) Uniform Manifold Approximation and Projection (UMAP) visualization of note embeddings characterized by 3 clusters: cluster 1 includes 1280 (37.1%) patients, cluster 2 includes 1161 (33.6%) patients, and cluster 3 includes 1013 (29.3%) patients. (B) Bar plot showing prevalence for sex by cluster, with significance based on chi-square tests. Notably, cluster 1 and cluster 3 were both enriched by female participants (<italic>P</italic>&lt;.001) while cluster 2 was enriched by male participants (<italic>P</italic>&lt;.001). (C) Violin plot illustrating the distribution of age of onset across clusters. Each violin plot shows the kernel density estimate of the data, with the center line representing the median age of onset. Box plot elements are overlaid, where the box limits indicate the upper and lower quartiles, and the whiskers extend to 1.5 times the IQR. Individual points are hidden for clarity. Significant differences are observed, with cluster 2 showing the latest average age of onset at 72.8 (SD 9.2) years, and cluster 1 the earliest at 71.5 (SD 9.3) years (<italic>P</italic>&lt;.001). (D) Heatmap showing prevalence ratio for ADRD diagnoses across clusters, with significance derived from a chi-square test. Diagnoses include Alzheimer disease (AD); dementia unspecified; frontotemporal dementia (FTD); Lewy body dementia (LBD); vascular cognitive impairment (VCI); and others such as posterior cortical atrophy (PCA), progressive supranuclear palsy (PSP), corticobasal degeneration (CBD), and primary progressive aphasia (PPA). No significant distribution variations are observed across clusters (<italic>P</italic>&gt;.05). The circle size, color, and number indicate the magnitude of the prevalence ratio. Blue indicates underrepresentation while red indicates overrepresentation. <italic>P</italic> values were corrected with false discovery rate (FDR) adjustments.</p>
          </caption>
          <graphic xlink:href="aging_v8i1e65178_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Summary statistics of note clusters.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="370"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="150"/>
            <col width="0"/>
            <col width="150"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Characteristics</td>
                <td colspan="2">Total (N=3454)</td>
                <td colspan="2">Cluster 1 (n=1280)</td>
                <td colspan="2">Cluster 2 (n=1161)</td>
                <td>Cluster 3 (n=1013)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="3">Age of onset<sup>a</sup> (y), mean (SD)</td>
                <td colspan="2">72.1 (9.5)</td>
                <td colspan="2">71.5 (9.3)</td>
                <td colspan="2">72.8 (9.2)</td>
                <td>71.9 (9.8)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Sex, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td colspan="2">1678 (48.58)</td>
                <td colspan="2">812 (63.44)</td>
                <td colspan="2">327 (28.17)</td>
                <td colspan="2">539 (53.21)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td colspan="2">1776 (51.42)</td>
                <td colspan="2">468 (36.56)</td>
                <td colspan="2">834 (71.83)</td>
                <td colspan="2">474 (46.79)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Race, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>White</td>
                <td colspan="2">3059 (88.56)</td>
                <td colspan="2">1129 (88.20)</td>
                <td colspan="2">1032 (88.89)</td>
                <td colspan="2">898 (88.56)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Black or African American</td>
                <td colspan="2">77 (2.23)</td>
                <td colspan="2">30 (2.34)</td>
                <td colspan="2">26 (2.24)</td>
                <td colspan="2">21 (2.07)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Asian</td>
                <td colspan="2">90 (2.61)</td>
                <td colspan="2">36 (2.81)</td>
                <td colspan="2">25 (2.15)</td>
                <td colspan="2">29 (2.86)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>American Indian or Alaska Native</td>
                <td colspan="2">4 (0.12)</td>
                <td colspan="2">1 (0.08)</td>
                <td colspan="2">1 (0.09)</td>
                <td colspan="2">2 (0.2)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Native Hawaiian or Other Pacific Islander</td>
                <td colspan="2">1 (0.03)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">0 (0)</td>
                <td colspan="2">1 (0.1)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other</td>
                <td colspan="2">103 (2.98)</td>
                <td colspan="2">34 (2.66)</td>
                <td colspan="2">44 (3.79)</td>
                <td colspan="2">25 (2.47)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unavailable</td>
                <td colspan="2">120 (3.47)</td>
                <td colspan="2">50 (3.91)</td>
                <td colspan="2">33 (2.84)</td>
                <td colspan="2">37 (3.65)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>Ethnicity, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Not Hispanic or Latino</td>
                <td colspan="2">3020 (87.43)</td>
                <td colspan="2">1128 (88.13)</td>
                <td colspan="2">1004 (86.48)</td>
                <td colspan="2">888 (87.66)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Hispanic or Latino</td>
                <td colspan="2">106 (3.07)</td>
                <td colspan="2">36 (2.81)</td>
                <td colspan="2">39 (3.36)</td>
                <td colspan="2">31 (3.06)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Unavailable</td>
                <td colspan="2">328 (9.5)</td>
                <td colspan="2">116 (9.06)</td>
                <td colspan="2">118 (10.16)</td>
                <td colspan="2">94 (9.28)</td>
              </tr>
              <tr valign="top">
                <td colspan="10">
                  <bold>ADRD Dx<sup>b</sup>, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>AD<sup>c</sup></td>
                <td colspan="2">1317 (38.13)</td>
                <td colspan="2">519 (40.55)</td>
                <td colspan="2">435 (37.47)</td>
                <td colspan="2">363 (35.83)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Dementia unspecified</td>
                <td colspan="2">1101 (31.88)</td>
                <td colspan="2">389 (30.39)</td>
                <td colspan="2">381 (32.82)</td>
                <td colspan="2">331 (32.68)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>FTD<sup>d</sup></td>
                <td colspan="2">190 (5.5)</td>
                <td colspan="2">69 (5.39)</td>
                <td colspan="2">65 (5.6)</td>
                <td colspan="2">56 (5.53)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>LBD<sup>e</sup></td>
                <td colspan="2">261 (7.56)</td>
                <td colspan="2">81 (6.33)</td>
                <td colspan="2">104 (8.96)</td>
                <td colspan="2">76 (7.5)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>VCI<sup>f</sup></td>
                <td colspan="2">96 (2.78)</td>
                <td colspan="2">36 (2.81)</td>
                <td colspan="2">40 (3.45)</td>
                <td colspan="2">20 (1.97)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Other<sup>g</sup></td>
                <td colspan="2">489 (14.16)</td>
                <td colspan="2">186 (14.53)</td>
                <td colspan="2">136 (11.71)</td>
                <td colspan="2">167 (16.49)</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Age of onset was manually annotated by experts viewing clinical notes; for notes without age of onset, we approximated with the age of first encounter.</p>
            </fn>
            <fn id="table3fn2">
              <p><sup>b</sup>Dx: diagnosis.</p>
            </fn>
            <fn id="table3fn3">
              <p><sup>c</sup>AD: Alzheimer disease.</p>
            </fn>
            <fn id="table3fn4">
              <p><sup>d</sup>FTD: frontotemporal dementia.</p>
            </fn>
            <fn id="table3fn5">
              <p><sup>e</sup>LBD: Lewy body dementia.</p>
            </fn>
            <fn id="table3fn6">
              <p><sup>f</sup>VCI: vascular cognitive impairment.</p>
            </fn>
            <fn id="table3fn7">
              <p><sup>g</sup>Includes posterior.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <p>We extracted common topics from each note cluster using topic modeling and examined the distribution of ADRD diagnoses across these clusters. In cluster 1, we found more terms related to psychiatric manifestations (eg, compulsive, indifference, and anxiety) and medications (eg, clozaril, trazodone, and sertraline), with a slight but nonsignificant enrichment in AD diagnosis (<italic>χ</italic><sup>2</sup><sub>1</sub>=4.9; <italic>P</italic><sub>FDR</sub>=.14; PR=1.10). Cluster 2 had more terms related to cardiovascular issues (eg, pacemaker, hypotension, and arrhythmia) and motor and sensory issues (eg, slurring, cochlear, and tremors), with a slight but nonsignificant enrichment in LBD (<italic>χ</italic><sup>2</sup><sub>1</sub>=4.6; <italic>P</italic><sub>FDR</sub>=.14; PR=1.31) and VCI (<italic>χ</italic><sup>2</sup><sub>1</sub>=2.5; <italic>P</italic><sub>FDR</sub>=.25; PR=1.41) diagnoses. Cluster 3 encompassed a wide variety of symptoms and conditions common in geriatric populations, including autoimmune (eg, scleroderma and vasculitis), behavioral changes and movement (eg, usual jocular behavior and imbalance, dysphagia), sleep (eg, insomnia), and sensory (eg, diplopia) problems, with a slight but not-significant enrichment in rare ADRD diagnoses (<italic>χ</italic><sup>2</sup><sub>1</sub>=3; <italic>P</italic><sub>FDR</sub>=.12; PR=1.25). <xref rid="figure3" ref-type="fig">Figure 3</xref>B depicts the list of representative words from each cluster and their PR, and Figure S5D in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref> illustrates sentence examples from each cluster.</p>
        <p>Furthermore, statistical analyses revealed significant associations of note cluster membership, with demographic variables, but not with ADRD diagnoses. First, both cluster 1 and 3 were significantly enriched by female participants (cluster 1: <italic>χ</italic><sup>2</sup><sub>1</sub>=178.7; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=1.593 and cluster 3: <italic>χ</italic><sup>2</sup><sub>1</sub>=12; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=1.14) while cluster 2 was enriched by male participants (<italic>χ</italic><sup>2</sup><sub>1</sub>=290.5; <italic>P</italic><sub>FDR</sub>&lt;.001; PR=1.749; <xref rid="figure5" ref-type="fig">Figure 5</xref>B). In addition, age of onset varied significantly among the note clusters (Kruskal-Wallis <italic>χ</italic><sup>2</sup><sub>2</sub>=14.9; <italic>P</italic>&lt;.001; <italic>η<sup>2</sup></italic>=0.004), with cluster 2 (mean 72.8, SD 9.2 years) having a significantly later age of onset compared to cluster 1 (<italic>Z</italic>=−3.82; <italic>P</italic><sub>FDR</sub>&lt;.001) and cluster 3 (<italic>Z</italic>=2.31; <italic>P</italic><sub>FDR</sub>=.03), while cluster 1 (mean 71.5, SD 9.3 years) and cluster 3 (mean 71.9, SD 9.8 years) did not differ (<italic>Z</italic>=−1.33; <italic>P</italic><sub>FDR</sub>=.19; <xref rid="figure5" ref-type="fig">Figure 5</xref>C). However, no association was observed between note cluster membership and ADRD diagnoses (Cluster 1-AD: <italic>χ</italic><sup>2</sup><sub>1</sub>=4.9; <italic>P</italic><sub>FDR</sub>=.14; Cluster 1-dementia unspecified: <italic>χ</italic><sup>2</sup><sub>1</sub>=1.9; <italic>P</italic><sub>FDR</sub>=.32; Cluster 1-FTD: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.02; <italic>P</italic><sub>FDR</sub>=.99; Cluster 1-LBD: <italic>χ</italic><sup>2</sup><sub>1</sub>=4.1; <italic>P</italic><sub>FDR</sub>=.15; Cluster 1-other: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.19; <italic>P</italic><sub>FDR</sub>=.92; Cluster 1-VCI: <italic>χ</italic><sup>2</sup><sub>1</sub>&lt;0.001, <italic>P</italic><sub>FDR</sub>=.99; Cluster 2-AD: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.3; <italic>P</italic><sub>FDR</sub>=.89; Cluster 2-dementia unspecified: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.6; <italic>P</italic><sub>FDR</sub>=.76; Cluster 2-FTD: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.01; <italic>P</italic><sub>FDR</sub>=.99; Cluster 2-LBD: <italic>χ</italic><sup>2</sup><sub>1</sub>=4.6; <italic>P</italic><sub>FDR</sub>=.14; Cluster 2-other: <italic>χ</italic><sup>2</sup><sub>1</sub>=8.3; <italic>P</italic><sub>FDR</sub>=.07; Cluster 2-VCI: <italic>χ</italic><sup>2</sup><sub>1</sub>=2.5; <italic>P</italic><sub>FDR</sub>=.25; Cluster 3-AD: <italic>χ</italic><sup>2</sup><sub>1</sub>=3.1; <italic>P</italic><sub>FDR</sub>=.21; Cluster 3-dementia unspecified: <italic>χ</italic><sup>2</sup><sub>1</sub>=0.4; <italic>P</italic><sub>FDR</sub>=.89; Cluster 3-FTD: <italic>χ</italic><sup>2</sup><sub>1</sub>&lt;0.001; <italic>P</italic><sub>FDR</sub>=.99; Cluster 3-LBD: <italic>χ</italic><sup>2</sup><sub>1</sub>&lt;0.001; <italic>P</italic><sub>FDR</sub>=.99; Cluster 3-other: <italic>χ</italic><sup>2</sup><sub>1</sub>=6.1; <italic>P</italic><sub>FDR</sub>=.12; Cluster 3-VCI: <italic>χ</italic><sup>2</sup><sub>1</sub>=3; <italic>P</italic><sub>FDR</sub>=.21; <xref rid="figure5" ref-type="fig">Figure 5</xref>D). Additional visualizations of the UMAP projections colored by sex, age of onset, and ADRD diagnoses are provided in Figures S5A, S5B, and S5C, respectively, in <xref ref-type="supplementary-material" rid="app2">Multimedia Appendix 2</xref>.</p>
      </sec>
      <sec>
        <title>Comparison Between ICD Clusters and Note Clusters</title>
        <p>Statistical analysis demonstrated significant associations between <italic>ICD</italic> and note clusters (<italic>χ</italic><sup>2</sup><sub>4</sub>=89.43; <italic>P</italic>&lt;.001; Cramér <italic>V</italic>=0.114). Specifically, note cluster 1, characterized by more female participants (PR=1.593) and terms related to psychiatric manifestations and medications, significantly overlapped (standardized residual=8.42; <italic>P</italic><sub>FDR</sub>&lt;.001) with <italic>ICD</italic> cluster 2, which is noted for the earliest onset of disease (mean 69.8, SD 9.6 years) and a higher prevalence of psychiatric disorders and higher proportion of patients with FTD (PR<italic>=</italic>2.039). In addition, note cluster 2, which had higher proportion of male participants (PR<italic>=</italic>1.749) and terms related to cardiovascular and motor issues, overlapped significantly (standardized residual=4.90; <italic>P</italic><sub>FDR</sub>&lt;.001) with <italic>ICD</italic> cluster 3, which is marked by the oldest onset of disease (mean 75.5, SD 8.1 years), a higher occurrence of VCI (PR<italic>=</italic>2.147), and dementia unspecified (PR<italic>=</italic>1.622) and had high prevalence of diabetes. These findings suggest a meaningful pattern of cluster correspondence across modalities (<xref rid="figure6" ref-type="fig">Figure 6</xref>).</p>
        <fig id="figure6" position="float">
          <label>Figure 6</label>
          <caption>
            <p>Heatmap of the association of International Classification of Diseases (ICD) clusters with note clusters. Heatmap of the association of ICD clusters with note clusters. ICD clusters were significantly associated with note clusters (<italic>P</italic>&lt;.001). Post hoc analyses revealed that note cluster 1 was positively associated with ICD cluster 2 (standardized residual=8.42, <italic>P</italic>&lt;.001) and negatively associated with ICD clusters 1 and 3 (cluster 1: standardized residual=−4.57, <italic>P</italic>&lt;.001; cluster 3: standardized residual=−6.36, <italic>P</italic>&lt;.001). Furthermore, note cluster 2 was positively associated with ICD cluster 3 (standardized residual=4.9, <italic>P</italic>&lt;.001) and negatively associated with ICD cluster 2 (standardized residual=−5.48, <italic>P</italic>&lt;.001). Finally, note cluster 3 was negatively associated with ICD cluster 2 (standardized residual=−3.25, <italic>P</italic>=.003). Each cell displays standardized residuals (standardized differences between the observed count and the expected count) along with the count of overlapping patients (n). Color bar represents the value of the standardized residual. <italic>P</italic> values were corrected with false discovery rate adjustments.</p>
          </caption>
          <graphic xlink:href="aging_v8i1e65178_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>This study aimed to characterize the clinical heterogeneity across ADRD by applying representation learning techniques on patient EHRs in a tertiary care clinic. We used pretrained <italic>ICD</italic> code embeddings, a transformer architecture for encoding clinical notes, and unsupervised learning to identify distinct ADRD subtypes. This work represents the first example of clustering patients with ADRD using embeddings derived directly from an LLM, without prior rule-based extraction of relevant medical concepts from the clinical note. The <italic>ICD</italic> codes allowed us to investigate subtypes of patients with similar <italic>ICD</italic> codes (non-ADRD diagnosis in charts), while the clinical notes allowed us to capture clinical history and presentation recorded by memory specialists. Our results demonstrate distinct patterns of disease manifestation with significant overlap between the <italic>ICD</italic> and note clusters. The overlap of clusters between the 2 approaches suggests that the subtypes may reflect common underlying clinical heterogeneity, as distinct subtypes can be identified through different data modalities.</p>
        <p>Our choice of hierarchical agglomerative clustering was guided by the hierarchical nature of our data, empirical evidence from prior dementia subtyping studies, and theoretical limitations of alternative algorithms. Alternative methods, such as K-means, Gaussian mixture models [<xref ref-type="bibr" rid="ref40">40</xref>], and density-based spatial clustering of applications with noise (DBSCAN) [<xref ref-type="bibr" rid="ref41">41</xref>], face theoretical limitations: K-means assumes spherical clusters that is difficult to satisfy in high-dimensional embeddings; DBSCAN relies on density thresholds that break down in such spaces; and Gaussian mixture models can be unstable with overlapping subtypes. In contrast, hierarchical clustering preserves these nested relationships, resulting in more homogeneous [<xref ref-type="bibr" rid="ref42">42</xref>] and reproducible [<xref ref-type="bibr" rid="ref43">43</xref>] clusters.</p>
        <p>In our study, we identified 3 clusters from <italic>ICD</italic> embeddings, each characterized by distinct health conditions. Cluster 1 predominantly featured issues related to skin health, with a commonality of dementia unspecified diagnoses and an average age of onset in the early 70s. The association between skin health and dementia in this cluster may be attributed to age, as both conditions become more prevalent with advancing age. This aligns with findings from previous studies, which reported an increase in the prevalence of actinic keratosis [<xref ref-type="bibr" rid="ref44">44</xref>] and seborrheic keratosis [<xref ref-type="bibr" rid="ref45">45</xref>], as well as AD [<xref ref-type="bibr" rid="ref46">46</xref>], with age. Cluster 2 is marked by early-onset, psychiatric and behavioral manifestations; enrichment in FTD and other less common forms of ADRD; and the earliest age of onset among our clusters, typically in the late 60s. This cluster extends the characterization found in previous studies that described a behavioral symptom subtype in patients [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] by demonstrating similar characteristics in a broader population of patients with ADRD. Cluster 3 encompasses a broad array of conditions like respiratory issues and severe diabetes, affecting older patients, more female participants than male participants, with a higher incidence of VCI and dementia unspecified, and an age of onset in the mid-70s. Reflecting the AD subtype identified by previous researchers, this group was characterized as being overall older and having more comorbidities [<xref ref-type="bibr" rid="ref20">20</xref>]. Landi et al [<xref ref-type="bibr" rid="ref23">23</xref>] further differentiated patients with AD by onset timing, which we also observed but across a more diverse set of ADRD diagnoses. Notably, our <italic>ICD</italic>-based clustering did not reveal clearly separated clusters in the 2D UMAP projections. While UMAP aims to preserve both local and global relationships when reducing high-dimensional data to a lower-dimensional space, some distortions may inevitably occur during dimensionality reduction. Alternatively, the overlapping clusters could reflect the complexity of comorbid conditions in ADRD, which may not form clearly distinguishable subgroups.</p>
        <p>In addition, our analysis of clinical notes revealed 3 distinct subtypes. Cluster 1 featured terms related to psychiatric manifestations and medications, aligning with findings from previous studies [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>]. Cluster 2 included terms related to cardiovascular and various motor and sensory issues, supported by previous studies that identified subtypes of CVD [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref21">21</xref>] and aligning with the predominant diagnoses of VCI and LBD within this cluster. Cluster 3 covered a wide array of health conditions, consistent with the higher occurrence of rare ADRD diagnoses, which tend to involve more heterogeneous health conditions. Notably, we observed significant overlap between <italic>ICD</italic> and note clusters, identifying 2 ADRD subtypes of interest that were concordant across the 2 data modalities: the first subtype, “psychiatric manifestations,” and the second subtype, “diabetes with cardiovascular or motor issues.” Thus, our analysis delineated 2 distinct ADRD subtypes with specific diagnostic and symptomatic profiles.</p>
        <p>Our study identified sex differences across all clinical note clusters with substantial effects observed in note clusters 1 and 2. For example, note cluster 1 was significantly overrepresented in female participants and had a higher prevalence of AD (PR=1.1). It also overlapped significantly (<italic>P</italic>&lt;.001) with <italic>ICD</italic> cluster 2, which was enriched for psychiatric and behavioral symptoms (eg, apathy). This aligns with Tang et al [<xref ref-type="bibr" rid="ref25">25</xref>], who reported stronger psychiatric associations in female patients with AD, including greater links to depression. This pattern may be partially attributed to women’s greater likelihood of seeking mental health care [<xref ref-type="bibr" rid="ref47">47</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. In contrast, note cluster 2 was overrepresented in male participants, with higher prevalence of VCI (PR=1.41) and LBD (PR=1.31), consistent with Tang et al [<xref ref-type="bibr" rid="ref25">25</xref>], who found vascular dementia was more common in male participants. The higher prevalence of VCI in male participants may be related to a greater burden of hypertension, particularly in early life [<xref ref-type="bibr" rid="ref49">49</xref>]. In addition, the increased representation of male participants with LBD may reflect potential underdiagnosis in female participants [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>]. Given the clinical impact of sex disparities in ADRD—particularly in AD and LBD [<xref ref-type="bibr" rid="ref52">52</xref>]—future studies integrating longitudinal data and clinicopathological evidence will be crucial to disentangling biological influences from health care–seeking behaviors.</p>
        <p>Another interesting observation relates to variations in age of onset, a key indicator of disease severity, across the identified subtypes in both clinical notes and <italic>ICD</italic>-based clusters, with notable differences in the <italic>ICD</italic>-derived subtypes. For instance, the early-onset <italic>ICD</italic> cluster 2 was enriched with psychiatric disorders and included diseases known with early-onset, including FTD [<xref ref-type="bibr" rid="ref53">53</xref>] and other rare ADRD categories, such as PCA [<xref ref-type="bibr" rid="ref54">54</xref>]. In contrast, the late-onset <italic>ICD</italic> cluster 3, exhibited a higher prevalence of diverse health conditions, including respiratory issues (eg, cough and shortness of breath), chronic pain, musculoskeletal conditions, such as bilateral low back pain and foot pain, as well as diabetes mellitus. While chronic pain is not typically associated with ADRD, pain could indicate the general aging process [<xref ref-type="bibr" rid="ref55">55</xref>], and relate to osteoporosis and osteoarthritis, which likely contribute to chronic pain in older adults. Other symptoms, such as foot pain and shortness of breath, may reflect comorbidities of diabetes.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>Our study has a few limitations. First, there are the challenges associated with using real-world EHR data. Differences in how health care providers document information, stemming from variations in training, personal documentation habits, and clinical judgment, may have contributed to inconsistencies. Furthermore, health care use patterns, such as visit regularity, may influence our clustering results. For example, variations in visit frequency could lead to overrepresentation of certain symptom clusters or skewed associations. Future studies adjusting for health care use patterns may help address this limitation. Second, the inclusion of long-term patient histories in clinical notes—where recent notes may capture both current and past symptoms—could introduce extraneous information, making it difficult to isolate content relevant to the latest diagnosis. This mixture of historical and recent data may have diluted the association between documented ADRD diagnoses and their actual clinical significance, leading to observed trends rather than clear associations. Furthermore, the repetition of relevant language across multiple encounters may have influenced the clustering process, potentially reflecting the frequency of patient visits to the memory clinic, rather than clinical characteristics. Third, our study is constrained by the absence of an independent validation cohort to confirm the identified clusters. While the relative overlap in clusters identified through <italic>ICD</italic> codes and note contents, along with the alignment with findings from previous research, offers some validation, the results could be strengthened by applying the same encoding and clustering techniques to an external validation cohort. To ensure external validity, these results need to be validated at other health care institutions. Fourth, another limitation of this study is that our subtyping characterization only focused on ADRD diagnoses based on etiology, but did not address the stage of disease, which clearly affects the neuropsychological profile. This calls for a focus on the heterogeneity of disease stage in future research. Moreover, there may be sex differences in who receives health care at different stages and ages, adding another layer of complexity to our findings. Finally, our study is limited by the lack of racial diversity in the cohort, with 88.6% of participants being White. Given known racial differences in AD incidence, comorbidities, and health care access [<xref ref-type="bibr" rid="ref56">56</xref>-<xref ref-type="bibr" rid="ref59">59</xref>]—and particularly the heightened impact of hypertension on AD risk in some minoritized groups [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>]—our findings may not fully capture the spectrum of ADRD subtypes in these populations. Future studies with broader representation are necessary to improve the generalizability of our subtyping approach.</p>
      </sec>
      <sec>
        <title>Future Directions</title>
        <p>In future work, the preprocessing of clinical notes could be enhanced by implementing multiple methods, such as medspaCy [<xref ref-type="bibr" rid="ref61">61</xref>], with a focus on targeting sections most relevant to diagnoses, such as medical history. To further improve the extraction and analysis of pertinent data, the use of emerging LLMs, such as GPT [<xref ref-type="bibr" rid="ref39">39</xref>], should be explored. In addition, validating an independent dataset and enriching the patient population would help increase the robustness and reliability of the identified ADRD subtypes. To advance this work, we will use a dual-modality approach that leverages both structured and unstructured data sources, such as medications and imaging. A deep autoencoder that uses multiple modalities simultaneously could offer methodological improvements over our current practice of conducting parallel clustering analyses and relying on heuristic averaging of embeddings. Furthermore, explicitly using the temporal or graph properties of EHRs could yield more informative representations, enhancing unsupervised clustering capabilities, as has been shown in prior approaches in a supervised learning setting [<xref ref-type="bibr" rid="ref62">62</xref>,<xref ref-type="bibr" rid="ref63">63</xref>]. Ultimately, our goal is to develop machine learning models capable of predicting these ADRD subtypes from real-word health care systems. Such models may aid in more precise diagnostics, prognostics, and the formulation of targeted treatment strategies.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>List of diagnosis names to Alzheimer disease and related dementias diagnosis categories. This document provides a list of diagnosis names from the electronic health records of patients at a memory clinic to various Alzheimer disease and related dementias diagnosis categories.</p>
        <media xlink:href="aging_v8i1e65178_app1.pdf" xlink:title="PDF File  (Adobe PDF File), 613 KB"/>
      </supplementary-material>
      <supplementary-material id="app2">
        <label>Multimedia Appendix 2</label>
        <p>Visualizations of model attention and embedding representations. This appendix includes attention heatmaps from the final transformer layer across heads, as well as Uniform Manifold Approximation and Projection projections of International Classification of Diseases code, and clinical note embeddings, characterized by sex, age of onset, Alzheimer disease and related dementia diagnosis, and provider information.</p>
        <media xlink:href="aging_v8i1e65178_app2.docx" xlink:title="DOCX File , 2067 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AD</term>
          <def>
            <p>Alzheimer disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">ADRD</term>
          <def>
            <p>Alzheimer disease and related dementia</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">Aβ</term>
          <def>
            <p>amyloid beta</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations from Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">CVD</term>
          <def>
            <p>cerebrovascular disease</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">DBSCAN</term>
          <def>
            <p>density-based spatial clustering of applications with noise</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">FDR</term>
          <def>
            <p>false discovery rate</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">FTD</term>
          <def>
            <p>frontotemporal dementia</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">ICD</term>
          <def>
            <p>International Classification of Diseases</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb11">LBD</term>
          <def>
            <p>Lewy body dementia</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb12">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb13">MGH</term>
          <def>
            <p>Massachusetts General Hospital</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb14">MIMIC</term>
          <def>
            <p>Medical Information Mart for Intensive Care</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb15">PCA</term>
          <def>
            <p>posterior cortical atrophy</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb16">PR</term>
          <def>
            <p>prevalence ratio</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb17">TF-IDF</term>
          <def>
            <p>term frequency–inverse document frequency</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb18">UMAP</term>
          <def>
            <p>Uniform Manifold Approximation and Projection </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb19">VCI</term>
          <def>
            <p>vascular cognitive impairment</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was funded by National Institute of Aging P30AG062421 (SD and BTH). The funder played no role in study design, data collection, analysis and interpretation of data, or the writing of this manuscript. The authors acknowledge Yoonchul Shin and Qinglin Gou for annotating the age of onset from clinical notes.</p>
    </ack>
    <notes>
      <sec>
        <title>Data Availability</title>
        <p>The data used for this study are available from the Mass General Brigham Healthcare System, but restrictions apply to the availability of these data, which were used under permission for this study, and so are not publicly available. Code will be available on GitHub upon publication.</p>
      </sec>
    </notes>
    <fn-group>
      <fn fn-type="con">
        <p>MW was responsible for conceptualization, formal analysis, investigation, methodology, software, and writing original draft. YC was responsible for data curation, formal analysis, investigation, methodology, software, visualization, writing original draft, review, and editing. YH was responsible for data curation and analysis, review, and editing. YL was responsible for formal analysis, methodology, and software. CM was responsible for conceptualization, review, and editing. BTH was responsible for review and editing. JRD was responsible for data curation, review, and editing. AS-P was responsible for review and editing. DB was responsible for review and editing. SD was responsible for conceptualization, funding acquisition, investigation, methodology, supervision, review, and editing.</p>
      </fn>
      <fn fn-type="conflict">
        <p>JRD served on a scientific review board for I-Mab Biopharma. All other authors declare no conflicts of interest.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="web">
          <article-title>Dementia fact sheet</article-title>
          <source>World Health Organization</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.who.int/news-room/fact-sheets/detail/dementia">https://www.who.int/news-room/fact-sheets/detail/dementia</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="web">
          <article-title>Alzheimer's disease fact sheet</article-title>
          <source>National Institute on Aging</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.nia.nih.gov/health/alzheimers-and-dementia/alzheimers-disease-fact-sheet">https://www.nia.nih.gov/health/alzheimers-and-dementia/alzheimers-disease-fact-sheet</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bloom</surname>
              <given-names>GS</given-names>
            </name>
          </person-group>
          <article-title>Amyloid-β and tau: the trigger and bullet in Alzheimer disease pathogenesis</article-title>
          <source>JAMA Neurol</source>
          <year>2014</year>
          <month>04</month>
          <day>01</day>
          <volume>71</volume>
          <issue>4</issue>
          <fpage>505</fpage>
          <lpage>8</lpage>
          <pub-id pub-id-type="doi">10.1001/jamaneurol.2013.5847</pub-id>
          <pub-id pub-id-type="medline">24493463</pub-id>
          <pub-id pub-id-type="pii">1817720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stampfer</surname>
              <given-names>MJ</given-names>
            </name>
          </person-group>
          <article-title>Cardiovascular disease and Alzheimer's disease: common links</article-title>
          <source>J Intern Med</source>
          <year>2006</year>
          <month>09</month>
          <day>26</day>
          <volume>260</volume>
          <issue>3</issue>
          <fpage>211</fpage>
          <lpage>23</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.1111/j.1365-2796.2006.01687.x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1365-2796.2006.01687.x</pub-id>
          <pub-id pub-id-type="medline">16918818</pub-id>
          <pub-id pub-id-type="pii">JIM1687</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kotzbauer</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Trojanowsk</surname>
              <given-names>JQ</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>VM</given-names>
            </name>
          </person-group>
          <article-title>Lewy body pathology in Alzheimer's disease</article-title>
          <source>J Mol Neurosci</source>
          <year>2001</year>
          <month>10</month>
          <volume>17</volume>
          <issue>2</issue>
          <fpage>225</fpage>
          <lpage>32</lpage>
          <pub-id pub-id-type="doi">10.1385/jmn:17:2:225</pub-id>
          <pub-id pub-id-type="medline">11816795</pub-id>
          <pub-id pub-id-type="pii">JMN:17:2:225</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Irwin</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Grossman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Weintraub</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hurtig</surname>
              <given-names>HI</given-names>
            </name>
            <name name-style="western">
              <surname>Duda</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Xie</surname>
              <given-names>SX</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>van Deerlin</surname>
              <given-names>VM</given-names>
            </name>
            <name name-style="western">
              <surname>Lopez</surname>
              <given-names>OL</given-names>
            </name>
            <name name-style="western">
              <surname>Kofler</surname>
              <given-names>JK</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>PT</given-names>
            </name>
            <name name-style="western">
              <surname>Jicha</surname>
              <given-names>GA</given-names>
            </name>
            <name name-style="western">
              <surname>Woltjer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Quinn</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Kaye</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Leverenz</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Tsuang</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Longfellow</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yearout</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kukull</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Keene</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Montine</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zabetian</surname>
              <given-names>CP</given-names>
            </name>
            <name name-style="western">
              <surname>Trojanowski</surname>
              <given-names>JQ</given-names>
            </name>
          </person-group>
          <article-title>Neuropathological and genetic correlates of survival and dementia onset in synucleinopathies: a retrospective analysis</article-title>
          <source>Lancet Neurol</source>
          <year>2017</year>
          <month>01</month>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>55</fpage>
          <lpage>65</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27979356"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1474-4422(16)30291-5</pub-id>
          <pub-id pub-id-type="medline">27979356</pub-id>
          <pub-id pub-id-type="pii">S1474-4422(16)30291-5</pub-id>
          <pub-id pub-id-type="pmcid">PMC5181646</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferreira</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Przybelski</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Lesnick</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>Lemstra</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Londos</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Blanc</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Nedelska</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Schwarz</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Graff-Radford</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Senjem</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Fields</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Knopman</surname>
              <given-names>DS</given-names>
            </name>
            <name name-style="western">
              <surname>Savica</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ferman</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Graff-Radford</surname>
              <given-names>NR</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>VJ</given-names>
            </name>
            <name name-style="western">
              <surname>Jack</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Petersen</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Mollenhauer</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Garcia-Ptacek</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Abdelnour</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Hort</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bonanni</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Oppedal</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kramberger</surname>
              <given-names>MG</given-names>
            </name>
            <name name-style="western">
              <surname>Boeve</surname>
              <given-names>BF</given-names>
            </name>
            <name name-style="western">
              <surname>Aarsland</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Westman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kantarci</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>β-Amyloid and tau biomarkers and clinical phenotype in dementia with Lewy bodies</article-title>
          <source>Neurology</source>
          <year>2020</year>
          <month>12</month>
          <day>15</day>
          <volume>95</volume>
          <issue>24</issue>
          <fpage>e3257</fpage>
          <lpage>68</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32989106"/>
          </comment>
          <pub-id pub-id-type="doi">10.1212/WNL.0000000000010943</pub-id>
          <pub-id pub-id-type="medline">32989106</pub-id>
          <pub-id pub-id-type="pii">WNL.0000000000010943</pub-id>
          <pub-id pub-id-type="pmcid">PMC7836666</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hardy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Selkoe</surname>
              <given-names>DJ</given-names>
            </name>
          </person-group>
          <article-title>The amyloid hypothesis of Alzheimer's disease: progress and problems on the road to therapeutics</article-title>
          <source>Science</source>
          <year>2002</year>
          <month>07</month>
          <day>19</day>
          <volume>297</volume>
          <issue>5580</issue>
          <fpage>353</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1126/science.1072994</pub-id>
          <pub-id pub-id-type="medline">12130773</pub-id>
          <pub-id pub-id-type="pii">297/5580/353</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mukhopadhyay</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Banerjee</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>A primer on the evolution of aducanumab: the first antibody approved for treatment of Alzheimer's disease</article-title>
          <source>J Alzheimers Dis</source>
          <year>2021</year>
          <volume>83</volume>
          <issue>4</issue>
          <fpage>1537</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.3233/JAD-215065</pub-id>
          <pub-id pub-id-type="medline">34366359</pub-id>
          <pub-id pub-id-type="pii">JAD215065</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Neff</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Vatansever</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Ming</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Horgusluoglu-Moloch</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Castranio</surname>
              <given-names>EL</given-names>
            </name>
            <name name-style="western">
              <surname>Tcw</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Goate</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Fossati</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Noggle</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gandy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ehrlich</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Katsel</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schadt</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Cai</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brennand</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Haroutunian</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Molecular subtyping of Alzheimer's disease using RNA sequencing data reveals novel mechanisms and targets</article-title>
          <source>Sci Adv</source>
          <year>2021</year>
          <month>01</month>
          <day>08</day>
          <volume>7</volume>
          <issue>2</issue>
          <fpage>eabb5398</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https:///www.science.org/doi/10.1126/sciadv.abb5398?url_ver=Z39.88-2003&amp;rfr_id=ori:rid:crossref.org&amp;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1126/sciadv.abb5398</pub-id>
          <pub-id pub-id-type="medline">33523961</pub-id>
          <pub-id pub-id-type="pii">7/2/eabb5398</pub-id>
          <pub-id pub-id-type="pmcid">PMC7787497</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Young</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Marinescu</surname>
              <given-names>RV</given-names>
            </name>
            <name name-style="western">
              <surname>Oxtoby</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Bocchetta</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Yong</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Firth</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Cash</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Thomas</surname>
              <given-names>DL</given-names>
            </name>
            <name name-style="western">
              <surname>Dick</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Cardoso</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van Swieten</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Borroni</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Galimberti</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Masellis</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tartaglia</surname>
              <given-names>MC</given-names>
            </name>
            <name name-style="western">
              <surname>Rowe</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Graff</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Tagliavini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Frisoni</surname>
              <given-names>GB</given-names>
            </name>
            <name name-style="western">
              <surname>Laforce</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Finger</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>de Mendonça</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sorbi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Warren</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Crutch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Fox</surname>
              <given-names>NC</given-names>
            </name>
            <name name-style="western">
              <surname>Ourselin</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Schott</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Rohrer</surname>
              <given-names>JD</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>DC</given-names>
            </name>
            <collab>Genetic FTD Initiative (GENFI)</collab>
            <collab>Alzheimer’s Disease Neuroimaging Initiative (ADNI)</collab>
          </person-group>
          <article-title>Uncovering the heterogeneity and temporal complexity of neurodegenerative diseases with Subtype and Stage Inference</article-title>
          <source>Nat Commun</source>
          <year>2018</year>
          <month>10</month>
          <day>15</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>4273</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/625633"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-018-05892-0</pub-id>
          <pub-id pub-id-type="medline">30323170</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-018-05892-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC6189176</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vogel</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>AL</given-names>
            </name>
            <name name-style="western">
              <surname>Oxtoby</surname>
              <given-names>NP</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ossenkoppele</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Strandberg</surname>
              <given-names>OT</given-names>
            </name>
            <name name-style="western">
              <surname>La Joie</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Aksman</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Grothe</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Iturria-Medina</surname>
              <given-names>Y</given-names>
            </name>
            <collab>Alzheimer’s Disease Neuroimaging Initiative</collab>
            <name name-style="western">
              <surname>Pontecorvo</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Devous</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Rabinovici</surname>
              <given-names>GD</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Lyoo</surname>
              <given-names>CH</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Hansson</surname>
              <given-names>O</given-names>
            </name>
          </person-group>
          <article-title>Four distinct trajectories of tau deposition identified in Alzheimer's disease</article-title>
          <source>Nat Med</source>
          <year>2021</year>
          <month>05</month>
          <volume>27</volume>
          <issue>5</issue>
          <fpage>871</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33927414"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41591-021-01309-6</pub-id>
          <pub-id pub-id-type="medline">33927414</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-021-01309-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC8686688</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scheltens</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Tijms</surname>
              <given-names>BM</given-names>
            </name>
            <name name-style="western">
              <surname>Koene</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Barkhof</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Teunissen</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Wolfsgruber</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wagner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kornhuber</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Peters</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Cohn-Sheehy</surname>
              <given-names>BI</given-names>
            </name>
            <name name-style="western">
              <surname>Rabinovici</surname>
              <given-names>GD</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>BL</given-names>
            </name>
            <name name-style="western">
              <surname>Kramer</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Scheltens</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>van der Flier</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>Cognitive subtypes of probable Alzheimer's disease robustly identified in four cohorts</article-title>
          <source>Alzheimers Dement</source>
          <year>2017</year>
          <month>11</month>
          <day>17</day>
          <volume>13</volume>
          <issue>11</issue>
          <fpage>1226</fpage>
          <lpage>36</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28427934"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jalz.2017.03.002</pub-id>
          <pub-id pub-id-type="medline">28427934</pub-id>
          <pub-id pub-id-type="pmcid">PMC5857387</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Libon</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Drabick</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Giovannetti</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Price</surname>
              <given-names>CC</given-names>
            </name>
            <name name-style="western">
              <surname>Bondi</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Eppig</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nieves</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lamar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Delano-Wood</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Nation</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Brennan</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Au</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Swenson</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Neuropsychological syndromes associated with Alzheimer's/vascular dementia: a latent class analysis</article-title>
          <source>J Alzheimers Dis</source>
          <year>2014</year>
          <month>09</month>
          <day>16</day>
          <volume>42</volume>
          <issue>3</issue>
          <fpage>999</fpage>
          <lpage>1014</lpage>
          <pub-id pub-id-type="doi">10.3233/JAD-132147</pub-id>
          <pub-id pub-id-type="medline">25024329</pub-id>
          <pub-id pub-id-type="pii">8345N78V0162V6V7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Scheltens</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Galindo-Garre</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Pijnenburg</surname>
              <given-names>YA</given-names>
            </name>
            <name name-style="western">
              <surname>van der Vlies</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Smits</surname>
              <given-names>LL</given-names>
            </name>
            <name name-style="western">
              <surname>Koene</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Teunissen</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Barkhof</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Wattjes</surname>
              <given-names>MP</given-names>
            </name>
            <name name-style="western">
              <surname>Scheltens</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>van der Flier</surname>
              <given-names>WM</given-names>
            </name>
          </person-group>
          <article-title>The identification of cognitive subtypes in Alzheimer's disease dementia using latent class analysis</article-title>
          <source>J Neurol Neurosurg Psychiatry</source>
          <year>2016</year>
          <month>03</month>
          <day>17</day>
          <volume>87</volume>
          <issue>3</issue>
          <fpage>235</fpage>
          <lpage>43</lpage>
          <pub-id pub-id-type="doi">10.1136/jnnp-2014-309582</pub-id>
          <pub-id pub-id-type="medline">25783437</pub-id>
          <pub-id pub-id-type="pii">jnnp-2014-309582</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alashwal</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>El Halaby</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Crouse</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Abdalla</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Moustafa</surname>
              <given-names>AA</given-names>
            </name>
          </person-group>
          <article-title>The application of unsupervised clustering methods to Alzheimer's disease</article-title>
          <source>Front Comput Neurosci</source>
          <year>2019</year>
          <month>5</month>
          <day>24</day>
          <volume>13</volume>
          <fpage>31</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31178711"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fncom.2019.00031</pub-id>
          <pub-id pub-id-type="medline">31178711</pub-id>
          <pub-id pub-id-type="pmcid">PMC6543980</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Doshi-Velez</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Comorbidity clusters in autism spectrum disorders: an electronic health record time-series analysis</article-title>
          <source>Pediatrics</source>
          <year>2014</year>
          <month>01</month>
          <volume>133</volume>
          <issue>1</issue>
          <fpage>e54</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24323995"/>
          </comment>
          <pub-id pub-id-type="doi">10.1542/peds.2013-0819</pub-id>
          <pub-id pub-id-type="medline">24323995</pub-id>
          <pub-id pub-id-type="pii">peds.2013-0819</pub-id>
          <pub-id pub-id-type="pmcid">PMC3876178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Eran</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Palmer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Avillach</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Levy-Moonshine</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kohane</surname>
              <given-names>IS</given-names>
            </name>
          </person-group>
          <article-title>A multidimensional precision medicine approach identifies an autism subtype characterized by dyslipidemia</article-title>
          <source>Nat Med</source>
          <year>2020</year>
          <month>09</month>
          <day>10</day>
          <volume>26</volume>
          <issue>9</issue>
          <fpage>1375</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1038/s41591-020-1007-0</pub-id>
          <pub-id pub-id-type="medline">32778826</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41591-020-1007-0</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chou</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Liang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Sarva</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Henchcliffe</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Data-driven subtyping of Parkinson's disease using longitudinal clinical records: a cohort study</article-title>
          <source>Sci Rep</source>
          <year>2019</year>
          <month>01</month>
          <day>28</day>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>797</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41598-018-37545-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41598-018-37545-z</pub-id>
          <pub-id pub-id-type="medline">30692568</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41598-018-37545-z</pub-id>
          <pub-id pub-id-type="pmcid">PMC6349906</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Brandt</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Jiang</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Kiefer</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mao</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Pacheco</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Rasmussen</surname>
              <given-names>LV</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Isaacson</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Data-driven discovery of probable Alzheimer's disease and related dementia subphenotypes using electronic health records</article-title>
          <source>Learn Health Syst</source>
          <year>2020</year>
          <month>10</month>
          <day>10</day>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>e10246</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/33083543"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/lrh2.10246</pub-id>
          <pub-id pub-id-type="medline">33083543</pub-id>
          <pub-id pub-id-type="pii">LRH210246</pub-id>
          <pub-id pub-id-type="pmcid">PMC7556420</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Barkhof</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Denaxas</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Using unsupervised learning to identify clinical subtypes of Alzheimer's disease in electronic health records</article-title>
          <source>Stud Health Technol Inform</source>
          <year>2020</year>
          <month>06</month>
          <day>16</day>
          <volume>270</volume>
          <fpage>499</fpage>
          <lpage>503</lpage>
          <pub-id pub-id-type="doi">10.3233/SHTI200210</pub-id>
          <pub-id pub-id-type="medline">32570434</pub-id>
          <pub-id pub-id-type="pii">SHTI200210</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Alexander</surname>
              <given-names>DC</given-names>
            </name>
            <name name-style="western">
              <surname>Barkhof</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Denaxas</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Identifying and evaluating clinical subtypes of Alzheimer's disease in care electronic health records using unsupervised machine learning</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2021</year>
          <month>12</month>
          <day>08</day>
          <volume>21</volume>
          <issue>1</issue>
          <fpage>343</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-021-01693-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-021-01693-6</pub-id>
          <pub-id pub-id-type="medline">34879829</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-021-01693-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC8653614</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Landi</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>HC</given-names>
            </name>
            <name name-style="western">
              <surname>Cherng</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Landi</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Danieletto</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dudley</surname>
              <given-names>JT</given-names>
            </name>
            <name name-style="western">
              <surname>Furlanello</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Miotto</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Deep representation learning of electronic health records to unlock patient stratification at scale</article-title>
          <source>NPJ Digit Med</source>
          <year>2020</year>
          <volume>3</volume>
          <fpage>96</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-020-0301-z"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-020-0301-z</pub-id>
          <pub-id pub-id-type="medline">32699826</pub-id>
          <pub-id pub-id-type="pii">301</pub-id>
          <pub-id pub-id-type="pmcid">PMC7367859</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>He</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Tian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Erdengasileng</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Charness</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Temporal subtyping of Alzheimer's disease using medical conditions preceding Alzheimer’s disease onset in electronic health records</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2022</year>
          <volume>2022</volume>
          <fpage>226</fpage>
          <lpage>35</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35854753"/>
          </comment>
          <pub-id pub-id-type="medline">35854753</pub-id>
          <pub-id pub-id-type="pii">2172</pub-id>
          <pub-id pub-id-type="pmcid">PMC9285183</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Oskotsky</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Havaldar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mantyh</surname>
              <given-names>WG</given-names>
            </name>
            <name name-style="western">
              <surname>Bicak</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Solsberg</surname>
              <given-names>CW</given-names>
            </name>
            <name name-style="western">
              <surname>Woldemariam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Oskotsky</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Dubal</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>IE</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>Sirota</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Deep phenotyping of Alzheimer's disease leveraging electronic medical records identifies sex-specific clinical associations</article-title>
          <source>Nat Commun</source>
          <year>2022</year>
          <month>02</month>
          <day>03</day>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>675</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41467-022-28273-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41467-022-28273-0</pub-id>
          <pub-id pub-id-type="medline">35115528</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41467-022-28273-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC8814236</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tang</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Rankin</surname>
              <given-names>KP</given-names>
            </name>
            <name name-style="western">
              <surname>Cerono</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Miramontes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Mills</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Roger</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Soman</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Woldemariam</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bove</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Glymour</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Aghaeepour</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Oskotsky</surname>
              <given-names>TT</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>IE</given-names>
            </name>
            <name name-style="western">
              <surname>Sanders</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Baranzini</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Sirota</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Leveraging electronic health records and knowledge networks for Alzheimer's disease prediction and sex-specific biological insights</article-title>
          <source>Nat Aging</source>
          <year>2024</year>
          <month>03</month>
          <day>21</day>
          <volume>4</volume>
          <issue>3</issue>
          <fpage>379</fpage>
          <lpage>95</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/38383858"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s43587-024-00573-8</pub-id>
          <pub-id pub-id-type="medline">38383858</pub-id>
          <pub-id pub-id-type="pii">10.1038/s43587-024-00573-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC10950787</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vaswani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Brain</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Shazeer</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uszkoreit</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gomez</surname>
              <given-names>AN</given-names>
            </name>
            <name name-style="western">
              <surname>Kaiser</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polosukhin</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Attention is all you need</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on June 12, 2017</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1706.03762"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>MW</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source>
          <year>2019</year>
          <conf-name>NAACL-HLT '19</conf-name>
          <conf-date>June 2-7, 2019</conf-date>
          <conf-loc>Minneapolis, MN</conf-loc>
          <fpage>4171</fpage>
          <lpage>86</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/N19-1423.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alsentzer</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Murphy</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Boag</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Jindi</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Naumann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>McDermott</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Publicly available clinical BERT embeddings</article-title>
          <source>Proceedings of the 2nd Clinical Natural Language Processing Workshop</source>
          <year>2019</year>
          <conf-name>ClinicalNLP '19</conf-name>
          <conf-date>June 7, 2019</conf-date>
          <conf-loc>Minneapolis, MN</conf-loc>
          <fpage>72</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://aclanthology.org/W19-1909.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.18653/v1/w19-1909</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <month>05</month>
          <day>24</day>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/sdata.2016.35"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Chiu</surname>
              <given-names>CY</given-names>
            </name>
            <name name-style="western">
              <surname>Sontag</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Learning low-dimensional representations of medical concepts</article-title>
          <source>AMIA Jt Summits Transl Sci Proc</source>
          <year>2016</year>
          <volume>2016</volume>
          <fpage>41</fpage>
          <lpage>50</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/27570647"/>
          </comment>
          <pub-id pub-id-type="medline">27570647</pub-id>
          <pub-id pub-id-type="pmcid">PMC5001761</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shannon</surname>
              <given-names>CE</given-names>
            </name>
          </person-group>
          <article-title>A mathematical theory of communication</article-title>
          <source>Bell Syst Tech J</source>
          <year>1948</year>
          <volume>27</volume>
          <fpage>63</fpage>
          <pub-id pub-id-type="doi">10.1002/j.1538-7305.1948.tb00917.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ebrahimi</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Pflughoeft</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Soofi</surname>
              <given-names>ES</given-names>
            </name>
          </person-group>
          <article-title>Two measures of sample entropy</article-title>
          <source>Stat Probabil Lett</source>
          <year>1994</year>
          <month>6</month>
          <volume>20</volume>
          <issue>3</issue>
          <fpage>225</fpage>
          <lpage>34</lpage>
          <pub-id pub-id-type="doi">10.1016/0167-7152(94)90046-9</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Virtanen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Gommers</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Oliphant</surname>
              <given-names>TE</given-names>
            </name>
            <name name-style="western">
              <surname>Haberland</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Reddy</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cournapeau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Burovski</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weckesser</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Bright</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>van der Walt</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Brett</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wilson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Millman</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Mayorov</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Kern</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Larson</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Carey</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Polat</surname>
              <given-names>?</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Moore</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>VanderPlas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Laxalde</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Perktold</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Cimrman</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Henriksen</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Quintero</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Harris</surname>
              <given-names>CR</given-names>
            </name>
            <name name-style="western">
              <surname>Archibald</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Ribeiro</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>van Mulbregt</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>SciPy 1.0: fundamental algorithms for scientific computing in Python</article-title>
          <source>Nat Methods</source>
          <year>2020</year>
          <month>03</month>
          <day>3</day>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>261</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/848184"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41592-019-0686-2</pub-id>
          <pub-id pub-id-type="medline">32015543</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41592-019-0686-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC7056644</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Abraham</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Eickenberg</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gervais</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mueller</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kossaifi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Machine learning for neuroimaging with scikit-learn</article-title>
          <source>Front Neuroinform</source>
          <year>2014</year>
          <volume>8</volume>
          <fpage>14</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/24600388"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fninf.2014.00014</pub-id>
          <pub-id pub-id-type="medline">24600388</pub-id>
          <pub-id pub-id-type="pmcid">PMC3930868</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Flamary</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Courty</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>POT python optimal transport library</article-title>
          <source>GitHub</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://pythonot.github.io/">https://pythonot.github.io/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Courty</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Flamary</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Tuia</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Rakotomamonjy</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Optimal Transport for Domain Adaptation</article-title>
          <source>IEEE Trans Pattern Anal Mach Intell</source>
          <year>2017</year>
          <month>9</month>
          <day>1</day>
          <volume>39</volume>
          <issue>9</issue>
          <fpage>1853</fpage>
          <lpage>65</lpage>
          <pub-id pub-id-type="doi">10.1109/tpami.2016.2615921</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Grootendorst</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>BERTopic: Neural topic modeling with a class-based TF-IDF procedure</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on March 11, 2022</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2203.05794"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Achiam</surname>
              <given-names>OJ</given-names>
            </name>
            <name name-style="western">
              <surname>Adler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ahmad</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Akkaya</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Aleman</surname>
              <given-names>FL</given-names>
            </name>
            <name name-style="western">
              <surname>Almeida</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>GPT-4 technical report</article-title>
          <source>arXiv</source>
          <comment>Preprint posted online on March 15, 2023</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/2303.08774"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Reynolds</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <person-group person-group-type="editor">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>SZ</given-names>
            </name>
            <name name-style="western">
              <surname>Jain</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Gaussian mixture models</article-title>
          <source>Encyclopedia of Biometrics</source>
          <year>2009</year>
          <publisher-loc>Cham, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
          <fpage>659</fpage>
          <lpage>63</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ester</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kriegel</surname>
              <given-names>HP</given-names>
            </name>
            <name name-style="western">
              <surname>Sander</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>A density-based algorithm for discovering clusters in large spatial databases with noise</article-title>
          <source>Proceedings of the Second International Conference on Knowledge Discovery and Data Mining</source>
          <year>1996</year>
          <conf-name>KDD '96</conf-name>
          <conf-date>August 2-4, 1996</conf-date>
          <conf-loc>Portland, OR</conf-loc>
          <fpage>226</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/3001460.3001507"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ribino</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Napoli</surname>
              <given-names>CD</given-names>
            </name>
            <name name-style="western">
              <surname>Paragliola</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Serino</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Gasparini</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Chicco</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Exploratory analysis of longitudinal data of patients with dementia through unsupervised techniques</article-title>
          <source>Proceedings of the 4th Italian Workshop on Artificial Intelligence for an Ageing Society</source>
          <year>2023</year>
          <conf-name>AIxAS '23</conf-name>
          <conf-date>November 6-9, 2023</conf-date>
          <conf-loc>Rome, Italy</conf-loc>
          <fpage>1</fpage>
          <lpage>21</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ceur-ws.org/Vol-3623/AIxAS_2023_paper_8.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Song</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Yin</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Autoencoder to identify sex-specific sub-phenotypes in Alzheimer's disease progression using longitudinal electronic health records</article-title>
          <source>medRxiv</source>
          <comment>Preprint posted online on July 11, 2024</comment>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1101/2024.07.07.24310055"/>
          </comment>
          <pub-id pub-id-type="doi">10.1101/2024.07.07.24310055</pub-id>
          <pub-id pub-id-type="medline">39040206</pub-id>
          <pub-id pub-id-type="pii">2024.07.07.24310055</pub-id>
          <pub-id pub-id-type="pmcid">PMC11261930</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yaldiz</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Prevalence of actinic keratosis in patients attending the dermatology outpatient clinic</article-title>
          <source>Medicine (Baltimore)</source>
          <year>2019</year>
          <month>07</month>
          <volume>98</volume>
          <issue>28</issue>
          <fpage>e16465</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31305480"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/MD.0000000000016465</pub-id>
          <pub-id pub-id-type="medline">31305480</pub-id>
          <pub-id pub-id-type="pii">00005792-201907120-00093</pub-id>
          <pub-id pub-id-type="pmcid">PMC6641668</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>advances in the etiology, detection, and clinical management of seborrheic keratoses</article-title>
          <source>Dermatology</source>
          <year>2022</year>
          <month>7</month>
          <day>26</day>
          <volume>238</volume>
          <issue>2</issue>
          <fpage>205</fpage>
          <lpage>17</lpage>
          <pub-id pub-id-type="doi">10.1159/000517070</pub-id>
          <pub-id pub-id-type="medline">34311463</pub-id>
          <pub-id pub-id-type="pii">000517070</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <article-title>Alzheimer's disease facts and figures</article-title>
          <source>Alzheimer's Association</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.alz.org/alzheimers-dementia/facts-figures?gad_source=1">https://www.alz.org/alzheimers-dementia/facts-figures?gad_source=1</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lim</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Fong Lim</surname>
              <given-names>YM</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Sivasampu</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Age, sex and primary care setting differences in patients' perception of community healthcare seeking behaviour towards health services</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <month>10</month>
          <day>21</day>
          <volume>14</volume>
          <issue>10</issue>
          <fpage>e0224260</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0224260"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0224260</pub-id>
          <pub-id pub-id-type="medline">31634373</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-17088</pub-id>
          <pub-id pub-id-type="pmcid">PMC6802842</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Susukida</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mojtabai</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Mendelson</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Sex differences in help seeking for mood and anxiety disorders in the national comorbidity survey-replication</article-title>
          <source>Depress Anxiety</source>
          <year>2015</year>
          <month>11</month>
          <day>22</day>
          <volume>32</volume>
          <issue>11</issue>
          <fpage>853</fpage>
          <lpage>60</lpage>
          <pub-id pub-id-type="doi">10.1002/da.22366</pub-id>
          <pub-id pub-id-type="medline">25903117</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Connelly</surname>
              <given-names>PJ</given-names>
            </name>
            <name name-style="western">
              <surname>Currie</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Delles</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Sex Differences in the prevalence, outcomes and management of hypertension</article-title>
          <source>Curr Hypertens Rep</source>
          <year>2022</year>
          <month>06</month>
          <day>07</day>
          <volume>24</volume>
          <issue>6</issue>
          <fpage>185</fpage>
          <lpage>92</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35254589"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s11906-022-01183-8</pub-id>
          <pub-id pub-id-type="medline">35254589</pub-id>
          <pub-id pub-id-type="pii">10.1007/s11906-022-01183-8</pub-id>
          <pub-id pub-id-type="pmcid">PMC9239955</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bayram</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Coughlin</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Rajmohan</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Litvan</surname>
              <given-names>I</given-names>
            </name>
          </person-group>
          <article-title>Sex differences for clinical correlates of substantia nigra neuron loss in people with Lewy body pathology</article-title>
          <source>Biol Sex Differ</source>
          <year>2024</year>
          <month>01</month>
          <day>19</day>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>8</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bsd.biomedcentral.com/articles/10.1186/s13293-024-00583-6"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s13293-024-00583-6</pub-id>
          <pub-id pub-id-type="medline">38243325</pub-id>
          <pub-id pub-id-type="pii">10.1186/s13293-024-00583-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC10797801</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bayram</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Coughlin</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Koga</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Ross</surname>
              <given-names>OA</given-names>
            </name>
            <name name-style="western">
              <surname>Litvan</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Dickson</surname>
              <given-names>DW</given-names>
            </name>
          </person-group>
          <article-title>Sex differences for regional pathology in people with a high likelihood of Lewy body dementia phenotype based on underlying pathology</article-title>
          <source>Alzheimers Dement (Amst)</source>
          <year>2025</year>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>e70083</fpage>
          <pub-id pub-id-type="doi">10.1002/dad2.70083</pub-id>
          <pub-id pub-id-type="medline">39886324</pub-id>
          <pub-id pub-id-type="pii">DAD270083</pub-id>
          <pub-id pub-id-type="pmcid">PMC11780110</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wei</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Masurkar</surname>
              <given-names>AV</given-names>
            </name>
            <name name-style="western">
              <surname>Razavian</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>On gaps of clinical diagnosis of dementia subtypes: a study of Alzheimer's disease and Lewy body disease</article-title>
          <source>Front Aging Neurosci</source>
          <year>2023</year>
          <month>3</month>
          <day>21</day>
          <volume>15</volume>
          <fpage>1149036</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37025965"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fnagi.2023.1149036</pub-id>
          <pub-id pub-id-type="medline">37025965</pub-id>
          <pub-id pub-id-type="pmcid">PMC10070837</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SE</given-names>
            </name>
          </person-group>
          <article-title>Frontotemporal dementia: clinical features and diagnosis</article-title>
          <source>UpToDate</source>
          <access-date>2024-04-29</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.uptodate.com/contents/frontotemporal-dementia-clinical-features-and-diagnosis">https://www.uptodate.com/contents/frontotemporal-dementia-clinical-features-and-diagnosis</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chapleau</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>La Joie</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Yong</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Agosta</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Allen</surname>
              <given-names>IE</given-names>
            </name>
            <name name-style="western">
              <surname>Apostolova</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Best</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Boon</surname>
              <given-names>BD</given-names>
            </name>
            <name name-style="western">
              <surname>Crutch</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Filippi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Fumagalli</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Galimberti</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Graff-Radford</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Grinberg</surname>
              <given-names>LT</given-names>
            </name>
            <name name-style="western">
              <surname>Irwin</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Josephs</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Mendez</surname>
              <given-names>MF</given-names>
            </name>
            <name name-style="western">
              <surname>Mendez</surname>
              <given-names>PC</given-names>
            </name>
            <name name-style="western">
              <surname>Migliaccio</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>ZA</given-names>
            </name>
            <name name-style="western">
              <surname>Montembeault</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Murray</surname>
              <given-names>ME</given-names>
            </name>
            <name name-style="western">
              <surname>Nemes</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pelak</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Perani</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Pijnenburg</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Rogalski</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Schott</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Seeley</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>AC</given-names>
            </name>
            <name name-style="western">
              <surname>Spina</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tanner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Walker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Whitwell</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Wolk</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Ossenkoppele</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Rabinovici</surname>
              <given-names>GD</given-names>
            </name>
          </person-group>
          <article-title>Demographic, clinical, biomarker, and neuropathological correlates of posterior cortical atrophy: an international cohort study and individual participant data meta-analysis</article-title>
          <source>Lancet Neurol</source>
          <year>2024</year>
          <month>02</month>
          <volume>23</volume>
          <issue>2</issue>
          <fpage>168</fpage>
          <lpage>77</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://air.unimi.it/handle/2434/1025736"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/S1474-4422(23)00414-3</pub-id>
          <pub-id pub-id-type="medline">38267189</pub-id>
          <pub-id pub-id-type="pii">S1474-4422(23)00414-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC11615965</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cheng</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Ho</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Weintraub</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rentz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gershon</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Dodge</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Predicting brain amyloid status using the National Institute of Health Toolbox (NIHTB) for assessment of neurological and behavioral function</article-title>
          <source>J Prev Alzheimers Dis</source>
          <year>2024</year>
          <volume>11</volume>
          <issue>4</issue>
          <fpage>943</fpage>
          <lpage>57</lpage>
          <pub-id pub-id-type="doi">10.14283/jpad.2024.77</pub-id>
          <pub-id pub-id-type="medline">39044505</pub-id>
          <pub-id pub-id-type="pmcid">PMC11269772</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Adkins-Jackson</surname>
              <given-names>PB</given-names>
            </name>
            <name name-style="western">
              <surname>Kraal</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Hill-Jarrett</surname>
              <given-names>TG</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Deters</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Besser</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Avila-Rieger</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Turney</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Manly</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Riding the merry-go-round of racial disparities in ADRD research</article-title>
          <source>Alzheimers Dement</source>
          <year>2023</year>
          <month>10</month>
          <volume>19</volume>
          <issue>10</issue>
          <fpage>4735</fpage>
          <lpage>42</lpage>
          <pub-id pub-id-type="doi">10.1002/alz.13359</pub-id>
          <pub-id pub-id-type="medline">37394968</pub-id>
          <pub-id pub-id-type="pmcid">PMC11895198</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mielke</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Aggarwal</surname>
              <given-names>NT</given-names>
            </name>
            <name name-style="western">
              <surname>Vila-Castelar</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Agarwal</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Arenaza-Urquijo</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Brett</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Brugulat-Serrat</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>DuBose</surname>
              <given-names>LE</given-names>
            </name>
            <name name-style="western">
              <surname>Eikelboom</surname>
              <given-names>WS</given-names>
            </name>
            <name name-style="western">
              <surname>Flatt</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Foldi</surname>
              <given-names>NS</given-names>
            </name>
            <name name-style="western">
              <surname>Franzen</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Gilsanz</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>McManus</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>van Lent</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Milani</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Shaaban</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Stites</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Sundermann</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Suryadevara</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Trani</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Turner</surname>
              <given-names>AD</given-names>
            </name>
            <name name-style="western">
              <surname>Vonk</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Quiroz</surname>
              <given-names>YT</given-names>
            </name>
            <name name-style="western">
              <surname>Babulal</surname>
              <given-names>GM</given-names>
            </name>
          </person-group>
          <article-title>Consideration of sex and gender in Alzheimer's disease and related disorders from a global perspective</article-title>
          <source>Alzheimer's &amp; Dementia</source>
          <year>2022</year>
          <month>12</month>
          <day>08</day>
          <volume>18</volume>
          <issue>12</issue>
          <fpage>2707</fpage>
          <lpage>24</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35394117"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/alz.12662</pub-id>
          <pub-id pub-id-type="medline">35394117</pub-id>
          <pub-id pub-id-type="pmcid">PMC9547039</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McClendon</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Zhou</surname>
              <given-names>XH</given-names>
            </name>
            <name name-style="western">
              <surname>Sachs</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lerner</surname>
              <given-names>AJ</given-names>
            </name>
          </person-group>
          <article-title>Pharmacological treatment of Alzheimer's disease: effect of race and demographic variables</article-title>
          <source>J Alzheimers Dis</source>
          <year>2010</year>
          <month>01</month>
          <day>07</day>
          <volume>19</volume>
          <issue>2</issue>
          <fpage>665</fpage>
          <lpage>72</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/20110610"/>
          </comment>
          <pub-id pub-id-type="doi">10.3233/JAD-2010-1269</pub-id>
          <pub-id pub-id-type="medline">20110610</pub-id>
          <pub-id pub-id-type="pii">P57T85623M90T72G</pub-id>
          <pub-id pub-id-type="pmcid">PMC2827609</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Steenland</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Tan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wingo</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Xiao</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Wharton</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>The effect of race and co-morbidities on Alzheimer's disease based on Medicare data</article-title>
          <source>Alzheimers Dement</source>
          <year>2023</year>
          <month>05</month>
          <volume>19</volume>
          <issue>5</issue>
          <fpage>1858</fpage>
          <lpage>64</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36327171"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/alz.12838</pub-id>
          <pub-id pub-id-type="medline">36327171</pub-id>
          <pub-id pub-id-type="pmcid">PMC10251261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Akushevich</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Kolpakov</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yashkin</surname>
              <given-names>AP</given-names>
            </name>
            <name name-style="western">
              <surname>Kravchenko</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Vulnerability to hypertension is a major determinant of racial disparities in Alzheimer's disease risk</article-title>
          <source>Am J Hypertens</source>
          <year>2022</year>
          <month>08</month>
          <day>01</day>
          <volume>35</volume>
          <issue>8</issue>
          <fpage>745</fpage>
          <lpage>51</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35581146"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/ajh/hpac063</pub-id>
          <pub-id pub-id-type="medline">35581146</pub-id>
          <pub-id pub-id-type="pii">6587183</pub-id>
          <pub-id pub-id-type="pmcid">PMC9340628</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eyre</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chapman</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Peterson</surname>
              <given-names>KS</given-names>
            </name>
            <name name-style="western">
              <surname>Shi</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Alba</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Box</surname>
              <given-names>TL</given-names>
            </name>
            <name name-style="western">
              <surname>DuVall</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
          </person-group>
          <article-title>Launching into clinical space with medspaCy: a new clinical text processing toolkit in Python</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2021</year>
          <volume>2021</volume>
          <fpage>438</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/35308962"/>
          </comment>
          <pub-id pub-id-type="medline">35308962</pub-id>
          <pub-id pub-id-type="pii">3576697</pub-id>
          <pub-id pub-id-type="pmcid">PMC8861690</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Dusenberry</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Flores</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Xue</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Dai</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Learning the graphical structure of electronic health records with graph convolutional transformer</article-title>
          <source>Proceedings of the 34th AAAI Conference on Artificial Intelligence</source>
          <year>2020</year>
          <month>04</month>
          <day>03</day>
          <conf-name>AAAI '20</conf-name>
          <conf-date>February 7-12, 2020</conf-date>
          <conf-loc>New York, NY</conf-loc>
          <fpage>606</fpage>
          <lpage>13</lpage>
          <pub-id pub-id-type="doi">10.1609/aaai.v34i01.5400</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Razavian</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Variationally regularized graph-based representation learning for electronic health records</article-title>
          <source>Proceedings of the 2021 Conference on Health, Inference, and Learning</source>
          <year>2021</year>
          <conf-name>CHIL '21</conf-name>
          <conf-date>April 8-10, 2021</conf-date>
          <conf-loc>Virtual Event</conf-loc>
          <fpage>1</fpage>
          <lpage>13</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/3450439.3451855"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3450439.3451855</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
