<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article article-type="research-article" dtd-version="2.0" xmlns:xlink="http://www.w3.org/1999/xlink">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JA</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Aging</journal-id>
      <journal-title>JMIR Aging</journal-title>
      <issn pub-type="epub">2561-7605</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i1e57926</article-id>
      <article-id pub-id-type="pmid">39316421</article-id>
      <article-id pub-id-type="doi">10.2196/57926</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Extracting Critical Information from Unstructured Clinicians’ Notes Data to Identify Dementia Severity Using a Rule-Based Approach: Feasibility Study</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Abdulai</surname>
            <given-names>Abdul Fatawu</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Matos</surname>
            <given-names>Sérgio</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chrimes</surname>
            <given-names>Dillon</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Wu</surname>
            <given-names>Wenbo</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Chi</surname>
            <given-names>Chih-Lin</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Prakash</surname>
            <given-names>Ravi</given-names>
          </name>
          <degrees>MS</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-4020-1590</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Dupre</surname>
            <given-names>Matthew E</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0976-4715</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Østbye</surname>
            <given-names>Truls</given-names>
          </name>
          <degrees>MPH, MD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff4" ref-type="aff">4</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-0662-7440</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Xu</surname>
            <given-names>Hanzhang</given-names>
          </name>
          <degrees>PhD, RN</degrees>
          <xref rid="aff4" ref-type="aff">4</xref>
          <address>
            <institution>Department of Family Medicine and Community Health</institution>
            <institution>School of Medicine</institution>
            <institution>Duke Univeristy</institution>
            <addr-line>2100 Erwin Rd</addr-line>
            <addr-line>Durham, NC, 27710</addr-line>
            <country>United States</country>
            <phone>1 9196849465</phone>
            <email>hanzhang.xu@duke.edu</email>
          </address>
          <xref rid="aff5" ref-type="aff">5</xref>
          <xref rid="aff6" ref-type="aff">6</xref>
          <xref rid="aff7" ref-type="aff">7</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9617-247X</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Thomas Lord Department of Mechanical Engineering and Materials Science</institution>
        <institution>Pratt School of Engineering</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Population Health Sciences</institution>
        <institution>School of Medicine</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Sociology</institution>
        <institution>Trinity College of Arts &amp; Sciences</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff4">
        <label>4</label>
        <institution>Department of Family Medicine and Community Health</institution>
        <institution>School of Medicine</institution>
        <institution>Duke Univeristy</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff5">
        <label>5</label>
        <institution>School of Nursing</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff6">
        <label>6</label>
        <institution>Center for the Study of Aging and Human Development</institution>
        <institution>Duke University</institution>
        <addr-line>Durham, NC</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff7">
        <label>7</label>
        <institution>Health Services and Systems Research (HSSR)</institution>
        <institution>Duke-NUS Medical School</institution>
        <addr-line>Singapore</addr-line>
        <country>Singapore</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Hanzhang Xu <email>hanzhang.xu@duke.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2024</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>24</day>
        <month>9</month>
        <year>2024</year>
      </pub-date>
      <volume>7</volume>
      <elocation-id>e57926</elocation-id>
      <history>
        <date date-type="received">
          <day>29</day>
          <month>2</month>
          <year>2024</year>
        </date>
        <date date-type="rev-request">
          <day>13</day>
          <month>5</month>
          <year>2024</year>
        </date>
        <date date-type="rev-recd">
          <day>8</day>
          <month>7</month>
          <year>2024</year>
        </date>
        <date date-type="accepted">
          <day>24</day>
          <month>7</month>
          <year>2024</year>
        </date>
      </history>
      <copyright-statement>©Ravi Prakash, Matthew E Dupre, Truls Østbye, Hanzhang Xu. Originally published in JMIR Aging (https://aging.jmir.org), 24.09.2024.</copyright-statement>
      <copyright-year>2024</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Aging, is properly cited. The complete bibliographic information, a link to the original publication on https://aging.jmir.org, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://aging.jmir.org/2024/1/e57926" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>The severity of Alzheimer disease and related dementias (ADRD) is rarely documented in structured data fields in electronic health records (EHRs). Although this information is important for clinical monitoring and decision-making, it is often undocumented or “hidden” in unstructured text fields and not readily available for clinicians to act upon.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>We aimed to assess the feasibility and potential bias in using keywords and rule-based matching for obtaining information about the severity of ADRD from EHR data.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We used EHR data from a large academic health care system that included patients with a primary discharge diagnosis of ADRD based on <italic>ICD-9</italic> (<italic>International Classification of Diseases, Ninth Revision</italic>) and <italic>ICD-10</italic> (<italic>International Statistical Classification of Diseases, Tenth Revision</italic>) codes between 2014 and 2019. We first assessed the presence of ADRD severity information and then the severity of ADRD in the EHR. Clinicians’ notes were used to determine the severity of ADRD based on two criteria: (1) scores from the Mini Mental State Examination and Montreal Cognitive Assessment and (2) explicit terms for ADRD severity (eg, “mild dementia” and “advanced Alzheimer disease”). We compiled a list of common ADRD symptoms, cognitive test names, and disease severity terms, refining it iteratively based on previous literature and clinical expertise. Subsequently, we used rule-based matching in Python using standard open-source data analysis libraries to identify the context in which specific words or phrases were mentioned. We estimated the prevalence of documented ADRD severity and assessed the performance of our rule-based algorithm.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>We included 9115 eligible patients with over 65,000 notes from the providers. Overall, 22.93% (2090/9115) of patients were documented with mild ADRD, 20.87% (1902/9115) were documented with moderate or severe ADRD, and 56.20% (5123/9115) did not have any documentation of the severity of their ADRD. For the task of determining the presence of any ADRD severity information, our algorithm achieved an accuracy of &gt;95%, specificity of &gt;95%, sensitivity of &gt;90%, and an <italic>F</italic><sub>1</sub>-score of &gt;83%. For the specific task of identifying the actual severity of ADRD, the algorithm performed well with an accuracy of &gt;91%, specificity of &gt;80%, sensitivity of &gt;88%, and <italic>F</italic><sub>1</sub>-score of &gt;92%. Comparing patients with mild ADRD to those with more advanced ADRD, the latter group tended to contain older, more likely female, and Black patients, and having received their diagnoses in primary care or in-hospital settings. Relative to patients with undocumented ADRD severity, those with documented ADRD severity had a similar distribution in terms of sex, race, and rural or urban residence.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Our study demonstrates the feasibility of using a rule-based matching algorithm to identify ADRD severity from unstructured EHR report data. However, it is essential to acknowledge potential biases arising from differences in documentation practices across various health care systems.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>electronic health record</kwd>
        <kwd>EHR</kwd>
        <kwd>electric medical record</kwd>
        <kwd>EMR</kwd>
        <kwd>patient record</kwd>
        <kwd>health record</kwd>
        <kwd>personal health record</kwd>
        <kwd>PHR</kwd>
        <kwd>unstructured data</kwd>
        <kwd>rule based analysis</kwd>
        <kwd>artificial intelligence</kwd>
        <kwd>AI</kwd>
        <kwd>large language model</kwd>
        <kwd>LLM</kwd>
        <kwd>natural language processing</kwd>
        <kwd>NLP</kwd>
        <kwd>deep learning</kwd>
        <kwd>Alzheimer's disease and related dementias</kwd>
        <kwd>AD</kwd>
        <kwd>ADRD</kwd>
        <kwd>Alzheimer's disease</kwd>
        <kwd>dementia</kwd>
        <kwd>geriatric syndromes</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <p>More than 6 million Americans aged 65 years and older are currently living with Alzheimer disease and related dementias (ADRD), constituting about 11% of the total American population aged 65 years and older [<xref ref-type="bibr" rid="ref1">1</xref>]. This number is projected to double by 2060, reaching 13.8 million individuals affected by ADRD [<xref ref-type="bibr" rid="ref1">1</xref>]. Despite the absence of a cure, timely identification of ADRD can significantly improve the quality of life of patients and better prepare their families with essential support resources [<xref ref-type="bibr" rid="ref2">2</xref>]. Early identification of ADRD will also allow health care professionals and policy makers to develop adequate care programs for both patients and their families. Furthermore, the recent US Food and Drug Administration approval for ADRD treatment, lecanemab-irmb, has demonstrated promising advancements in the pharmacological management of the disease [<xref ref-type="bibr" rid="ref3">3</xref>]. However, it is important to note that most of these treatments are only targeted at patients with mild cognitive impairment or early-stage dementia. Therefore, identifying ADRD at an early stage of the disease has become even more critical.</p>
      <p>Early identification of ADRD poses significant challenges [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>]. Even among patients with diagnosed ADRD, determining disease severity remains complex from a clinical perspective. Information regarding the presence and severity of ADRD is often limited to structured fields of electronic health records (EHRs) and is more likely to be stored within unstructured EHR sections, such as clinical reports. Moreover, wide variability exists in documentation practices and data structures across different health care systems, specialties, and even among clinicians within the same clinic [<xref ref-type="bibr" rid="ref6">6</xref>]. Over the past decade, there has been a substantial increase in leveraging information contained in the EHR to improve diagnostic precision [<xref ref-type="bibr" rid="ref7">7</xref>]. In this context, natural language processing (NLP) has emerged as a promising approach to extract relevant information from EHR data, bridging the gap between structured and unstructured clinical information.</p>
      <p>In recent years, EHR data and NLP have been used in various ways to improve ADRD care, such as identifying corelated symptoms [<xref ref-type="bibr" rid="ref8">8</xref>] and common description of cognitive impairment used by clinicians [<xref ref-type="bibr" rid="ref9">9</xref>], establishing consensus on cognitive test scores [<xref ref-type="bibr" rid="ref10">10</xref>], phenotyping of cognitive status [<xref ref-type="bibr" rid="ref11">11</xref>], and predicting the onset of cognitive decline [<xref ref-type="bibr" rid="ref12">12</xref>]. However, while structured EHR data have traditionally been used in previous research, they fall short of adequately documenting the severity of ADRD [<xref ref-type="bibr" rid="ref13">13</xref>]. To address this gap, the unstructured component of EHR becomes critical for capturing essential symptoms and severity indicators related to ADRD [<xref ref-type="bibr" rid="ref11">11</xref>]. The extent to which unstructured EHR data can be used to determine the severity of ADRD remains largely unknown.</p>
      <p>In this study, we assess the feasibility and potential bias of a rule-based matching algorithm for extracting information on ADRD severity in patients with a primary discharge diagnosis of ADRD. Specifically, we develop an algorithm that acquires cognitive test scores and identifies distinct mentions of the presence and severity of ADRD from the primary discharge diagnosis. As each health care system may encode clinical information in the EHR differently, we propose a general framework that health care systems can adopt to tailor their needs and reduce irrelevant “noise” in the EHR—any unwanted irrelevant information.</p>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Sources and Study Population</title>
        <p>This is a retrospective cohort study that used data from Duke University Health System. Due to the sensitive nature of the data, qualified researchers trained in human subject confidentiality protocols may send requests to access the data that support the findings of this study to the corresponding author.</p>
        <p>EHR data were extracted using Duke Enterprise Data Unified Content Explorer, a data extraction system based on Epic (Maestro Care) that identifies patient cohorts and provides access to clinical data stored in the organizational data warehouse [<xref ref-type="bibr" rid="ref14">14</xref>]. According to previous research, we identified patients with ADRD as those who had at least one clinical encounter at Duke University Health System with at least one principal discharge diagnosis of ADRD based on <italic>ICD-9</italic> (<italic>International Classification of Diseases, Ninth Revision</italic>) or <italic>ICD-10</italic> (<italic>International Statistical Classification of Diseases,</italic> <italic>Tenth Revision</italic>) codes [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]. The list of <italic>ICD-9/10</italic> codes was based on an established algorithm from previous literature [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref17">17</xref>]. A total of 9115 patients aged 40 years or older, diagnosed with ADRD between January 1, 2014, and December 31, 2019, were included, totaling 65,576 patient records.</p>
      </sec>
      <sec>
        <title>Data Management</title>
        <p>As most of the content present in a patient record is not directly related to the severity of ADRD, we used a keyword list that contains common ADRD terminologies to flag patient records and sections of the record that include words directly related to ADRD. The initial list was generated based on previous work [<xref ref-type="bibr" rid="ref9">9</xref>] and was further modified to include synonyms and additional keywords corresponding to <italic>ICD-9/10</italic> codes related to ADRD. An expert panel of clinicians provided input on the list through an iterative process. The final list (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) included 38 unique ADRD keywords, consisting of terminologies used by clinicians at Duke University Health System to document ADRD-related information in patient records. This step helped us extract the context in which these words and phrases were mentioned to reduce noise (ie, text not related to the severity of ADRD).</p>
      </sec>
      <sec>
        <title>NLP Algorithms</title>
        <p>Unstructured EHR data, characterized by its absence of standardized writing patterns, often manifests inconsistencies in both quality and content. This includes the presence of spelling errors, typographical inaccuracies, formatting inconsistencies, uncommon abbreviations, and other customary challenges inherent in note-taking practices [<xref ref-type="bibr" rid="ref18">18</xref>]. In response to these challenges, progress in NLP capabilities has helped to filter out important and relevant information from EHR data automatically. This can be done through a rule- or learning-based approach. Previous research has suggested that learning-based methods struggle with interpretability [<xref ref-type="bibr" rid="ref19">19</xref>] and require a considerable amount of labeled text data, which can hinder scalability. Therefore, in our study, we used a rule-based approach, allowing us to interpret our results clearly and quantify the scope of our algorithm.</p>
        <p>Specifically, our algorithm worked by sequentially narrowing down the target tokens (parts of the sentence) to extract information pertaining to ADRD textual mentions (ie, ADRD Text) and cognitive scores (ie, ADRD Cognitive Score). Then the algorithm determined the severity of ADRD based on either the direct mention of keywords pertaining to ADRD severity, or cognitive test scores. We categorized the severity of ADRD into three categories that include (1) mild, (2) moderate-to-severe (ie, advanced stage of ADRD), and (3) no severity indicated. Keywords corresponding to each severity stage are included in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. In the absence of any direct mention of the severity keywords in patient records, the severity of ADRD was defined based on cognitive test scores (Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Separate lists of keywords for the severity and cognitive scores were generated to aid the NLP algorithm. For patients whose records contained multiple severity levels from the same source (eg, all from cognitive scores), the more severe ADRD was assigned to the patient. As patients are likely to progress from mild to more advanced dementia over time, the more severe disease information was more likely to be the most updated information. In cases where there were discrepancies between the severity indicated by the explicit keywords and the cognitive scores, we defined the severity of ADRD based on the keywords, as providers may characterize the severity of the condition of the patients comprehensively based on additional assessments besides cognitive tests.</p>
        <sec>
          <title>ADRD Text</title>
          <p>We used the Python package spaCy’s pattern-matching function to identify occurrences of words listed in the ADRD keyword list (ie, trigger words). Once a word was identified, we assigned it a positional value of 0. We then extracted 5 tokens before and after the identified word (–5,5), creating a variable with 11 tokens, including the trigger word. The decision to extract this specific number of tokens was based on language constraints and observations from chart reviews, which revealed that most keywords related to the severity of ADRD appeared near the trigger words (eg, “mild dementia”). Next, we performed another pattern search using the severity keywords listed in Table S2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>, but this time only on the previously extracted 11 tokens. If a match was confirmed, we extracted the keyword defining the severity of ADRD. The extracted keyword was then assigned a severity category based on the Montreal Cognitive Assessment (MoCA) and Mini Mental State Examination (MMSE) score ranges as outlined in Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. The flowchart for this method is illustrated in <xref rid="figure1" ref-type="fig">Figure 1</xref>.</p>
          <fig id="figure1" position="float">
            <label>Figure 1</label>
            <caption>
              <p>Flowchart to determine the severity of Alzheimer disease and related dementias based on Alzheimer disease and related dementias trigger words. ADRD: Alzheimer disease and related dementias.</p>
            </caption>
            <graphic xlink:href="aging_v7i1e57926_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>ADRD Cognitive Score</title>
          <p>Based on previous literature and input from clinicians, we focused on the cognitive scores from MMSE and MoCA to define the severity of ADRD [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. These 2 cognitive tests were widely used in clinical practice with established cutoffs to determine the severity of cognitive impairment [<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref20">20</xref>]. Through chart review and consultation with clinicians, we observed the following patterns for reporting the scores in patient records. For MMSE, the scores were reported either as variations of “AB/30” or “AB”. For MoCA, the scores were reported as variations of “AB/30,” “AB,” or a special case, “score AB,” where A ∈ (0,3), B ∈ (0,9). Some exemplars are present in <xref ref-type="table" rid="table1">Table 1</xref>. For each patient record, a pattern-matching search was performed to identify occurrences of MoCA and MMSE trigger words. Once a keyword was identified, it was assigned a positional value of 0, and 10 tokens before and after the word were extracted together (–10,10) into a variable. We then used regular expression (Regex) to extract only the numerical score value from the variables with extracted tokens. The above method was used for all the cases mentioned above, with MoCA scores including a special case, due to a slight deviation in terms of extracted tokens, belonging to (0,50) as seen in <xref rid="figure2" ref-type="fig">Figure 2</xref>.</p>
          <table-wrap position="float" id="table1">
            <label>Table 1</label>
            <caption>
              <p>Examples of potential causes of misclassification and representative phrases.</p>
            </caption>
            <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
              <col width="30"/>
              <col width="230"/>
              <col width="440"/>
              <col width="300"/>
              <thead>
                <tr valign="top">
                  <td colspan="2">Category and cause of error</td>
                  <td>Sample sentence</td>
                  <td>Explanation</td>
                </tr>
              </thead>
              <tbody>
                <tr valign="top">
                  <td colspan="4">
                    <bold>ADRD<sup>a</sup> text</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Incorrect textual representation</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Patient demonstrates decreased function secondary to decreased activity tolerance; cognitive deficits; medical status limitations</p>
                      </list-item>
                      <list-item>
                        <p>[‘contrast. \r\n\r\n indication: dementia \r\n\r\n findings: \r\n no’, ‘ -- -- -- -- -- -- ’]</p>
                      </list-item>
                    </list>
                  </td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Token delimiter missing</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Lack of contextual relationship between texts</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Lost 2 points for recalling only 1 out of 3 words after 3 minutes. Her neuropsychological testing concluded that she had evidence of a “mild cognitive disorder, nos.”</p>
                      </list-item>
                      <list-item>
                        <p>Mini-cognitive total scoring 1-2 recall and normal cdt: negative for cognitive impairment</p>
                      </list-item>
                      <list-item>
                        <p>Vascular dementia with a superimposed severe delirium</p>
                      </list-item>
                    </list>
                  </td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Presence of “mild” and “cognitive” words in close vicinity</p>
                      </list-item>
                      <list-item>
                        <p>Failure to identify negative context.</p>
                      </list-item>
                      <list-item>
                        <p>Presence of “dementia” and “severe” in close vicinity.</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td colspan="4">
                    <bold>ADRD cognitive score</bold>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Particular pattern of reporting MoCA<sup>b</sup> score</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>MoCA XX/XX/20XX trails 1 cube 1 clock 2 naming 3 digit span 1 letter a 1 serial 7s 3 sentence repetition 2 fluency 1 abstraction 2 orientation 6 memory 0 education level 0 total score 23</p>
                      </list-item>
                    </list>
                  </td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Consistent pattern has been addressed in the algorithm.</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Complex score reporting format</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Montreal Cognitive Assessment by on 8/22 (scored 19/30, normal is 26-30/30)</p>
                      </list-item>
                    </list>
                  </td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Multiple scores in AB/30 format.</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
                <tr valign="top">
                  <td>
                    <break/>
                  </td>
                  <td>Human error</td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>MMSE<sup>c</sup> 36/50</p>
                      </list-item>
                    </list>
                  </td>
                  <td>
                    <list list-type="bullet">
                      <list-item>
                        <p>Out of bounds for MMSE score and spelled wrong.</p>
                      </list-item>
                    </list>
                  </td>
                </tr>
              </tbody>
            </table>
            <table-wrap-foot>
              <fn id="table1fn1">
                <p><sup>a</sup>ADRD: Alzheimer disease and related dementias.</p>
              </fn>
              <fn id="table1fn2">
                <p><sup>b</sup>MoCA: Montreal Cognitive Assessment</p>
              </fn>
              <fn id="table1fn3">
                <p><sup>c</sup>MMSE: Mini Mental State Examination.</p>
              </fn>
            </table-wrap-foot>
          </table-wrap>
          <fig id="figure2" position="float">
            <label>Figure 2</label>
            <caption>
              <p>Flowchart to determine Alzheimer disease and related dementias (ADRD) stage based on cognitive test score. EHR: electronic health record; MMSE: Mini Mental State Examination; MoCA: Montreal Cognitive Assessment.</p>
            </caption>
            <graphic xlink:href="aging_v7i1e57926_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
          </fig>
        </sec>
        <sec>
          <title>Sampling, Testing, and Analysis</title>
          <p>The rule-based algorithm was fine-tuned on a set of 200 patient records. To test the performance of the algorithm, we generated 2 additional sample files with 200 records each. The index of the first record was chosen using a random number generator to avoid bias. The annotation and validation were done at the level of each patient visit record. A certified clinician reviewed each EHR and determined the severity of ADRD. This manual annotation method served as our gold standard. All discrepancies were reviewed manually by both the data scientist and the clinician and were discussed on a case-by-case basis for resolution. <xref ref-type="table" rid="table1">Table 1</xref> was also reviewed by 2 additional team members: 1 data scientist and 1 clinical scientist. We assessed the model performance by comparing the results generated from the algorithm against the gold standard based on the following parameters: <italic>F</italic><sub>1</sub>-score (ie, the predictive power of the algorithm), accuracy (ie, correct classification), sensitivity, and specificity. In addition, we compared patient characteristics between patients with and without documented dementia severity using Mann‐Whitney U and Pearson chi‐square tests for continuous and categorical variables, respectively. Among patients with documented severity of dementia, we further compared patient characteristics between those with mild ADRD and those with moderate-to-severe ADRD.</p>
        </sec>
      </sec>
      <sec>
        <title>Ethical Considerations</title>
        <p>This study was approved by the DUHS Institutional Review Board (Pro00104990).</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p>A total of 9115 eligible patients were included in the study with over 65,000 records. The median age of the patient population was 78 (IQR 70-84) years. Approximately 60% (5547/9115) of the patients were female, 22.9% (2087/9115) were non-Hispanic Black, and about half were diagnosed by an ADRD specialist (neurologists, neuropsychiatrists, geriatricians, etc). On average, each record contained 931.15 words.</p>
      <p>Among all included patients, less than half (3992/9115, 43.8%) had documented information on the stage of their dementia in the EHR. Specifically, about 35% (3190/9115) of the records (3172/9115, 34.8%) included explicit terms that indicated dementia severity, whereas about one-third of the notes (n=2977, 32.7%) included scores from cognitive tests that indicated the severity of patients’ dementia. We found no differences between patients with and without their dementia severity documented with regard to sex (<italic>P</italic>=.45) and race (<italic>P</italic>=.31). However, patients who were older at the time of diagnosis (<italic>P</italic>=.01) and those who were diagnosed at an ADRD specialty clinic or an in-hospital setting (<italic>P</italic>&lt;.001) were more likely to have the severity of their dementia documented in the EHR.</p>
      <p>Among those with documented dementia severity, less than 25% (n=920, 23.0%) were determined only based on cognitive scores. In our data, approximately half of these patients (n=1902, 47.7%) were documented to have moderate-to-severe ADRD. Compared with patients with mild ADRD, patients with moderate-to-severe ADRD were more likely to be older.</p>
      <p><xref ref-type="table" rid="table1">Table 1</xref> shows potential causes of misclassification and representative phrases from the data sets used. Common causes of these challenges include (1) incorrect textual representation, (2) lack of contextual relationship between texts, (3) either particular or complex patterns of documenting cognitive scores, and (4) human data entry error.</p>
      <p><xref ref-type="table" rid="table2">Table 2</xref> presents the performance of our algorithm across 3 sets of data. Overall, the algorithm can identify the presence of information on ADRD severity with high levels of accuracy (<italic>F</italic><sub>1</sub>-score=0.94, accuracy=0.97, sensitivity=0.94, and specificity=0.98) for training data (set 1). The overall accuracy across the 4 matrices in the 2 testing data sets (sets 2 and 3) was greater than 0.91, except for the <italic>F</italic><sub>1</sub>-score for set 3. To evaluate the performance of identifying the severity of ADRD, we defined a binary metric with “moderate-to-severe” diagnosis being positive and “mild” being negative. The ability of the algorithm to identify ADRD severity is comparable, if not better than identifying the presence of ADRD severity (<italic>F</italic><sub>1</sub>-score=0.94, accuracy=0.96, sensitivity=0.88, and specificity=1.0) for training data (set 1). The algorithm had accuracy greater than 0.91 with sensitivity of 1.00 in 2 testing data. The specificity for the 2 testing sets was greater than 0.80.</p>
      <table-wrap position="float" id="table2">
        <label>Table 2</label>
        <caption>
          <p>Evaluation of ADRD<sup>a</sup> stage labeling algorithm for patient stage identification and severity of the diagnosis from unstructured EHR data.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="140"/>
          <col width="150"/>
          <col width="130"/>
          <col width="0"/>
          <col width="150"/>
          <col width="130"/>
          <col width="0"/>
          <col width="150"/>
          <col width="150"/>
          <thead>
            <tr valign="top">
              <td>Category</td>
              <td colspan="3">Set 1</td>
              <td colspan="3">Set 2</td>
              <td colspan="2">Set 3</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>ADRD information</td>
              <td>ADRD severity</td>
              <td colspan="2">ADRD information</td>
              <td>ADRD severity</td>
              <td colspan="2">ADRD information</td>
              <td>ADRD severity</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>TP<sup>b</sup></td>
              <td>50</td>
              <td>16</td>
              <td colspan="2">21</td>
              <td>11</td>
              <td colspan="2">26</td>
              <td>15</td>
            </tr>
            <tr valign="top">
              <td>FP<sup>c</sup></td>
              <td>3</td>
              <td>1</td>
              <td colspan="2">3</td>
              <td>2</td>
              <td colspan="2">8</td>
              <td>0</td>
            </tr>
            <tr valign="top">
              <td>FN<sup>d</sup></td>
              <td>3</td>
              <td>2</td>
              <td colspan="2">1</td>
              <td>0</td>
              <td colspan="2">3</td>
              <td>0</td>
            </tr>
            <tr valign="top">
              <td>TN<sup>e</sup></td>
              <td>144</td>
              <td>28</td>
              <td colspan="2">171</td>
              <td>8</td>
              <td colspan="2">163</td>
              <td>11</td>
            </tr>
            <tr valign="top">
              <td>Accuracy</td>
              <td>0.97</td>
              <td>0.96</td>
              <td colspan="2">0.98</td>
              <td>0.91</td>
              <td colspan="2">0.95</td>
              <td>1.0</td>
            </tr>
            <tr valign="top">
              <td>Sensitivity</td>
              <td>0.94</td>
              <td>0.88</td>
              <td colspan="2">0.95</td>
              <td>1.0</td>
              <td colspan="2">0.90</td>
              <td>1.0</td>
            </tr>
            <tr valign="top">
              <td>Specificity</td>
              <td>0.98</td>
              <td>1.0</td>
              <td colspan="2">0.98</td>
              <td>0.8</td>
              <td colspan="2">0.95</td>
              <td>1.0</td>
            </tr>
            <tr valign="top">
              <td><italic>F</italic><sub>1</sub>-score</td>
              <td>0.94</td>
              <td>0.94</td>
              <td colspan="2">0.91</td>
              <td>0.92</td>
              <td colspan="2">0.83</td>
              <td>1</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table2fn1">
            <p><sup>a</sup>ADRD: Alzheimer disease and related dementias.</p>
          </fn>
          <fn id="table2fn2">
            <p><sup>b</sup>TP: True positive.</p>
          </fn>
          <fn id="table2fn3">
            <p><sup>c</sup>FP: False positive.</p>
          </fn>
          <fn id="table2fn4">
            <p><sup>d</sup>FN: False negative.</p>
          </fn>
          <fn id="table2fn5">
            <p><sup>e</sup>TN: True negative.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>In this study, we developed and successfully implemented a rule-based algorithm to identify the severity of ADRD from unstructured EHR data. We detailed the steps to be taken for extracting the relevant information from EHR data and highlighted the challenges associated with it due to heterogeneity in textual representation. We find a lack of access to specialty facilities may impede timely diagnosis and the possibility of treatment at early stages of ADRD progression. As the severity of dementia is critical for health care providers to prescribe appropriate treatment and link resources to patients and their caregivers, our 2-pronged approach to search for relevant information presents a parsimonious yet effective way to make the disease severity information readily available across disciplines and care settings.</p>
        <p>Similar to previous research [<xref ref-type="bibr" rid="ref21">21</xref>-<xref ref-type="bibr" rid="ref24">24</xref>], we developed the algorithm using a rule-based approach. Starting with an initial list of keywords or phrases based on previous work and contextual clinical knowledge, the list is refined iteratively to identify the target information. This step is followed by sampling the reports from the data set and dividing them into training and testing sets for gold-standard comparison and evaluation. Previous research applied a rule-based approach to identify caregiver availability [<xref ref-type="bibr" rid="ref21">21</xref>], a record of mild cognitive impairment or Alzheimer disease [<xref ref-type="bibr" rid="ref22">22</xref>], documentation of cognitive tests [<xref ref-type="bibr" rid="ref23">23</xref>], and social determinants of health for patients with ADRD [<xref ref-type="bibr" rid="ref24">24</xref>]. Unlike previous work, where either the rule definition step specific to the medical system [<xref ref-type="bibr" rid="ref21">21</xref>], included <italic>ICD</italic> (<italic>International Classification of Diseases</italic>) codes [<xref ref-type="bibr" rid="ref22">22</xref>], or had additional biomarker and cognitive tests information [<xref ref-type="bibr" rid="ref23">23</xref>]. In comparison, our method shows robustness by using common occurring keywords and points toward the need for defining a minimum number of umbrella rules that have the potential to be generalizable for the entire data set and have better performance. Our developed algorithm is independent of the health care systems and provides clinicians with the flexibility to either use it without any modification or adapt it to their needs. A recent systematic review paper has suggested that rule-based NLP algorithms had similar performance compared with those using more sophisticated methods when the information is scarce in the EHR [<xref ref-type="bibr" rid="ref25">25</xref>]. In our case, information on the severity of ADRD was presented using a few words, in less than half of the data. To evaluate the performance of our algorithm, we divided the tests into two categories that are (1) identifying the “presence of information on ADRD severity” and (2) “severity of ADRD.” We found our algorithm to be highly accurate in extracting documented information on ADRD severity from the EHR. The performance on sensitivity and specificity also indicates that our algorithm was able to correctly extract stage information where present and reduce false positive results. Taken together, these results support the clinical use of our simplified and generalizable approach to identify the severity of ADRD. Furthermore, compared with previous work, our algorithm showed an improved average <italic>F</italic><sub>1</sub>-score in identifying the ADRD severity of the condition of the patient [<xref ref-type="bibr" rid="ref26">26</xref>]. The better performance of our algorithm compared with previous work could be attributed to the use of unstructured EHR data instead of structured EHR and defining clear umbrella rules by identifying recurring patterns in our data set for ADRD severity categorization.</p>
        <p>The performance of our algorithm is slightly diminished in identifying the severity of dementia from the records. Upon inspection of the wrongly labeled cases, it can be attributed to (1) the test scores not reflecting the correct severity compared with the clinician’s evaluation, (2) lack of contextual understanding of the sentence, and (3) noise in EHR note (irrelevant information), also noted in previous work [<xref ref-type="bibr" rid="ref21">21</xref>]. A majority of the abovementioned issues were mitigated by defining subrules [<xref ref-type="bibr" rid="ref27">27</xref>]. However, any further inclusion would have come at the cost of reduced performance and the need for increased clinician oversight, which limits its generalizability.</p>
        <p>Although the rule-based algorithm worked considerably well in most of the cases, it is limited by the patterns and rules defined by the developer. For cases where the token default token delimiter, in our case “space,” is changed or missing, the algorithm fails to extract information. One approach to solve this could be to have an alternative copy of the algorithm that includes other common delimiters (eg, “;” “,” “:”) to identify word tokens. In our evaluation, we only found a few outliers not following the default way of describing texts with “space” as the delimiter. The urge to include all the stray cases would lead to the hard coding of the algorithm and give rise to new challenges with considerable false positive results, making it difficult to comb through. With the development of large language models (LLMs), 1 potential solution might be to use LLM to shape the EHR data in the same format, such as converting all patient records to have equal spacing, removing random commas, etc, without changing textual content and then follow a rule-based approach as presented in this study. Our design philosophy has been to keep the algorithm general while including common patterns. One possible criticism of our study could be dichotomizing the severity of ADRD. The rationale for dichotomizing the severity of ADRD into mild versus moderate-to-severe dementia is related to clinical decision-making. Given that there are several types of ADRD, such as Alzheimer disease, vascular dementia, and Lewy body dementia, to name a few, the differential treatment and care plans are limited as a considerable number of patients have mixed dementia, and the gold standard for a definitive differential diagnosis is still based on autopsy studies. Therefore, for this study, we only focused on a dichotomized version of the severity of ADRD. Future studies should further investigate a more comprehensive classification of ADRD severity and possibly include other tests for diagnosis of ADRD outside MoCA and MMSE.</p>
        <p>Overall, we demonstrate the ability of our rule-based algorithm to identify the severity of ADRD, where present, in the EHR and narrow it down to the location of occurrence in the EHR. This not only allows us to comb through valuable unstructured data with ease, but the sequential nature of the algorithm provides us with contextual data that has a high probability of containing information about the severity of dementia. The extracted data can be used in future work to train a machine learning (ML) model with rich and high-quality data. We expect to enhance our method to further identify and predict the progression of ADRD over time. As the performance of an ML model depends on the quality of the data set, following a segmented approach of using a rule-based algorithm for extracting relevant paragraphs from the EHR can be used first to enrich the data set and reduce noise (ie, nonrelevant information from the EHR) followed by model training on the data. Previous research has found that combining structured and unstructured data might be a viable approach to classify patients. With structured data containing useful demographic information and unstructured data containing contextual, patient, and clinical notes, the path forward could be to leverage the qualities of both kinds of data [<xref ref-type="bibr" rid="ref28">28</xref>] for the use of EHR.</p>
        <p>Previous studies that used traditional ML models, such as logistic regression and support vector machine, often include only the structured EHR data due to the limited requirement for data management [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. In recent years, increasing numbers of studies have applied deep learning approaches to classify patients for a given condition [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. One of the strengths of the deep learning approach is its ability to incorporate relationships between words and a large amount of data in the analysis, which fits the need for using both structured and unstructured data together. Despite its strength, a common criticism against the implementation of deep learning approaches in clinical settings is the lack of interpretability [<xref ref-type="bibr" rid="ref19">19</xref>]. The use of an interpretable rule-based approach has enabled us to highlight potential biases and pitfalls to be considered when using black-box deep learning models. One potential solution is to use rule-based pattern matching to highlight the trigger words and related neighborhood of words for added context and classify or label the patient record using deep learning techniques [<xref ref-type="bibr" rid="ref31">31</xref>,<xref ref-type="bibr" rid="ref32">32</xref>]. With the improvements in LLMs and their enhanced contextual and semantic understanding of texts, our rule-based method can be coupled with a pretrained LLM in pre- or postprocessing of the extracted texts [<xref ref-type="bibr" rid="ref33">33</xref>]. Care must be taken while using LLMs due to the generative nature of text predictions in avoiding alteration of textual information and being limited to standardizing textual information. The proposed approach needs to be thoroughly evaluated through data privacy and model uncertainty lens before adoption.</p>
        <p>We also found that the percentage of patients with missing information on the severity of ADRD is very high. Given the added significance of such information in recent times due to newly approved treatment, it is critical in current clinical practice to improve documentation of the severity of dementia to promote high-quality care. In addition, despite the missing information, our relatively simple algorithm approach has been successful in making previously inaccessible and hard-to-find information readily available to clinicians for a large number of patients. These patients would have otherwise not had this information available to their care team without our very practical approach.</p>
        <p>Our study has a few limitations due to the algorithm of our choice and design decisions. First, as mentioned earlier, the rules have to be manually defined and fine-tuned based on a training set. This process, although simple in complexity, can be challenging as EHR can be very different based on health care systems. As the rules are manually defined, it has room for human error. On the other hand, this approach gives the researchers the flexibility to adapt the algorithm structure easily to their health care systems and needs to be fine-tuned. Second, rule-based algorithm matching studies are limited by a lack of contextual understanding between text groups and fail to recognize connotations in sentences. For example, the presence of a negative test result may confuse the algorithm pattern identification process unless explicitly included in the algorithm definition. Third, our approach has been able to only include rules for patterns that are common throughout the data set, such as for the ADRD Cognitive Score function, we include every score defined in the format of AB/30, AB, and a special type of definition as mentioned before. Therefore, we might have missed out on some of the cases straying away from the common patterns. For our instance, attempts to include every unique case led to the results being very irrelevant as it started capturing a lot of unimportant information and the algorithm became very rigid. Fourth, the study determines dementia severity based on cognitive test scores and trigger words for ADRD and does not include medical prescriptions being used by the patient which can be a future direction to make our approach holistic.</p>
        <p>Finally, even though we have attempted to keep our method generalizable, the data were extracted from 1 health care system, and the developed rules may not directly apply to data from other health care systems. We have described in detail the steps taken in designing the algorithm with the aim of serving as a baseline approach for research in identifying ADRD severity from unstructured EHR data. The algorithm does the job well for the criteria chosen, and the choice of criteria to include can be a decision of the study designer.</p>
      </sec>
      <sec>
        <title>Conclusion</title>
        <p>Rule-based algorithms can provide an interpretable approach to process unstructured EHR data. This study demonstrates the value of unstructured EHR data in providing critical information about ADRD severity from patient records. Pattern-matching rule-based algorithms can be tuned and adapted to health care systems and study-specific needs. The proposed algorithm can serve as a baseline or initial point to shift through pages of EHR reports to identify the most relevant sections or regions. However, it is important to clearly identify the assumptions made, and their limitations while defining the rules. Differences in documentation may also introduce bias in the algorithm as it is fine-tuned. Overall, rule-based algorithms are powerful in handling unstructured EHR data while being transparent and interpretable.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group>
      <supplementary-material id="app1">
        <label>Multimedia Appendix 1</label>
        <p>Description of the electronic health record data set.</p>
        <media xlink:href="aging_v7i1e57926_app1.doc" xlink:title="DOC File , 133 KB"/>
      </supplementary-material>
    </app-group>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ADRD</term>
          <def>
            <p>Alzheimer disease and related dementias</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">EHR</term>
          <def>
            <p>electronic health record</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">
            <italic>ICD</italic>
          </term>
          <def>
            <p>
              <italic>International Classification of Diseases</italic>
            </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">
            <italic>ICD-9</italic>
          </term>
          <def>
            <p>
              <italic>International Classification of Diseases, Ninth Revision</italic>
            </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">
            <italic>ICD-10</italic>
          </term>
          <def>
            <p>
              <italic>International Statistical Classification of Diseases, Tenth Revision</italic>
            </p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">LLM</term>
          <def>
            <p>large language model</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb8">MMSE</term>
          <def>
            <p>Mini Mental State Examination</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb9">MoCA</term>
          <def>
            <p>Montreal Cognitive Assessment</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb10">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>We would like to thank Dr Xiao Hu for their feedback during the initial phase of the study. A part of our work was presented at Alzheimer’s Association International Conference 2023 by the authors.</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>NA</collab>
          </person-group>
          <article-title>2021 Alzheimer's disease facts and figures</article-title>
          <source>Alzheimers Dement</source>
          <year>2021</year>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>327</fpage>
          <lpage>406</lpage>
          <pub-id pub-id-type="doi">10.1002/alz.12328</pub-id>
          <pub-id pub-id-type="medline">33756057</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <collab>PAD 20/20 Work Group on Community-Based Detection of Cognitive Decline Dementia</collab>
          </person-group>
          <article-title>Improving community health-care systems' early detection of cognitive decline and dementia</article-title>
          <source>Alzheimers Dement</source>
          <year>2022</year>
          <volume>18</volume>
          <issue>11</issue>
          <fpage>2375</fpage>
          <lpage>2381</lpage>
          <pub-id pub-id-type="doi">10.1002/alz.12837</pub-id>
          <pub-id pub-id-type="medline">36314503</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>US Food and Drug Administration</collab>
          </person-group>
          <source>FDA converts novel Alzheimer’s disease treatment to traditional approval</source>
          <access-date>2024-08-06</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fda.gov/news-events/press-announcements/fda-converts-novel-alzheimers-disease-treatment-traditional-approval">https://www.fda.gov/news-events/press-announcements/fda-converts-novel-alzheimers-disease-treatment-traditional-approval</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ford</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>HE</given-names>
            </name>
            <name name-style="western">
              <surname>Scott</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Cassell</surname>
              <given-names>JA</given-names>
            </name>
          </person-group>
          <article-title>Extracting information from the text of electronic medical records to improve case detection: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2016</year>
          <volume>23</volume>
          <issue>5</issue>
          <fpage>1007</fpage>
          <lpage>1015</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/26911811"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocv180</pub-id>
          <pub-id pub-id-type="medline">26911811</pub-id>
          <pub-id pub-id-type="pii">ocv180</pub-id>
          <pub-id pub-id-type="pmcid">PMC4997034</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McCoy</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Pellegrini</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Tanzi</surname>
              <given-names>RE</given-names>
            </name>
            <name name-style="western">
              <surname>Berretta</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Perlis</surname>
              <given-names>RH</given-names>
            </name>
          </person-group>
          <article-title>Stratifying risk for dementia onset using large-scale electronic health record data: a retrospective cohort study</article-title>
          <source>Alzheimers Dement</source>
          <year>2020</year>
          <volume>16</volume>
          <issue>3</issue>
          <fpage>531</fpage>
          <lpage>540</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/31859230"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jalz.2019.09.084</pub-id>
          <pub-id pub-id-type="medline">31859230</pub-id>
          <pub-id pub-id-type="pii">S1552-5260(19)35484-6</pub-id>
          <pub-id pub-id-type="pmcid">PMC7067642</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Roy</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Stewart</surname>
              <given-names>WF</given-names>
            </name>
          </person-group>
          <article-title>Prediction modeling using EHR data: challenges, strategies, and a comparison of machine learning approaches</article-title>
          <source>Med Care</source>
          <year>2010</year>
          <volume>48</volume>
          <issue>6 Suppl</issue>
          <fpage>S106</fpage>
          <lpage>S113</lpage>
          <pub-id pub-id-type="doi">10.1097/MLR.0b013e3181de9e17</pub-id>
          <pub-id pub-id-type="medline">20473190</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Pollard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Shen</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lehman</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Feng</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ghassemi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Szolovits</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Celi</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Mark</surname>
              <given-names>RG</given-names>
            </name>
          </person-group>
          <article-title>MIMIC-III, a freely accessible critical care database</article-title>
          <source>Sci Data</source>
          <year>2016</year>
          <volume>3</volume>
          <fpage>160035</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/sdata.2016.35"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/sdata.2016.35</pub-id>
          <pub-id pub-id-type="medline">27219127</pub-id>
          <pub-id pub-id-type="pii">sdata201635</pub-id>
          <pub-id pub-id-type="pmcid">PMC4878278</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Anzaldi</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Leff</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kharrazi</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Comparing clinician descriptions of frailty and geriatric syndromes using electronic health records: a retrospective cohort study</article-title>
          <source>BMC Geriatr</source>
          <year>2017</year>
          <volume>17</volume>
          <issue>1</issue>
          <fpage>248</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcgeriatr.biomedcentral.com/articles/10.1186/s12877-017-0645-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12877-017-0645-7</pub-id>
          <pub-id pub-id-type="medline">29070036</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12877-017-0645-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5657074</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gilmore-Bykovskyi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Block</surname>
              <given-names>L M</given-names>
            </name>
            <name name-style="western">
              <surname>Walljasper</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Gleason</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>MN</given-names>
            </name>
          </person-group>
          <article-title>Unstructured clinical documentation reflecting cognitive and behavioral dysfunction: toward an EHR-based phenotype for cognitive impairment</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2018</year>
          <volume>25</volume>
          <issue>9</issue>
          <fpage>1206</fpage>
          <lpage>1212</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29947805"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocy070</pub-id>
          <pub-id pub-id-type="medline">29947805</pub-id>
          <pub-id pub-id-type="pii">5045461</pub-id>
          <pub-id pub-id-type="pmcid">PMC6118865</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Harding</surname>
              <given-names>BN</given-names>
            </name>
            <name name-style="western">
              <surname>Floyd</surname>
              <given-names>JS</given-names>
            </name>
            <name name-style="western">
              <surname>Scherrer</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Salas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Morley</surname>
              <given-names>JE</given-names>
            </name>
            <name name-style="western">
              <surname>Farr</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Dublin</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Methods to identify dementia in the electronic health record: comparing cognitive test scores with dementia algorithms</article-title>
          <source>Healthc (Amst)</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>2</issue>
          <fpage>100430</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/32553526"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.hjdsi.2020.100430</pub-id>
          <pub-id pub-id-type="medline">32553526</pub-id>
          <pub-id pub-id-type="pii">S2213-0764(20)30029-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC7363308</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kharrazi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Anzaldi</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Davison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Boyd</surname>
              <given-names>CM</given-names>
            </name>
            <name name-style="western">
              <surname>Leff</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Kimura</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>JP</given-names>
            </name>
          </person-group>
          <article-title>The value of unstructured electronic health record data in geriatric syndrome case identification</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2018</year>
          <volume>66</volume>
          <issue>8</issue>
          <fpage>1499</fpage>
          <lpage>1507</lpage>
          <pub-id pub-id-type="doi">10.1111/jgs.15411</pub-id>
          <pub-id pub-id-type="medline">29972595</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hane</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Nori</surname>
              <given-names>VS</given-names>
            </name>
            <name name-style="western">
              <surname>Crown</surname>
              <given-names>WH</given-names>
            </name>
            <name name-style="western">
              <surname>Sanghavi</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Bleicher</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Predicting onset of dementia using clinical notes and machine learning: case-control study</article-title>
          <source>JMIR Med Inform</source>
          <year>2020</year>
          <volume>8</volume>
          <issue>6</issue>
          <fpage>e17819</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://medinform.jmir.org/2020/6/e17819/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/17819</pub-id>
          <pub-id pub-id-type="medline">32490841</pub-id>
          <pub-id pub-id-type="pii">v8i6e17819</pub-id>
          <pub-id pub-id-type="pmcid">PMC7301255</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ferrão</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Janela</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Oliveira</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Martins</surname>
              <given-names>HMG</given-names>
            </name>
          </person-group>
          <article-title>Using structured EHR data and SVM to support ICD-9-CM coding</article-title>
          <year>2013</year>
          <conf-name>2013 IEEE International Conference on Healthcare Informatics</conf-name>
          <conf-date>2013 September 09-11</conf-date>
          <conf-loc>Philadelphia, PA</conf-loc>
          <fpage>511</fpage>
          <lpage>516</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Horvath</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Winfield</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Evans</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Slopek</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ferranti</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The DEDUCE guided query tool: providing simplified access to clinical data for research and quality improvement</article-title>
          <source>J Biomed Inform</source>
          <year>2011</year>
          <volume>44</volume>
          <issue>2</issue>
          <fpage>266</fpage>
          <lpage>276</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S1532-0464(10)00174-7"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.jbi.2010.11.008</pub-id>
          <pub-id pub-id-type="medline">21130181</pub-id>
          <pub-id pub-id-type="pii">S1532-0464(10)00174-7</pub-id>
          <pub-id pub-id-type="pmcid">PMC3063322</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>QT</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Shutes-David</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Thielke</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Tsuang</surname>
              <given-names>DW</given-names>
            </name>
          </person-group>
          <article-title>Detection of probable dementia cases in undiagnosed patients using structured and unstructured electronic health records</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2019</year>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>128</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-019-0846-4"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-019-0846-4</pub-id>
          <pub-id pub-id-type="medline">31288818</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-019-0846-4</pub-id>
          <pub-id pub-id-type="pmcid">PMC6617952</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Halpern</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Seare</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Tong</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Hartry</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Olaoye</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aigbogun</surname>
              <given-names>MS</given-names>
            </name>
          </person-group>
          <article-title>Using electronic health records to estimate the prevalence of agitation in Alzheimer disease/dementia</article-title>
          <source>Int J Geriatr Psychiatry</source>
          <year>2019</year>
          <volume>34</volume>
          <issue>3</issue>
          <fpage>420</fpage>
          <lpage>431</lpage>
          <pub-id pub-id-type="doi">10.1002/gps.5030</pub-id>
          <pub-id pub-id-type="medline">30430642</pub-id>
          <pub-id pub-id-type="pmcid">PMC7379654</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Fillenbaum</surname>
              <given-names>GG</given-names>
            </name>
            <name name-style="western">
              <surname>Ezell</surname>
              <given-names>ME</given-names>
            </name>
          </person-group>
          <article-title>The accuracy of medicare claims data in identifying Alzheimer's disease</article-title>
          <source>J Clin Epidemiol</source>
          <year>2002</year>
          <volume>55</volume>
          <issue>9</issue>
          <fpage>929</fpage>
          <lpage>937</lpage>
          <pub-id pub-id-type="doi">10.1016/s0895-4356(02)00452-3</pub-id>
          <pub-id pub-id-type="medline">12393082</pub-id>
          <pub-id pub-id-type="pii">S0895435602004523</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tayefi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ngo</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Chomutare</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Dalianis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Salvi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Budrionis</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Godtliebsen</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Challenges and opportunities beyond structured data in analysis of electronic health records</article-title>
          <source>WIREs Computational Stats</source>
          <year>2021</year>
          <month>02</month>
          <day>14</day>
          <volume>13</volume>
          <issue>6</issue>
          <fpage>e1549</fpage>
          <pub-id pub-id-type="doi">10.1002/wics.1549</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Seinen</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Fridgeirsson</surname>
              <given-names>EA</given-names>
            </name>
            <name name-style="western">
              <surname>Ioannou</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jeannetot</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>John</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Kors</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Markus</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>Pera</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Rekkas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>van Mulligen</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Rijnbeek</surname>
              <given-names>PR</given-names>
            </name>
          </person-group>
          <article-title>Use of unstructured text in prognostic clinical prediction models: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2022</year>
          <volume>29</volume>
          <issue>7</issue>
          <fpage>1292</fpage>
          <lpage>1302</lpage>
          <pub-id pub-id-type="doi">10.1093/jamia/ocac058</pub-id>
          <pub-id pub-id-type="medline">35475536</pub-id>
          <pub-id pub-id-type="pii">6574714</pub-id>
          <pub-id pub-id-type="pmcid">PMC9196702</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nasreddine</surname>
              <given-names>ZS</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Bédirian</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Charbonneau</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Whitehead</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Collin</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Cummings</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Chertkow</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>The Montreal Cognitive Assessment, MoCA: a brief screening tool for mild cognitive impairment</article-title>
          <source>J Am Geriatr Soc</source>
          <year>2005</year>
          <volume>53</volume>
          <issue>4</issue>
          <fpage>695</fpage>
          <lpage>699</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1532-5415.2005.53221.x</pub-id>
          <pub-id pub-id-type="medline">15817019</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mahmoudi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Najarian</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Aikens</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Bynum</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vydiswaran</surname>
              <given-names>VGV</given-names>
            </name>
          </person-group>
          <article-title>Identifying caregiver availability using medical notes with rule-based natural language processing: retrospective cohort study</article-title>
          <source>JMIR Aging</source>
          <year>2022</year>
          <volume>5</volume>
          <issue>3</issue>
          <fpage>e40241</fpage>
          <pub-id pub-id-type="doi">10.2196/40241</pub-id>
          <pub-id pub-id-type="medline">35998328</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Aguilar</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Miller</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Jasuja</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Shishova</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Morin</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Berlowitz</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Monfared</surname>
              <given-names>AAT</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Xia</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>Rule-based identification of individuals with mild cognitive impairment or Alzheimer's disease using clinical notes from the United States veterans affairs healthcare system</article-title>
          <source>Neurol Ther</source>
          <year>2023</year>
          <volume>12</volume>
          <issue>6</issue>
          <fpage>2067</fpage>
          <lpage>2078</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37747662"/>
          </comment>
          <pub-id pub-id-type="doi">10.1007/s40120-023-00540-2</pub-id>
          <pub-id pub-id-type="medline">37747662</pub-id>
          <pub-id pub-id-type="pii">10.1007/s40120-023-00540-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC10630261</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>He</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Prosperi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>DeKosky</surname>
              <given-names>ST</given-names>
            </name>
            <name name-style="western">
              <surname>Farrer</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Guo</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Assess the documentation of cognitive tests and biomarkers in electronic health records via natural language processing for Alzheimer's disease and related dementias</article-title>
          <source>Int J Med Inform</source>
          <year>2023</year>
          <volume>170</volume>
          <fpage>104973</fpage>
          <pub-id pub-id-type="doi">10.1016/j.ijmedinf.2022.104973</pub-id>
          <pub-id pub-id-type="medline">36577203</pub-id>
          <pub-id pub-id-type="pii">S1386-5056(22)00287-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Holkeboer</surname>
              <given-names>KJ</given-names>
            </name>
            <name name-style="western">
              <surname>Kolawole</surname>
              <given-names>TO</given-names>
            </name>
            <name name-style="western">
              <surname>Carbone</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Mahmoudi</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Natural language processing to identify social determinants of health in Alzheimer's disease and related dementia from electronic health records</article-title>
          <source>Health Serv Res</source>
          <year>2023</year>
          <volume>58</volume>
          <issue>6</issue>
          <fpage>1292</fpage>
          <lpage>1302</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/37534741"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/1475-6773.14210</pub-id>
          <pub-id pub-id-type="medline">37534741</pub-id>
          <pub-id pub-id-type="pmcid">PMC10622277</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Patra</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Sharma</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Vekaria</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Adekkanattu</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Patterson</surname>
              <given-names>OV</given-names>
            </name>
            <name name-style="western">
              <surname>Glicksberg</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Lepow</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Ryu</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Biernacka</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Furmanchuk</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>George</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Hogan</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Bian</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Weissman</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wickramaratne</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mann</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Olfson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Campion</surname>
              <given-names>TR</given-names>
            </name>
            <name name-style="western">
              <surname>Weiner</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pathak</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Extracting social determinants of health from electronic health records using natural language processing: a systematic review</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2021</year>
          <volume>28</volume>
          <issue>12</issue>
          <fpage>2716</fpage>
          <lpage>2727</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/34613399"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocab170</pub-id>
          <pub-id pub-id-type="medline">34613399</pub-id>
          <pub-id pub-id-type="pii">6382241</pub-id>
          <pub-id pub-id-type="pmcid">PMC8633615</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vyas</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Aisopos</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Vidal</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Garrard</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Paliouras</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Calibrating Mini-Mental State Examination scores to predict misdiagnosed dementia patients</article-title>
          <source>Applied Sciences</source>
          <year>2021</year>
          <volume>11</volume>
          <issue>17</issue>
          <fpage>8055</fpage>
          <pub-id pub-id-type="doi">10.3390/app11178055</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Oh</surname>
              <given-names>IY</given-names>
            </name>
            <name name-style="western">
              <surname>Schindler</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Ghoshal</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lai</surname>
              <given-names>AM</given-names>
            </name>
            <name name-style="western">
              <surname>Payne</surname>
              <given-names>PRO</given-names>
            </name>
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Extraction of clinical phenotypes for Alzheimer's disease dementia from clinical notes using natural language processing</article-title>
          <source>JAMIA Open</source>
          <year>2023</year>
          <volume>6</volume>
          <issue>1</issue>
          <fpage>ooad014</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/36844369"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamiaopen/ooad014</pub-id>
          <pub-id pub-id-type="medline">36844369</pub-id>
          <pub-id pub-id-type="pii">ooad014</pub-id>
          <pub-id pub-id-type="pmcid">PMC9952043</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bayramli</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Castro</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Barak-Corren</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Madsen</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Nock</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Smoller</surname>
              <given-names>JW</given-names>
            </name>
            <name name-style="western">
              <surname>Reis</surname>
              <given-names>BY</given-names>
            </name>
          </person-group>
          <article-title>Predictive structured-unstructured interactions in EHR models: a case study of suicide prediction</article-title>
          <source>NPJ Digit Med</source>
          <year>2022</year>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>15</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-022-00558-0"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-022-00558-0</pub-id>
          <pub-id pub-id-type="medline">35087182</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41746-022-00558-0</pub-id>
          <pub-id pub-id-type="pmcid">PMC8795240</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gandhi</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Shao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Han</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Chandrasekaran</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Turzhitsky</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Bali</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>AR</given-names>
            </name>
            <name name-style="western">
              <surname>Metzger</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>La Rosa</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Weaver</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dexter</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Huang</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>Applying interpretable deep learning models to identify chronic cough patients using EHR data</article-title>
          <source>Comput Methods Programs Biomed</source>
          <year>2021</year>
          <volume>210</volume>
          <fpage>106395</fpage>
          <pub-id pub-id-type="doi">10.1016/j.cmpb.2021.106395</pub-id>
          <pub-id pub-id-type="medline">34525412</pub-id>
          <pub-id pub-id-type="pii">S0169-2607(21)00469-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magdamo</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>ZM</given-names>
            </name>
            <name name-style="western">
              <surname>Noori</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sheu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Deodhar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brenner</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Robbins</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Mukerji</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zafar</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Benson</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Moura</surname>
              <given-names>LMV</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Hyman</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano‐Pozo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Westover</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Blacker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Active deep learning to detect cognitive concerns in electronic health records</article-title>
          <source>Alzheimer's &amp; Dementia</source>
          <year>2021</year>
          <volume>17</volume>
          <issue>S11</issue>
          <pub-id pub-id-type="doi">10.1002/alz.055362</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Magdamo</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Hong</surname>
              <given-names>ZM</given-names>
            </name>
            <name name-style="western">
              <surname>Noori</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sheu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Deodhar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Sun</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Brenner</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Robbins</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Mukerji</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Zafar</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Benson</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Moura</surname>
              <given-names>LMV</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Arnold</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Hyman</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano‐Pozo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Westover</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Blacker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Active deep learning to detect cognitive concerns in electronic health records</article-title>
          <source>Alzheimers  Dement</source>
          <year>2021</year>
          <volume>17</volume>
          <issue>S11</issue>
          <fpage>e055362</fpage>
          <pub-id pub-id-type="doi">10.1002/alz.055362</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Noori</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Magdamo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Tyagi</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Kondepudi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Alabsi</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Rudmann</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Wilcox</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brenner</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Robbins</surname>
              <given-names>GK</given-names>
            </name>
            <name name-style="western">
              <surname>Moura</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Zafar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Benson</surname>
              <given-names>NM</given-names>
            </name>
            <name name-style="western">
              <surname>Hsu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>R Dickson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Serrano-Pozo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hyman</surname>
              <given-names>BT</given-names>
            </name>
            <name name-style="western">
              <surname>Blacker</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Westover</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Mukerji</surname>
              <given-names>SS</given-names>
            </name>
            <name name-style="western">
              <surname>Das</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Development and evaluation of a natural language processing annotation tool to facilitate phenotyping of cognitive status in electronic health records: diagnostic study</article-title>
          <source>J Med Internet Res</source>
          <year>2022</year>
          <volume>24</volume>
          <issue>8</issue>
          <fpage>e40384</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2022/8/e40384/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/40384</pub-id>
          <pub-id pub-id-type="medline">36040790</pub-id>
          <pub-id pub-id-type="pii">v24i8e40384</pub-id>
          <pub-id pub-id-type="pmcid">PMC9472045</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goel</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gueta</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gilon</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Erell</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Hao</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Jaber</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Reddy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kartha</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Steiner</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Laish</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Feder</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>LLMs Accelerate Annotation for Medical Information Extraction</article-title>
          <source>LLMs accelerate annotation for medical information extraction</source>
          <year>2023</year>
          <conf-name>Machine Learning for Health (ML4H)</conf-name>
          <conf-date>10th December, 2023</conf-date>
          <conf-loc>New Orleans, United States</conf-loc>
          <publisher-name>Proceedings of Machine Learning Research</publisher-name>
          <fpage>82</fpage>
          <lpage>100</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://proceedings.mlr.press/v225/goel23a/goel23a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
